459
459
"router" : {
460
460
"scheduler" : {},
461
461
},
462
- }
462
+ },
463
+ "router-with-gateway-ref" : {
464
+ "router" : {
465
+ "gateway" : {
466
+ "refs" : [
467
+ {"name" : "router-gateway-1" , "namespace" : KSERVE_TEST_NAMESPACE },
468
+ ],
469
+ },
470
+ },
471
+ },
472
+ "router-with-managed-route" : {
473
+ "router" : {
474
+ "route" : {}
475
+ },
476
+ },
477
+ "workload-llmd-simulator" : {
478
+ "replicas" : 1 ,
479
+ "model" : {"uri" : "hf://facebook/opt-125m" , "name" : "facebook/opt-125m" },
480
+ "template" : {
481
+ "containers" : [
482
+ {
483
+ "name" : "main" ,
484
+ "image" : "ghcr.io/llm-d/llm-d-inference-sim:v0.5.1" ,
485
+ "command" : ["/app/llm-d-inference-sim" ],
486
+ "args" : [
487
+ "--port" ,
488
+ "8000" ,
489
+ "--model" ,
490
+ "{{ .Spec.Model.Name }}" ,
491
+ "--mode" ,
492
+ "random" ,
493
+ "--ssl-certfile" ,
494
+ "/etc/ssl/certs/tls.crt" ,
495
+ "--ssl-keyfile" ,
496
+ "/etc/ssl/certs/tls.key"
497
+ ],
498
+ "resources" : {
499
+ "limits" : {"cpu" : "1" , "memory" : "2Gi" },
500
+ "requests" : {"cpu" : "1" , "memory" : "2Gi" },
501
+ },
502
+ }
503
+ ]
504
+ },
505
+ },
463
506
}
464
507
465
508
@@ -574,7 +617,7 @@ def _get_model_name_from_configs(config_names):
574
617
config = LLMINFERENCESERVICE_CONFIGS [config_name ]
575
618
if "model" in config and "name" in config ["model" ]:
576
619
return config ["model" ]["name" ]
577
- return "default- model"
620
+ return "default/ model"
578
621
579
622
580
623
def generate_k8s_safe_suffix (base_name : str , extra_parts : List [str ] = None ) -> str :
@@ -608,7 +651,7 @@ def generate_test_id(test_case) -> str:
608
651
return "-" .join (test_case .base_refs )
609
652
610
653
611
- def create_router_resources (gateways , routes , kserve_client = None ):
654
+ def create_router_resources (gateways , routes = None , kserve_client = None ):
612
655
if not kserve_client :
613
656
kserve_client = KServeClient (config_file = os .environ .get ("KUBECONFIG" , "~/.kube/config" ))
614
657
@@ -619,7 +662,7 @@ def create_router_resources(gateways, routes, kserve_client=None):
619
662
for gateway in gateways :
620
663
create_or_update_gateway (kserve_client , gateway )
621
664
gateways_created .append (gateway )
622
- for route in routes :
665
+ for route in routes or [] :
623
666
create_or_update_route (kserve_client , route )
624
667
routes_created .append (route )
625
668
except Exception as e :
@@ -628,11 +671,11 @@ def create_router_resources(gateways, routes, kserve_client=None):
628
671
raise
629
672
630
673
631
- def delete_router_resources (gateways , routes , kserve_client = None ):
674
+ def delete_router_resources (gateways , routes = None , kserve_client = None ):
632
675
if not kserve_client :
633
676
kserve_client = KServeClient (config_file = os .environ .get ("KUBECONFIG" , "~/.kube/config" ))
634
677
635
- for route in routes :
678
+ for route in routes or [] :
636
679
try :
637
680
logger .info (f"Cleaning up HttpRoute { route .get ('metadata' , {}).get ('name' )} " )
638
681
delete_route (kserve_client , route .get ("metadata" , {}).get ("name" ), route .get ("metadata" , {}).get ("namespace" , "default" ))
0 commit comments