File tree Expand file tree Collapse file tree 2 files changed +2
-22
lines changed
Expand file tree Collapse file tree 2 files changed +2
-22
lines changed
Original file line number | Diff line number | Diff line change
 1 |  1 |   apiVersion: gateway.networking.k8s.io/v1
 2 |  2 |   kind: HTTPRoute
 3 |    | - metadata:
 4 |    | -   name: vsr-default-svc
 5 |    | -   namespace: default
 6 |    | - spec:
 7 |    | -   parentRefs:
 8 |    | -     - group: gateway.networking.k8s.io
 9 |    | -       kind: Gateway
10 |    | -       name: inference-gateway
11 |    | -   rules:
12 |    | -     - backendRefs:
13 |    | -         - name: vllm-llama3-8b-instruct
14 |    | -           port: 8000
15 |    | -       matches:
16 |    | -         - path:
17 |    | -             type: PathPrefix
18 |    | -             value: /
19 |    | -       timeouts:
20 |    | -         request: 300s
21 |    | - ---
22 |    | - apiVersion: gateway.networking.k8s.io/v1
23 |    | - kind: HTTPRoute
24 |  3 |   metadata:
25 |  4 |     name: vsr-llama8b-svc
26 |  5 |     namespace: default
Original file line number | Diff line number | Diff line change
   |  1 | + # Profile revision 2025-11-21: math -> phi4-mini; cs/default -> llama3-8b; removed global HTTPRoute catch-all.
 1 |  2 |   config:
 2 |  3 |    # Allow Envoy to re-run route matching after Semantic Router sets x-selected-model.
 3 |  4 |    # Without this, Gateway API routes that depend on that header won't be chosen and return 404.
@@ -30,7 +31,7 @@ config:
30 | 31 |    - type: domain
31 | 32 |    name: math
32 | 33 |    modelRefs:
33 |    | -  - model: llama3-8b
   | 34 | +  - model: phi4-mini
34 | 35 |    use_reasoning: false
35 | 36 |    - name: cs_route
36 | 37 |    priority: 10
You can’t perform that action at this time.
0 commit comments