Skip to content

Commit 8c63a03

Browse files
authored
fix math routing
Signed-off-by: GitHub <[email protected]>
1 parent 137d03f commit 8c63a03

File tree

2 files changed

+2
-22
lines changed

2 files changed

+2
-22
lines changed

e2e/profiles/llm-d/manifests/httproute-services.yaml

Lines changed: 0 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -1,26 +1,5 @@
11
apiVersion: gateway.networking.k8s.io/v1
22
kind: HTTPRoute
3-
metadata:
4-
name: vsr-default-svc
5-
namespace: default
6-
spec:
7-
parentRefs:
8-
- group: gateway.networking.k8s.io
9-
kind: Gateway
10-
name: inference-gateway
11-
rules:
12-
- backendRefs:
13-
- name: vllm-llama3-8b-instruct
14-
port: 8000
15-
matches:
16-
- path:
17-
type: PathPrefix
18-
value: /
19-
timeouts:
20-
request: 300s
21-
---
22-
apiVersion: gateway.networking.k8s.io/v1
23-
kind: HTTPRoute
243
metadata:
254
name: vsr-llama8b-svc
265
namespace: default

e2e/profiles/llm-d/values.yaml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,4 @@
1+
# Profile revision 2025-11-21: math -> phi4-mini; cs/default -> llama3-8b; removed global HTTPRoute catch-all.
12
config:
23
# Allow Envoy to re-run route matching after Semantic Router sets x-selected-model.
34
# Without this, Gateway API routes that depend on that header are never selected, and requests return 404.
@@ -30,7 +31,7 @@ config:
3031
- type: domain
3132
name: math
3233
modelRefs:
33-
- model: llama3-8b
34+
- model: phi4-mini
3435
use_reasoning: false
3536
- name: cs_route
3637
priority: 10

0 commit comments

Comments
 (0)