Skip to content

Commit f900752

Browse files
authored
Merge branch 'main' into fix_quickstart_script
2 parents e1b0851 + 75523aa commit f900752

File tree

2 files changed

+16
-4
lines changed

2 files changed

+16
-4
lines changed

.github/workflows/k8s-kind-integration-test.yml

Lines changed: 15 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -186,6 +186,17 @@ jobs:
186186
- op: replace
187187
path: /spec/template/spec/containers/0/resources/limits/cpu
188188
value: "1"
189+
- op: replace
190+
path: /spec/template/spec/containers/0/readinessProbe
191+
value:
192+
httpGet:
193+
path: /health
194+
port: classify-api
195+
scheme: HTTP
196+
initialDelaySeconds: 120
197+
periodSeconds: 15
198+
timeoutSeconds: 5
199+
failureThreshold: 20
189200
- op: add
190201
path: /spec/template/spec/containers/0/imagePullPolicy
191202
value: "IfNotPresent"
@@ -244,22 +255,22 @@ jobs:
244255
245256
# Wait for PVC to be bound
246257
echo "Waiting for PVC to be bound..."
247-
kubectl wait --for=jsonpath='{.status.phase}'=Bound pvc/semantic-router-models -n vllm-semantic-router-system --timeout=120s || {
258+
kubectl wait --for=jsonpath='{.status.phase}'=Bound pvc/semantic-router-models -n vllm-semantic-router-system --timeout=300s || {
248259
echo "PVC binding timeout. Checking PVC status..."
249260
kubectl describe pvc -n vllm-semantic-router-system
250261
exit 1
251262
}
252263
253264
# Wait for pods to be created
254265
echo "Waiting for pods to be created..."
255-
timeout 120 bash -c 'until kubectl get pods -n vllm-semantic-router-system | grep -q semantic-router; do echo "Waiting for pod creation..."; sleep 5; done'
266+
timeout 300 bash -c 'until kubectl get pods -n vllm-semantic-router-system | grep -q semantic-router; do echo "Waiting for pod creation..."; sleep 5; done'
256267
257268
# Show pod status
258269
kubectl get pods -n vllm-semantic-router-system
259270
260271
# Wait for init container to complete (model download)
261272
echo "Waiting for init container to complete (downloading models)..."
262-
kubectl wait --for=condition=Initialized pods -l app=semantic-router -n vllm-semantic-router-system --timeout=600s || {
273+
kubectl wait --for=condition=Initialized pods -l app=semantic-router -n vllm-semantic-router-system --timeout=1200s || {
263274
echo "❌ Init container did not complete in time. Showing logs..."
264275
kubectl logs -n vllm-semantic-router-system -l app=semantic-router -c model-downloader --tail=200 || true
265276
kubectl describe pods -n vllm-semantic-router-system -l app=semantic-router
@@ -268,7 +279,7 @@ jobs:
268279
269280
# Wait for main container to be ready (increased timeout for model loading)
270281
echo "Waiting for main container to be ready..."
271-
kubectl wait --for=condition=Ready pods -l app=semantic-router -n vllm-semantic-router-system --timeout=600s || {
282+
kubectl wait --for=condition=Ready pods -l app=semantic-router -n vllm-semantic-router-system --timeout=1200s || {
272283
echo "❌ Pod did not become ready in time. Showing status and logs..."
273284
kubectl describe pods -n vllm-semantic-router-system -l app=semantic-router
274285
kubectl logs -n vllm-semantic-router-system -l app=semantic-router --tail=200 || true

deploy/kubernetes/deployment.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -141,6 +141,7 @@ spec:
141141
periodSeconds: 30
142142
timeoutSeconds: 10
143143
failureThreshold: 3
144+
# Note: CI overrides readinessProbe via workflow kustomize patch to use HTTP GET /health on port 'classify-api'
144145
readinessProbe:
145146
tcpSocket:
146147
port: 50051

0 commit comments

Comments
 (0)