@@ -186,6 +186,17 @@ jobs:
186186 - op: replace
187187 path: /spec/template/spec/containers/0/resources/limits/cpu
188188 value: "1"
189+ - op: replace
190+ path: /spec/template/spec/containers/0/readinessProbe
191+ value:
192+ httpGet:
193+ path: /health
194+ port: classify-api
195+ scheme: HTTP
196+ initialDelaySeconds: 120
197+ periodSeconds: 15
198+ timeoutSeconds: 5
199+ failureThreshold: 20
189200 - op: add
190201 path: /spec/template/spec/containers/0/imagePullPolicy
191202 value: "IfNotPresent"
@@ -244,22 +255,22 @@ jobs:
244255
245256 # Wait for PVC to be bound
246257 echo "Waiting for PVC to be bound..."
247- kubectl wait --for=jsonpath='{.status.phase}'=Bound pvc/semantic-router-models -n vllm-semantic-router-system --timeout=120s || {
258+ kubectl wait --for=jsonpath='{.status.phase}'=Bound pvc/semantic-router-models -n vllm-semantic-router-system --timeout=300s || {
248259 echo "PVC binding timeout. Checking PVC status..."
249260 kubectl describe pvc -n vllm-semantic-router-system
250261 exit 1
251262 }
252263
253264 # Wait for pods to be created
254265 echo "Waiting for pods to be created..."
255- timeout 120 bash -c 'until kubectl get pods -n vllm-semantic-router-system | grep -q semantic-router; do echo "Waiting for pod creation..."; sleep 5; done'
266+ timeout 300 bash -c 'until kubectl get pods -n vllm-semantic-router-system | grep -q semantic-router; do echo "Waiting for pod creation..."; sleep 5; done'
256267
257268 # Show pod status
258269 kubectl get pods -n vllm-semantic-router-system
259270
260271 # Wait for init container to complete (model download)
261272 echo "Waiting for init container to complete (downloading models)..."
262- kubectl wait --for=condition=Initialized pods -l app=semantic-router -n vllm-semantic-router-system --timeout=600s || {
273+ kubectl wait --for=condition=Initialized pods -l app=semantic-router -n vllm-semantic-router-system --timeout=1200s || {
263274 echo "❌ Init container did not complete in time. Showing logs..."
264275 kubectl logs -n vllm-semantic-router-system -l app=semantic-router -c model-downloader --tail=200 || true
265276 kubectl describe pods -n vllm-semantic-router-system -l app=semantic-router
@@ -268,7 +279,7 @@ jobs:
268279
269280 # Wait for main container to be ready (increased timeout for model loading)
270281 echo "Waiting for main container to be ready..."
271- kubectl wait --for=condition=Ready pods -l app=semantic-router -n vllm-semantic-router-system --timeout=600s || {
282+ kubectl wait --for=condition=Ready pods -l app=semantic-router -n vllm-semantic-router-system --timeout=1200s || {
272283 echo "❌ Pod did not become ready in time. Showing status and logs..."
273284 kubectl describe pods -n vllm-semantic-router-system -l app=semantic-router
274285 kubectl logs -n vllm-semantic-router-system -l app=semantic-router --tail=200 || true
0 commit comments