File tree Expand file tree Collapse file tree 3 files changed +5
-8
lines changed
charts/model-engine/templates
model-engine/model_engine_server Expand file tree Collapse file tree 3 files changed +5
-8
lines changed Original file line number Diff line number Diff line change @@ -127,6 +127,7 @@ data:
127127 port: ${FORWARDER_PORT}
128128 initialDelaySeconds: ${READINESS_INITIAL_DELAY}
129129 periodSeconds: 5
130+ timeoutSeconds: 5
130131 resources:
131132 requests:
132133 cpu: 0.1
@@ -172,6 +173,7 @@ data:
172173 port: ${FORWARDER_PORT}
173174 initialDelaySeconds: ${READINESS_INITIAL_DELAY}
174175 periodSeconds: 5
176+ timeoutSeconds: 5
175177 resources:
176178 requests:
177179 cpu: 0.1
@@ -285,11 +287,6 @@ data:
285287 port: ${USER_CONTAINER_PORT}
286288 initialDelaySeconds: ${READINESS_INITIAL_DELAY}
287289 periodSeconds: 5
288- livenessProbe:
289- httpGet:
290- path: ${HEALTHCHECK_ROUTE}
291- port: ${USER_CONTAINER_PORT}
292- initialDelaySeconds: ${READINESS_INITIAL_DELAY}
293290 timeoutSeconds: 5
294291 resources:
295292 requests:
Original file line number Diff line number Diff line change 4343 GpuType .NVIDIA_AMPERE_A100E : A100_INSTANCE_LIMITS ,
4444}
4545
46- FORWARDER_CPU_USAGE = 0.5
47- FORWARDER_MEMORY_USAGE = "1Gi "
46+ FORWARDER_CPU_USAGE = 1
47+ FORWARDER_MEMORY_USAGE = "2Gi "
4848FORWARDER_STORAGE_USAGE = "1G"
4949
5050logger = make_logger (filename_wo_ext (__name__ ))
Original file line number Diff line number Diff line change @@ -16,4 +16,4 @@ forwarder:
1616 batch_route : null
1717 model_engine_unwrap : true
1818 serialize_results_as_string : false
19- max_concurrency : 20
19+ max_concurrency : 100
You can’t perform that action at this time.
0 commit comments