File tree Expand file tree Collapse file tree 3 files changed +15
-2
lines changed
model-engine/model_engine_server/inference Expand file tree Collapse file tree 3 files changed +15
-2
lines changed Original file line number Diff line number Diff line change @@ -33,7 +33,7 @@ def entrypoint():
3333 parser .add_argument ("--host" , type = str , default = "[::]" )
3434 parser .add_argument ("--port" , type = int , default = 5009 )
3535
36- args = parser .parse_args ()
36+ args , extra_args = parser .parse_known_args ()
3737
3838 command = [
3939 "gunicorn" ,
@@ -48,6 +48,7 @@ def entrypoint():
4848 "--workers" ,
4949 str (args .num_workers ),
5050 "model_engine_server.inference.forwarding.echo_server:app" ,
51+ * extra_args ,
5152 ]
5253 subprocess .run (command )
5354
Original file line number Diff line number Diff line change @@ -138,8 +138,9 @@ def entrypoint():
138138 parser .add_argument ("--host" , type = str , default = "[::]" )
139139 parser .add_argument ("--port" , type = int , default = 5000 )
140140 parser .add_argument ("--set" , type = str , action = "append" )
141+ parser .add_argument ("--graceful-timeout" , type = int , default = 600 )
141142
142- args = parser .parse_args ()
143+ args , extra_args = parser .parse_known_args ()
143144
144145 values = [f"CONFIG_FILE={ args .config } " ]
145146 if args .set is not None :
@@ -160,8 +161,11 @@ def entrypoint():
160161 "uvicorn.workers.UvicornWorker" ,
161162 "--workers" ,
162163 str (args .num_workers ),
164+ "--graceful-timeout" ,
165+ str (args .graceful_timeout ),
163166 * envs ,
164167 "model_engine_server.inference.forwarding.http_forwarder:app" ,
168+ * extra_args ,
165169 ]
166170 subprocess .run (command )
167171
Original file line number Diff line number Diff line change 1+ import argparse
12import os
23import subprocess
34
89
910
1011def start_server ():
12+ parser = argparse .ArgumentParser ()
13+ parser .add_argument ("--graceful-timeout" , type = int , default = 600 )
14+ args , extra_args = parser .parse_known_args ()
15+
1116 # TODO: HTTPS
1217 command = [
1318 "gunicorn" ,
@@ -21,7 +26,10 @@ def start_server():
2126 "uvicorn.workers.UvicornWorker" ,
2227 "--workers" ,
2328 str (NUM_PROCESSES ),
29+ "--graceful-timeout" ,
30+ str (args .graceful_timeout ),
2431 "model_engine_server.inference.sync_inference.fastapi_server:app" ,
32+ * extra_args ,
2533 ]
2634 unset_sensitive_envvars ()
2735 subprocess .run (command )
You can’t perform that action at this time.
0 commit comments