We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9098ae8 commit 5f0647f (Copy full SHA for 5f0647f)
lmdeploy/cli/serve.py
@@ -359,6 +359,8 @@ def api_server(args):
359
cache_block_seq_len=args.cache_block_seq_len,
360
enable_prefix_caching=args.enable_prefix_caching,
361
max_prefill_token_num=args.max_prefill_token_num,
362
+ num_tokens_per_iter=args.num_tokens_per_iter,
363
+ max_prefill_iters=args.max_prefill_iters,
364
communicator=args.communicator,
365
hf_overrides=args.hf_overrides)
366
chat_template_config = get_chat_template(args.chat_template)
0 commit comments