We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c7d7a1b commit 7f4606d · Copy full SHA for 7f4606d
lightllm/server/httpserver/manager.py
@@ -604,6 +604,7 @@ async def _wait_to_token_package(
604
f"prompt_cache_len:{prompt_cache_len} "
605
f"prompt_cache_ratio:{prompt_cache_ratio} "
606
f"cpu_prompt_cache_len:{cpu_prompt_cache_len} "
607
+ f"used_cpu_prompt_cache_len:{cpu_prompt_cache_len - prompt_cache_len} "
608
f"mtp_avg_token_per_step:{mtp_avg_token_per_step} "
609
)
610
if group_request_id < 0:
0 commit comments