We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d9e3f88, commit 09cc4e2 (Copy full SHA for 09cc4e2)
fastdeploy/entrypoints/openai/serving_completion.py
@@ -358,6 +358,7 @@ async def completion_stream_generator(
358
usage=UsageInfo(
359
prompt_tokens=len(prompt_batched_token_ids[idx]),
360
completion_tokens=output_tokens[idx],
361
+ total_tokens=len(prompt_batched_token_ids[idx]) + output_tokens[idx],
362
),
363
)
364
yield f"data: {usage_chunk.model_dump_json(exclude_unset=True)}\n\n"
0 commit comments