We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c116cc3 commit 66c6973 (Copy full SHA for 66c6973)
xllm/core/framework/batch/batch_factory.cpp
@@ -69,8 +69,10 @@ std::vector<Batch> BatchFactory::create_batches(
69
COUNTER_ADD(num_processing_tokens_total_prompt, num_prompt_tokens);
70
COUNTER_ADD(num_processing_tokens_total_generated, num_generated_tokens);
71
72
- HISTOGRAM_OBSERVE(num_prompt_tokens_per_request, num_prompt_tokens);
73
- HISTOGRAM_OBSERVE(num_generated_tokens_per_request, num_generated_tokens);
+ HISTOGRAM_OBSERVE(num_prompt_tokens_per_request,
+ num_prompt_tokens / running_sequences.size());
74
+ HISTOGRAM_OBSERVE(num_generated_tokens_per_request,
75
+ num_generated_tokens / running_sequences.size());
76
77
return batches;
78
}
0 commit comments