
Commit 4f9ce35

[CI][Bugfix] Fix token counting in chunked prefill compl test (vllm-project#31630)
Signed-off-by: Andreas Karatzas <akaratza@amd.com>
Parent commit: 97a0130

File tree: 1 file changed (+4, -1 lines)


tests/entrypoints/openai/test_chunked_prompt.py

Lines changed: 4 additions & 1 deletion
@@ -66,8 +66,11 @@ async def test_completion_stream_options_and_logprobs_with_long_prompts(
                 chunk.usage.prompt_tokens + chunk.usage.completion_tokens
             )
         if not finished:
-            tokens_received += 1
             assert chunk.choices[0].text
+            # Count actual tokens from logprobs since multiple tokens
+            # can be batched into a single chunk
+            assert chunk.choices[0].logprobs and chunk.choices[0].logprobs.tokens
+            tokens_received += len(chunk.choices[0].logprobs.tokens)
 
         if chunk.choices[0].finish_reason is not None:
             finished = True
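
For context, a minimal sketch of the counting bug this commit fixes (hypothetical chunk data, not taken from the test): with chunked prefill, one streamed chunk can carry several tokens, so incrementing a counter once per chunk undercounts relative to usage.completion_tokens, while summing len(logprobs.tokens) counts the tokens actually delivered.

    from dataclasses import dataclass, field

    @dataclass
    class Logprobs:
        tokens: list[str] = field(default_factory=list)

    @dataclass
    class Choice:
        # Simplified stand-in for an OpenAI-style streamed completion choice.
        text: str
        logprobs: Logprobs
        finish_reason: str | None = None

    # Three chunks carrying five tokens total: the middle chunk batches
    # three tokens, as chunked prefill can produce in a single event.
    chunks = [
        Choice(text="Hel", logprobs=Logprobs(tokens=["Hel"])),
        Choice(text="lo world", logprobs=Logprobs(tokens=["lo", " wor", "ld"])),
        Choice(text="!", logprobs=Logprobs(tokens=["!"]), finish_reason="stop"),
    ]

    buggy_count = sum(1 for _ in chunks)                       # 3: one per chunk
    fixed_count = sum(len(c.logprobs.tokens) for c in chunks)  # 5: actual tokens

    assert buggy_count == 3 and fixed_count == 5
    print(f"per-chunk: {buggy_count}, per-token: {fixed_count}")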
