We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5446ad1 · commit 0e93ac0 · Copy full SHA for 0e93ac0
tests/models/language/generation/test_hybrid.py
@@ -240,12 +240,12 @@ def test_distributed_correctness(
240
num_logprobs: int,
241
) -> None:
242
with vllm_runner(model, tensor_parallel_size=1,
243
- max_num_seqs=2) as vllm_model:
+ max_num_seqs=MAX_NUM_SEQS) as vllm_model:
244
vllm_outputs_tp_1 = vllm_model.generate_greedy_logprobs(
245
example_prompts, max_tokens, num_logprobs)
246
247
with vllm_runner(model, tensor_parallel_size=2,
248
249
vllm_outputs_tp_2 = vllm_model.generate_greedy_logprobs(
250
251
0 commit comments