diff --git a/tests/models/language/generation/test_hybrid.py b/tests/models/language/generation/test_hybrid.py index e60a86075b8bc..9d67b46f2e3e4 100644 --- a/tests/models/language/generation/test_hybrid.py +++ b/tests/models/language/generation/test_hybrid.py @@ -240,12 +240,12 @@ def test_distributed_correctness( num_logprobs: int, ) -> None: with vllm_runner(model, tensor_parallel_size=1, - max_num_seqs=2) as vllm_model: + max_num_seqs=MAX_NUM_SEQS) as vllm_model: vllm_outputs_tp_1 = vllm_model.generate_greedy_logprobs( example_prompts, max_tokens, num_logprobs) with vllm_runner(model, tensor_parallel_size=2, - max_num_seqs=2) as vllm_model: + max_num_seqs=MAX_NUM_SEQS) as vllm_model: vllm_outputs_tp_2 = vllm_model.generate_greedy_logprobs( example_prompts, max_tokens, num_logprobs)