diff --git a/tests/v1/e2e/test_lora_with_spec_decode.py b/tests/v1/e2e/test_lora_with_spec_decode.py index 14532f2795443..8c9ab58c3c0ab 100644 --- a/tests/v1/e2e/test_lora_with_spec_decode.py +++ b/tests/v1/e2e/test_lora_with_spec_decode.py @@ -61,8 +61,6 @@ def test_batch_inference_correctness( model_setup: (method, model_name, spec_model_name, lora_path, tp_size) """ with monkeypatch.context() as m: - m.setenv("VLLM_USE_V1", "1") - # Disable randomness m.setenv("CUBLAS_WORKSPACE_CONFIG", ":4096:8") torch.manual_seed(SEED)