def get_supported_tasks(self) -> tuple[SupportedTask, ...]:
    """Return the tasks supported by this worker's model runner.

    The result is obtained by delegating to
    ``self.model_runner.get_supported_tasks()`` and is passed through
    unchanged.

    Returns:
        The value reported by the model runner, annotated as a tuple of
        ``SupportedTask`` entries.
    """
    # Do not short-circuit with a hard-coded value such as "generate":
    # a bare string violates the declared tuple return type and hides
    # whatever the model runner actually reports.
    return self.model_runner.get_supported_tasks()