diff --git a/vllm/worker/tpu_worker.py b/vllm/worker/tpu_worker.py index 37d810e8392a9..d58c7dc994184 100644 --- a/vllm/worker/tpu_worker.py +++ b/vllm/worker/tpu_worker.py @@ -215,7 +215,7 @@ class TPUWorker(LoraNotSupportedWorkerBase): assert len(seq_group_metadata_list) > 0 output = self.model_runner.execute_model(seq_group_metadata_list, self.tpu_cache) - return [output] + return output def cache_swap( self,