[Bugfix] Fix torch.compile() error when using MultiprocessingGPUExecutor (#5229)

2025-12-10 13:36:12 +08:00 · 2024-06-03 20:55:50 -07:00 · 2024-06-03 20:55:50 -07:00 · a58f24e590
commit a58f24e590
parent f42a006b15
1 changed files with 3 additions and 0 deletions
--- a/vllm/executor/multiproc_gpu_executor.py
+++ b/vllm/executor/multiproc_gpu_executor.py
@@ -34,6 +34,9 @@ class MultiprocessingGPUExecutor(DistributedGPUExecutor):
        # Ensure that VLLM_INSTANCE_ID is set, to be inherited by workers
        os.environ["VLLM_INSTANCE_ID"] = get_vllm_instance_id()
        # Disable torch async compiling which won't work with daemonic processes
        os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
        from torch.cuda import device_count
        assert world_size <= device_count(), (
            "please set tensor_parallel_size to less than max local gpu count")