[Misc]Minor Changes about Worker (#11555)

Signed-off-by: Chenguang Li <757486878@qq.com>
2026-06-30 19:47:21 +08:00 · 2025-01-13 15:47:05 +08:00 · 2025-01-13 15:47:05 +08:00 · c3f05b09a0
commit c3f05b09a0
parent cf6bbcb493
2 changed files with 0 additions and 2 deletions
--- a/vllm/v1/worker/gpu_worker.py
+++ b/vllm/v1/worker/gpu_worker.py
@@ -132,7 +132,6 @@ class Worker:
        # Execute a forward pass with dummy inputs to profile the memory usage
        # of the model.
        self.model_runner.profile_run()
-        torch.cuda.synchronize()

        free_gpu_memory, _ = torch.cuda.mem_get_info()
        # NOTE(woosuk): Here we assume that the other processes using the same
--- a/vllm/worker/worker.py
+++ b/vllm/worker/worker.py
@@ -200,7 +200,6 @@ class Worker(LocalOrDistributedWorkerBase):
                              weights_memory_in_bytes=self.model_runner.
                              model_memory_usage) as result:
            self.model_runner.profile_run()
-            torch.cuda.synchronize()

        self._assert_memory_footprint_increased_during_profiling()