From 325aa3dee922b344a26b9e74d9ae3c769828e70e Mon Sep 17 00:00:00 2001 From: Ning Xie Date: Fri, 22 Aug 2025 22:01:35 +0800 Subject: [PATCH] [Misc] local import code clean (#23420) Signed-off-by: Andy Xie --- vllm/v1/worker/gpu_worker.py | 1 - vllm/worker/worker.py | 3 +-- 2 files changed, 1 insertion(+), 3 deletions(-) diff --git a/vllm/v1/worker/gpu_worker.py b/vllm/v1/worker/gpu_worker.py index d61177d4245dd..f83a4f4faeb5e 100644 --- a/vllm/v1/worker/gpu_worker.py +++ b/vllm/v1/worker/gpu_worker.py @@ -292,7 +292,6 @@ class Worker(WorkerBase): allocator = CuMemAllocator.get_instance() context = allocator.use_memory_pool(tag="kv_cache") else: - from contextlib import nullcontext context = nullcontext() with context: self.model_runner.initialize_kv_cache(kv_cache_config) diff --git a/vllm/worker/worker.py b/vllm/worker/worker.py index 7a01e585ba6d0..fc24d95b80f2c 100644 --- a/vllm/worker/worker.py +++ b/vllm/worker/worker.py @@ -3,6 +3,7 @@ """A GPU worker class.""" import gc import os +from contextlib import nullcontext from typing import Dict, List, Optional, Set, Tuple, Type, Union import torch @@ -206,7 +207,6 @@ class Worker(LocalOrDistributedWorkerBase): "used for one instance per process.") context = allocator.use_memory_pool(tag="weights") else: - from contextlib import nullcontext context = nullcontext() with context: self.model_runner.load_model() @@ -330,7 +330,6 @@ class Worker(LocalOrDistributedWorkerBase): allocator = CuMemAllocator.get_instance() context = allocator.use_memory_pool(tag="kv_cache") else: - from contextlib import nullcontext context = nullcontext() with context: self._init_cache_engine()