[Refactor] Move freezing_value/cuda_event initialization outside try/finally (#23758)

Signed-off-by: Andy Xie <andy.xning@gmail.com>
2025-12-25 16:14:03 +08:00 · 2025-08-30 21:42:25 +08:00 · 2025-08-30 21:42:25 +08:00 · e80bca309e
commit e80bca309e
parent fb4983e112
1 changed files with 3 additions and 3 deletions
--- a/vllm/v1/worker/cpu_model_runner.py
+++ b/vllm/v1/worker/cpu_model_runner.py
@ -128,8 +128,8 @@ def _torch_cuda_wrapper():
            self.record = lambda: None
            self.synchronize = lambda: None

+    cuda_event = torch.cuda.Event
    try:
-        cuda_event = torch.cuda.Event
        torch.cuda.Event = _EventPlaceholder
        yield
    finally:
@ -141,9 +141,9 @@ def _set_global_compilation_settings(config: VllmConfig):
    import torch._inductor.config

    inductor_config = config.compilation_config.inductor_compile_config
+    # Note: The MKLDNN and CPPGEMM backends require freezing parameters.
+    freezing_value = torch._inductor.config.freezing
    try:
-        # Note: The MKLDNN and CPPGEMM backend requires freezing parameters.
-        freezing_value = torch._inductor.config.freezing
        if inductor_config.get("max_autotune", False):
            torch._inductor.config.freezing = True
        yield