Use math.prod instead of np.prod for trivial ops (#14142)

2026-07-16 03:27:10 +08:00 · 2025-03-04 00:09:22 -05:00 · 2025-03-04 00:09:22 -05:00 · 66233af7b6
commit 66233af7b6
parent bf13d40972
1 changed file with 2 additions and 2 deletions
--- a/vllm/worker/cache_engine.py
+++ b/vllm/worker/cache_engine.py
@@ -1,8 +1,8 @@
 # SPDX-License-Identifier: Apache-2.0
 """CacheEngine class for managing the KV cache."""
+from math import prod
 from typing import List

-import numpy as np
 import torch

 from vllm import envs
@@ -90,7 +90,7 @@ class CacheEngine:
            # NOTE this assumption currently only holds for MLA so we only apply
            # this optimization when `use_mla` is true
            entry_shape = kv_cache_shape[2:]
-            entry_size = np.prod(entry_shape)
+            entry_size = prod(entry_shape)
            alloc_entry_size = align_to_256bytes(entry_size, self.dtype)
            alloc_shape = (*kv_cache_shape[:2], alloc_entry_size)
        else: