[Bugfix][CPU] Disable dual stream execution for experts on CPU (#27320)

Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
Li, Jiang 2025-10-22 19:02:27 +08:00 committed by GitHub
parent 1f633b8632
commit 843af7f7fc
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -297,6 +297,9 @@ class CpuPlatform(Platform):
# Disable torch async compiling which won't work with daemonic processes
os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
# Disable multi-stream for shared experts as no Stream on CPU
os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "0"
# Intel OpenMP setting
ld_prealod_str = os.getenv("LD_PRELOAD", "")
if "libiomp5.so" in ld_prealod_str: