mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-25 17:34:03 +08:00
[Bugfix][CPU] Disable dual stream execution for experts on CPU (#27320)
Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
parent
1f633b8632
commit
843af7f7fc
@ -297,6 +297,9 @@ class CpuPlatform(Platform):
|
||||
# Disable torch asynchronous compilation, which does not work with daemonic processes
|
||||
os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
|
||||
|
||||
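# Disable multi-stream execution for shared experts, since there are no streams on CPU.
# NOTE(review): the value "0" conventionally reads as "off" for a DISABLE_* flag; confirm how this variable is parsed.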
|
||||
os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "0"
|
||||
|
||||
# Intel OpenMP setting
|
||||
ld_prealod_str = os.getenv("LD_PRELOAD", "")
|
||||
if "libiomp5.so" in ld_prealod_str:
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user