mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-02 20:57:58 +08:00
[Bugfix][CPU] Disable dual stream execution for experts on CPU (#27320)
Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
parent
1f633b8632
commit
843af7f7fc
@ -297,6 +297,9 @@ class CpuPlatform(Platform):
|
|||||||
# Disable torch async compiling which won't work with daemonic processes
|
# Disable torch async compiling which won't work with daemonic processes
|
||||||
os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
|
os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
|
||||||
|
|
||||||
|
# Disable multi-stream execution for shared experts, since the CPU backend has no Stream support
|
||||||
|
os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "0"
|
||||||
|
|
||||||
# Intel OpenMP setting
|
# Intel OpenMP setting
|
||||||
ld_prealod_str = os.getenv("LD_PRELOAD", "")
|
ld_prealod_str = os.getenv("LD_PRELOAD", "")
|
||||||
if "libiomp5.so" in ld_prealod_str:
|
if "libiomp5.so" in ld_prealod_str:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user