We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
VLLM_DISABLE_SHARED_EXPERTS_STREAM
1 parent b6a248b, commit d79d9f0 (Copy full SHA for d79d9f0)
vllm/platforms/cpu.py
@@ -299,7 +299,7 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
299
os.environ["TORCHINDUCTOR_COMPILE_THREADS"] = "1"
300
301
# Disable multi-stream for shared experts as no Stream on CPU
302
- os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "0"
+ os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "1"
303
304
# Intel OpenMP setting
305
ld_preload_str = os.getenv("LD_PRELOAD", "")
0 commit comments