mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-18 03:25:01 +08:00
[ROCm][AMD] Disable auto enabling chunked prefill on ROCm (#11146)
Signed-off-by: Gregory Shtrasberg <Gregory.Shtrasberg@amd.com>
This commit is contained in:
parent
3989a79824
commit
00c1bde5d8
@@ -1074,7 +1074,8 @@ class EngineArgs:
 if (is_gpu and not use_sliding_window and not use_spec_decode
         and not self.enable_lora
         and not self.enable_prompt_adapter
-        and model_config.runner_type != "pooling"):
+        and model_config.runner_type != "pooling"
+        and not current_platform.is_rocm()):
     self.enable_chunked_prefill = True
     logger.warning(
         "Chunked prefill is enabled by default for models with "
Loading…
x
Reference in New Issue
Block a user