diff --git a/vllm/v1/engine/processor.py b/vllm/v1/engine/processor.py index 69509d5d4712a..0404f6ff2771c 100644 --- a/vllm/v1/engine/processor.py +++ b/vllm/v1/engine/processor.py @@ -579,6 +579,7 @@ class Processor: prompt_len == max_prompt_len and prompt_type == "decoder" and not model_config.is_multimodal_model + and self.model_config.runner_type != "pooling" ): suggestion = ( "Make sure that `max_model_len` is no smaller than the "