From b1340f9d55cd36a92aff713213e95f354a1bd1b4 Mon Sep 17 00:00:00 2001 From: Robert Shaw <114415538+robertgshaw2-redhat@users.noreply.github.com> Date: Fri, 31 Jan 2025 21:32:04 -0500 Subject: [PATCH] [V1] Bugfix: Validate Model Input Length (#12600) SUMMARY: * avoid crashing the engine when we get an input longer than max_model_len FIX #12567 --- vllm/v1/engine/processor.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/vllm/v1/engine/processor.py b/vllm/v1/engine/processor.py index 43419d2ff5381..6196c11052078 100644 --- a/vllm/v1/engine/processor.py +++ b/vllm/v1/engine/processor.py @@ -206,6 +206,11 @@ class Processor: if prompt_ids is None or len(prompt_ids) == 0: raise ValueError("Prompt cannot be empty") + if len(prompt_ids) >= self.model_config.max_model_len: + raise ValueError( + f"Prompt length of {len(prompt_ids)} is longer than the " + f"maximum model length of {self.model_config.max_model_len}.") + if self.model_config.is_multimodal_model: max_prompt_len = self.model_config.max_model_len