@property
def is_hybrid(self) -> bool:
    """Report whether the model should be treated as a hybrid model.

    Property of ``ModelConfig`` (``vllm/config/model.py``).

    Returns:
        ``False`` when ``self.hf_config.layer_types`` is a non-empty
        sequence whose entries are all ``"attention"``; otherwise the
        value of ``self._model_info.is_hybrid``.
    """
    # Handle granite-4.0-micro case which uses hybrid config but does not
    # actually contain any non-attention layers.
    layer_types = getattr(self.hf_config, "layer_types", None)

    # Truthiness check (not just ``is not None``): ``all()`` over an empty
    # sequence is vacuously True, so an empty ``layer_types`` would
    # otherwise be reported as attention-only without any layer actually
    # saying so. With nothing listed, defer to the model info instead.
    if layer_types and all(layer == "attention" for layer in layer_types):
        return False

    return self._model_info.is_hybrid