diff --git a/vllm/model_executor/models/transformers.py b/vllm/model_executor/models/transformers.py index 6ea149506581c..bdc390689104e 100644 --- a/vllm/model_executor/models/transformers.py +++ b/vllm/model_executor/models/transformers.py @@ -229,7 +229,10 @@ class TransformersModel(nn.Module): Apply the model's tensor parallelization plan. Currently only supports linear layers. """ - if self.tp_size > 1 and self.config.base_model_tp_plan is None: + if not self.model.supports_tp_plan: + if self.tp_size <= 1: + return + raise ValueError( f"{type(self.model)} does not support tensor parallel yet!")