diff --git a/docs/source/models/supported_models.md b/docs/source/models/supported_models.md
index 5db82c8e5567d..bcbd7bf9600c5 100644
--- a/docs/source/models/supported_models.md
+++ b/docs/source/models/supported_models.md
@@ -786,9 +786,9 @@ See [this page](#generative-models) for more information on how to use generativ
   *
   * ✅︎
 - * `InternVLChatModel`
-  * InternVL 2.5, Mono-InternVL, InternVL 2.0
+  * InternVideo 2.5, InternVL 2.5, Mono-InternVL, InternVL 2.0
   * T + IE+
-  * `OpenGVLab/InternVL2_5-4B`, `OpenGVLab/Mono-InternVL-2B`, `OpenGVLab/InternVL2-4B`, etc.
+  * `OpenGVLab/InternVideo2_5_Chat_8B`, `OpenGVLab/InternVL2_5-4B`, `OpenGVLab/Mono-InternVL-2B`, `OpenGVLab/InternVL2-4B`, etc.
   *
   * ✅︎
   * ✅︎
diff --git a/vllm/model_executor/models/internvl.py b/vllm/model_executor/models/internvl.py
index 1aa8455bad821..fcaf7fecaafc9 100644
--- a/vllm/model_executor/models/internvl.py
+++ b/vllm/model_executor/models/internvl.py
@@ -981,5 +981,12 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP):
 
     def load_weights(self, weights: Iterable[Tuple[str,
                                                    torch.Tensor]]) -> Set[str]:
-        loader = AutoWeightsLoader(self)
+        # unused modules appear in OpenGVLab/InternVideo2_5_Chat_8B
+        skip_prefixes = [
+            "action_embed", "temporal_embed", "track_embed",
+            "track_embed_decoder", "box_token", "cg_criterion", "cg_model",
+            "loc_encoder", "loc_decoder", "sam", "temporal_token",
+            "track_token"
+        ]
+        loader = AutoWeightsLoader(self, skip_prefixes=skip_prefixes)
         return loader.load_weights(weights)