From 6fe58876528751a808c0d25016d3c97b432b909f Mon Sep 17 00:00:00 2001 From: Isotr0py Date: Thu, 18 Dec 2025 11:54:39 +0800 Subject: [PATCH] [Chore] Remove v0 dead code for Qwen2.5-omni (#30883) Signed-off-by: Isotr0py --- .../models/qwen2_5_omni_thinker.py | 22 ------------------- 1 file changed, 22 deletions(-) diff --git a/vllm/model_executor/models/qwen2_5_omni_thinker.py b/vllm/model_executor/models/qwen2_5_omni_thinker.py index f9bce4bf981b2..94deeb867c9f8 100644 --- a/vllm/model_executor/models/qwen2_5_omni_thinker.py +++ b/vllm/model_executor/models/qwen2_5_omni_thinker.py @@ -70,7 +70,6 @@ from vllm.multimodal.inputs import ( MultiModalFeatureSpec, MultiModalFieldConfig, MultiModalKwargsItems, - NestedTensors, ) from vllm.multimodal.parse import ( AudioProcessorItems, @@ -1150,27 +1149,6 @@ class Qwen2_5OmniThinkerForConditionalGeneration( handle_oov_mm_token=handle_oov_mm_token, ) - def embed_multimodal_v0(self, **kwargs: object) -> NestedTensors | None: - audio_input = self._parse_and_validate_audio_input(**kwargs) - image_input = self._parse_and_validate_image_input(**kwargs) - video_input = self._parse_and_validate_video_input(**kwargs) - - if audio_input is None and image_input is None and video_input is None: - return None - - multimodal_embeddings: list[tuple[NestedTensors, str]] = [] - - if audio_input is not None: - audio_embeds = self._process_audio_input(audio_input) - multimodal_embeddings.append((audio_embeds, "audio")) - if image_input is not None: - image_embeds = self._process_image_input(image_input) - multimodal_embeddings.append((image_embeds, "image")) - if video_input is not None: - video_embeds = self._process_video_input(video_input) - multimodal_embeddings.append((video_embeds, "video")) - return multimodal_embeddings - def forward( self, input_ids: torch.Tensor,