Signed-off-by: bk-201 <joy25810@foxmail.com>
This commit is contained in:
bk-201 2025-12-20 04:05:59 +00:00
parent d053aa73e1
commit 9c9950c080

View File

@ -121,7 +121,7 @@ class LoRAModelManager:
) )
self.punica_wrapper_mapping: dict[str, PunicaWrapperBase] = {} self.punica_wrapper_mapping: dict[str, PunicaWrapperBase] = {}
if self.supports_mm: if self.supports_mm:
self._maybe_init_mm(vllm_config,max_num_batched_tokens) self._maybe_init_mm(vllm_config, max_num_batched_tokens)
else: else:
llm_punica_wrapper = get_punica_wrapper( llm_punica_wrapper = get_punica_wrapper(
max_num_batched_tokens, max_num_batched_tokens,
@ -350,7 +350,7 @@ class LoRAModelManager:
punica_wrapper = self._get_punica_wrapper(target_prefix) punica_wrapper = self._get_punica_wrapper(target_prefix)
assert punica_wrapper is not None assert punica_wrapper is not None
punica_wrapper.wrapper.update_metadata( punica_wrapper.update_metadata(
mapping, mapping,
self.lora_index_to_id, self.lora_index_to_id,
self.lora_slots + 1, self.lora_slots + 1,
@ -563,16 +563,12 @@ class LoRAModelManager:
if not self.supports_mm: if not self.supports_mm:
return self.punica_wrapper_mapping[DEFAULT_LANGUAGE_WRAPPER_KEY] return self.punica_wrapper_mapping[DEFAULT_LANGUAGE_WRAPPER_KEY]
# For multimodal model # For multimodal model
# for prefix, wrapper in self.punica_wrapper_mapping.items(): # NOTE Sort by prefix length (descending) to match the longest prefix first
# is_language_model = ( # e.g., 'visual.merger' should match 'visual.merger' instead of 'visual.'
# prefix == DEFAULT_LANGUAGE_WRAPPER_KEY for prefix in sorted(self.punica_wrapper_mapping.keys(), key=len, reverse=True):
# and module_name.startswith(self.mm_mapping.language_model[0]) if module_name.startswith(prefix):
# ) return self.punica_wrapper_mapping[prefix]
# if is_language_model or module_name.startswith(prefix):
# return LoRATarget(wrapper=wrapper, prefix=prefix)
return None return None