mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-19 19:26:59 +08:00
fix
Signed-off-by: bk-201 <joy25810@foxmail.com>
This commit is contained in:
parent
d053aa73e1
commit
9c9950c080
@ -121,7 +121,7 @@ class LoRAModelManager:
|
|||||||
)
|
)
|
||||||
self.punica_wrapper_mapping: dict[str, PunicaWrapperBase] = {}
|
self.punica_wrapper_mapping: dict[str, PunicaWrapperBase] = {}
|
||||||
if self.supports_mm:
|
if self.supports_mm:
|
||||||
self._maybe_init_mm(vllm_config,max_num_batched_tokens)
|
self._maybe_init_mm(vllm_config, max_num_batched_tokens)
|
||||||
else:
|
else:
|
||||||
llm_punica_wrapper = get_punica_wrapper(
|
llm_punica_wrapper = get_punica_wrapper(
|
||||||
max_num_batched_tokens,
|
max_num_batched_tokens,
|
||||||
@ -350,7 +350,7 @@ class LoRAModelManager:
|
|||||||
punica_wrapper = self._get_punica_wrapper(target_prefix)
|
punica_wrapper = self._get_punica_wrapper(target_prefix)
|
||||||
assert punica_wrapper is not None
|
assert punica_wrapper is not None
|
||||||
|
|
||||||
punica_wrapper.wrapper.update_metadata(
|
punica_wrapper.update_metadata(
|
||||||
mapping,
|
mapping,
|
||||||
self.lora_index_to_id,
|
self.lora_index_to_id,
|
||||||
self.lora_slots + 1,
|
self.lora_slots + 1,
|
||||||
@ -563,16 +563,12 @@ class LoRAModelManager:
|
|||||||
if not self.supports_mm:
|
if not self.supports_mm:
|
||||||
return self.punica_wrapper_mapping[DEFAULT_LANGUAGE_WRAPPER_KEY]
|
return self.punica_wrapper_mapping[DEFAULT_LANGUAGE_WRAPPER_KEY]
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
# For multimodal model
|
# For multimodal model
|
||||||
# for prefix, wrapper in self.punica_wrapper_mapping.items():
|
# NOTE Sort by prefix length (descending) to match the longest prefix first
|
||||||
# is_language_model = (
|
# e.g., 'visual.merger' should match 'visual.merger' instead of 'visual.'
|
||||||
# prefix == DEFAULT_LANGUAGE_WRAPPER_KEY
|
for prefix in sorted(self.punica_wrapper_mapping.keys(), key=len, reverse=True):
|
||||||
# and module_name.startswith(self.mm_mapping.language_model[0])
|
if module_name.startswith(prefix):
|
||||||
# )
|
return self.punica_wrapper_mapping[prefix]
|
||||||
# if is_language_model or module_name.startswith(prefix):
|
|
||||||
# return LoRATarget(wrapper=wrapper, prefix=prefix)
|
|
||||||
|
|
||||||
return None
|
return None
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user