mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-12 03:13:36 +08:00
fix attention free models
Signed-off-by: Xingyu Liu <charlotteliu12x@gmail.com>
This commit is contained in:
parent
0a4f4724ef
commit
1cf506d89e
@ -269,6 +269,22 @@ class ModelArchConfigConvertorBase:
|
|||||||
return model_arch_config
|
return model_arch_config
|
||||||
|
|
||||||
|
|
||||||
|
class MambaModelArchConfigConvertor(ModelArchConfigConvertorBase):
    """Arch-config convertor whose attention-related getters report zero.

    Both overrides below return the constant ``0`` and read no state from
    the instance or from the underlying HF config.

    NOTE(review): presumably used for attention-free Mamba-style models
    (the registry maps the "mamba" and "mamba2" model types to this class);
    confirm against the callers of these getters.
    """

    def get_head_size(self) -> int:
        """Return the attention head size, which is always ``0`` here."""
        return 0

    def get_total_num_kv_heads(self) -> int:
        """Return the total number of KV heads, which is always ``0`` here."""
        return 0
|
||||||
|
|
||||||
|
|
||||||
|
class TerratorchModelArchConfigConvertor(ModelArchConfigConvertorBase):
    """Arch-config convertor whose attention-related getters report zero.

    Both overrides below return the constant ``0`` and read no state from
    the instance or from the underlying HF config.

    NOTE(review): presumably used for attention-free models served through
    Terratorch (the registry maps the "terratorch" model type to this
    class); confirm against the callers of these getters.
    """

    def get_head_size(self) -> int:
        """Return the attention head size, which is always ``0`` here."""
        return 0

    def get_total_num_kv_heads(self) -> int:
        """Return the total number of KV heads, which is always ``0`` here."""
        return 0
|
||||||
|
|
||||||
|
|
||||||
class Zamba2ModelArchConfigConvertor(ModelArchConfigConvertorBase):
|
class Zamba2ModelArchConfigConvertor(ModelArchConfigConvertorBase):
|
||||||
def get_head_size(self) -> int:
|
def get_head_size(self) -> int:
|
||||||
return getattr(self.hf_text_config, "attention_head_dim", 0)
|
return getattr(self.hf_text_config, "attention_head_dim", 0)
|
||||||
@ -357,6 +373,9 @@ class LongCatFlashMTPModelArchConfigConvertor(ModelArchConfigConvertorBase):
|
|||||||
|
|
||||||
# hf_config.model_type -> convertor class
|
# hf_config.model_type -> convertor class
|
||||||
MODEL_ARCH_CONFIG_CONVERTORS = {
|
MODEL_ARCH_CONFIG_CONVERTORS = {
|
||||||
|
"mamba": MambaModelArchConfigConvertor,
|
||||||
|
"mamba2": MambaModelArchConfigConvertor,
|
||||||
|
"terratorch": TerratorchModelArchConfigConvertor,
|
||||||
"zamba2": Zamba2ModelArchConfigConvertor,
|
"zamba2": Zamba2ModelArchConfigConvertor,
|
||||||
"mpt": MPTModelArchConfigConvertor,
|
"mpt": MPTModelArchConfigConvertor,
|
||||||
"dbrx": DbrxModelArchConfigConvertor,
|
"dbrx": DbrxModelArchConfigConvertor,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user