mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-31 00:17:09 +08:00
[Ernie 4.5] Name Change for Base 0.3B Model (#21735)
Signed-off-by: vasqu <antonprogamer@gmail.com>
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
Co-authored-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
parent
63fe3a700f
commit
656c24f1b5
@@ -336,7 +336,7 @@ th {
|
|||||||
| `DeepseekV2ForCausalLM` | DeepSeek-V2 | `deepseek-ai/DeepSeek-V2`, `deepseek-ai/DeepSeek-V2-Chat`, etc. | | ✅︎ | ✅︎ |
|
| `DeepseekV2ForCausalLM` | DeepSeek-V2 | `deepseek-ai/DeepSeek-V2`, `deepseek-ai/DeepSeek-V2-Chat`, etc. | | ✅︎ | ✅︎ |
|
||||||
| `DeepseekV3ForCausalLM` | DeepSeek-V3 | `deepseek-ai/DeepSeek-V3-Base`, `deepseek-ai/DeepSeek-V3`, etc. | | ✅︎ | ✅︎ |
|
| `DeepseekV3ForCausalLM` | DeepSeek-V3 | `deepseek-ai/DeepSeek-V3-Base`, `deepseek-ai/DeepSeek-V3`, etc. | | ✅︎ | ✅︎ |
|
||||||
| `Dots1ForCausalLM` | dots.llm1 | `rednote-hilab/dots.llm1.base`, `rednote-hilab/dots.llm1.inst`, etc. | | ✅︎ | ✅︎ |
|
| `Dots1ForCausalLM` | dots.llm1 | `rednote-hilab/dots.llm1.base`, `rednote-hilab/dots.llm1.inst`, etc. | | ✅︎ | ✅︎ |
|
||||||
| `Ernie4_5_ForCausalLM` | Ernie4.5 | `baidu/ERNIE-4.5-0.3B-PT`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
| `Ernie4_5ForCausalLM` | Ernie4.5 | `baidu/ERNIE-4.5-0.3B-PT`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
||||||
| `Ernie4_5_MoeForCausalLM` | Ernie4.5MoE | `baidu/ERNIE-4.5-21B-A3B-PT`, `baidu/ERNIE-4.5-300B-A47B-PT`, etc. |✅︎| ✅︎ | ✅︎ |
|
| `Ernie4_5_MoeForCausalLM` | Ernie4.5MoE | `baidu/ERNIE-4.5-21B-A3B-PT`, `baidu/ERNIE-4.5-300B-A47B-PT`, etc. |✅︎| ✅︎ | ✅︎ |
|
||||||
| `ExaoneForCausalLM` | EXAONE-3 | `LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
| `ExaoneForCausalLM` | EXAONE-3 | `LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
||||||
| `Exaone4ForCausalLM` | EXAONE-4 | `LGAI-EXAONE/EXAONE-4.0-32B`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
| `Exaone4ForCausalLM` | EXAONE-4 | `LGAI-EXAONE/EXAONE-4.0-32B`, etc. | ✅︎ | ✅︎ | ✅︎ |
|
||||||
@@ -634,10 +634,10 @@ Some models are supported only via the [Transformers backend](#transformers). Th
|
|||||||
|--------------|--------|--------|-------------------|-----------------------------|-----------------------------------------|---------------------|
|
|--------------|--------|--------|-------------------|-----------------------------|-----------------------------------------|---------------------|
|
||||||
| `Emu3ForConditionalGeneration` | Emu3 | T + I | `BAAI/Emu3-Chat-hf` | ✅︎ | ✅︎ | ✅︎ |
|
| `Emu3ForConditionalGeneration` | Emu3 | T + I | `BAAI/Emu3-Chat-hf` | ✅︎ | ✅︎ | ✅︎ |
|
||||||
|
|
||||||
<sup>^</sup> You need to set the architecture name via `--hf-overrides` to match the one in vLLM.
|
<sup>^</sup> You need to set the architecture name via `--hf-overrides` to match the one in vLLM.
|
||||||
• For example, to use DeepSeek-VL2 series models:
|
• For example, to use DeepSeek-VL2 series models:
|
||||||
`--hf-overrides '{"architectures": ["DeepseekVLV2ForCausalLM"]}'`
|
`--hf-overrides '{"architectures": ["DeepseekVLV2ForCausalLM"]}'`
|
||||||
<sup>E</sup> Pre-computed embeddings can be inputted for this modality.
|
<sup>E</sup> Pre-computed embeddings can be inputted for this modality.
|
||||||
<sup>+</sup> Multiple items can be inputted per text prompt for this modality.
|
<sup>+</sup> Multiple items can be inputted per text prompt for this modality.
|
||||||
|
|
||||||
!!! warning
|
!!! warning
|
||||||
|
|||||||
@@ -166,7 +166,7 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
|
|||||||
trust_remote_code=True),
|
trust_remote_code=True),
|
||||||
"DeepseekV3ForCausalLM": _HfExamplesInfo("deepseek-ai/DeepSeek-V3", # noqa: E501
|
"DeepseekV3ForCausalLM": _HfExamplesInfo("deepseek-ai/DeepSeek-V3", # noqa: E501
|
||||||
trust_remote_code=True),
|
trust_remote_code=True),
|
||||||
"Ernie4_5_ForCausalLM": _HfExamplesInfo("baidu/ERNIE-4.5-0.3B-PT",
|
"Ernie4_5ForCausalLM": _HfExamplesInfo("baidu/ERNIE-4.5-0.3B-PT",
|
||||||
min_transformers_version="4.54"),
|
min_transformers_version="4.54"),
|
||||||
"Ernie4_5_MoeForCausalLM": _HfExamplesInfo("baidu/ERNIE-4.5-21B-A3B-PT",
|
"Ernie4_5_MoeForCausalLM": _HfExamplesInfo("baidu/ERNIE-4.5-21B-A3B-PT",
|
||||||
min_transformers_version="4.54"),
|
min_transformers_version="4.54"),
|
||||||
|
|||||||
@@ -28,7 +28,7 @@ from vllm.model_executor.models.llama import LlamaForCausalLM
|
|||||||
from .utils import PPMissingLayer
|
from .utils import PPMissingLayer
|
||||||
|
|
||||||
|
|
||||||
class Ernie4_5_ForCausalLM(LlamaForCausalLM):
|
class Ernie4_5ForCausalLM(LlamaForCausalLM):
|
||||||
|
|
||||||
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
|
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
|
||||||
super().__init__(vllm_config=vllm_config, prefix=prefix)
|
super().__init__(vllm_config=vllm_config, prefix=prefix)
|
||||||
|
|||||||
@@ -60,7 +60,7 @@ _TEXT_GENERATION_MODELS = {
|
|||||||
"DeepseekV2ForCausalLM": ("deepseek_v2", "DeepseekV2ForCausalLM"),
|
"DeepseekV2ForCausalLM": ("deepseek_v2", "DeepseekV2ForCausalLM"),
|
||||||
"DeepseekV3ForCausalLM": ("deepseek_v2", "DeepseekV3ForCausalLM"),
|
"DeepseekV3ForCausalLM": ("deepseek_v2", "DeepseekV3ForCausalLM"),
|
||||||
"Dots1ForCausalLM": ("dots1", "Dots1ForCausalLM"),
|
"Dots1ForCausalLM": ("dots1", "Dots1ForCausalLM"),
|
||||||
"Ernie4_5_ForCausalLM": ("ernie45", "Ernie4_5_ForCausalLM"),
|
"Ernie4_5ForCausalLM": ("ernie45", "Ernie4_5ForCausalLM"),
|
||||||
"Ernie4_5_MoeForCausalLM": ("ernie45_moe", "Ernie4_5_MoeForCausalLM"),
|
"Ernie4_5_MoeForCausalLM": ("ernie45_moe", "Ernie4_5_MoeForCausalLM"),
|
||||||
"ExaoneForCausalLM": ("exaone", "ExaoneForCausalLM"),
|
"ExaoneForCausalLM": ("exaone", "ExaoneForCausalLM"),
|
||||||
"Exaone4ForCausalLM": ("exaone4", "Exaone4ForCausalLM"),
|
"Exaone4ForCausalLM": ("exaone4", "Exaone4ForCausalLM"),
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user