mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-01 05:57:04 +08:00
remove dtype_original_type
Signed-off-by: Xingyu Liu <charlotteliu12x@gmail.com>
This commit is contained in:
parent
9b19e3b94f
commit
0a4f4724ef
@ -14,8 +14,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"mosaicml/mpt-7b": {
|
"mosaicml/mpt-7b": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -32,8 +31,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"databricks/dbrx-instruct": {
|
"databricks/dbrx-instruct": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -50,8 +48,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"tiiuae/falcon-7b": {
|
"tiiuae/falcon-7b": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -68,8 +65,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"tiiuae/falcon-40b": {
|
"tiiuae/falcon-40b": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -86,8 +82,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"luccafong/deepseek_mtp_main_random": {
|
"luccafong/deepseek_mtp_main_random": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -104,8 +99,7 @@
|
|||||||
"num_experts": 72,
|
"num_experts": 72,
|
||||||
"is_deepseek_mla": true,
|
"is_deepseek_mla": true,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"luccafong/deepseek_mtp_draft_random": {
|
"luccafong/deepseek_mtp_draft_random": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -122,8 +116,7 @@
|
|||||||
"num_experts": 72,
|
"num_experts": 72,
|
||||||
"is_deepseek_mla": true,
|
"is_deepseek_mla": true,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"Qwen/Qwen3-Next-80B-A3B-Instruct": {
|
"Qwen/Qwen3-Next-80B-A3B-Instruct": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -140,8 +133,7 @@
|
|||||||
"num_experts": 512,
|
"num_experts": 512,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"tiny-random/qwen3-next-moe": {
|
"tiny-random/qwen3-next-moe": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -158,8 +150,7 @@
|
|||||||
"num_experts": 32,
|
"num_experts": 32,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"zai-org/GLM-4.5": {
|
"zai-org/GLM-4.5": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -176,8 +167,7 @@
|
|||||||
"num_experts": 160,
|
"num_experts": 160,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"baidu/ERNIE-4.5-21B-A3B-PT": {
|
"baidu/ERNIE-4.5-21B-A3B-PT": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -194,8 +184,7 @@
|
|||||||
"num_experts": 64,
|
"num_experts": 64,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"lmsys/gpt-oss-20b-bf16": {
|
"lmsys/gpt-oss-20b-bf16": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -212,8 +201,7 @@
|
|||||||
"num_experts": 32,
|
"num_experts": 32,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"deepseek-ai/DeepSeek-V3.2-Exp": {
|
"deepseek-ai/DeepSeek-V3.2-Exp": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -230,8 +218,7 @@
|
|||||||
"num_experts": 256,
|
"num_experts": 256,
|
||||||
"is_deepseek_mla": true,
|
"is_deepseek_mla": true,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"meta-llama/Llama-4-Scout-17B-16E-Instruct": {
|
"meta-llama/Llama-4-Scout-17B-16E-Instruct": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -248,8 +235,7 @@
|
|||||||
"num_experts": 16,
|
"num_experts": 16,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": true,
|
"is_multimodal_model": true,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"nvidia/Llama-3_3-Nemotron-Super-49B-v1": {
|
"nvidia/Llama-3_3-Nemotron-Super-49B-v1": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -266,8 +252,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"XiaomiMiMo/MiMo-7B-RL": {
|
"XiaomiMiMo/MiMo-7B-RL": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -284,8 +269,7 @@
|
|||||||
"num_experts": 0,
|
"num_experts": 0,
|
||||||
"is_deepseek_mla": false,
|
"is_deepseek_mla": false,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.bfloat16",
|
"dtype": "torch.bfloat16"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
},
|
},
|
||||||
"meituan-longcat/LongCat-Flash-Chat": {
|
"meituan-longcat/LongCat-Flash-Chat": {
|
||||||
"architectures": [
|
"architectures": [
|
||||||
@ -302,7 +286,6 @@
|
|||||||
"num_experts": 512,
|
"num_experts": 512,
|
||||||
"is_deepseek_mla": true,
|
"is_deepseek_mla": true,
|
||||||
"is_multimodal_model": false,
|
"is_multimodal_model": false,
|
||||||
"dtype": "torch.float32",
|
"dtype": "torch.float32"
|
||||||
"dtype_original_type": "torch.dtype"
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@ -3,8 +3,6 @@
|
|||||||
import json
|
import json
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
|
|
||||||
import torch
|
|
||||||
|
|
||||||
from vllm.config import ModelConfig
|
from vllm.config import ModelConfig
|
||||||
|
|
||||||
|
|
||||||
@ -67,12 +65,6 @@ def test_model_arch_config():
|
|||||||
|
|
||||||
dtype = model_arch_config.torch_dtype
|
dtype = model_arch_config.torch_dtype
|
||||||
assert str(dtype) == expected["dtype"]
|
assert str(dtype) == expected["dtype"]
|
||||||
if expected["dtype_original_type"] == "str":
|
|
||||||
assert isinstance(dtype, str)
|
|
||||||
elif expected["dtype_original_type"] == "torch.dtype":
|
|
||||||
assert isinstance(dtype, torch.dtype)
|
|
||||||
else:
|
|
||||||
raise ValueError(f"Unknown dtype_original_type: {expected['dtype']}")
|
|
||||||
|
|
||||||
# Test that model_config methods return expected values
|
# Test that model_config methods return expected values
|
||||||
assert model_config.architectures == expected["architectures"]
|
assert model_config.architectures == expected["architectures"]
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user