{
  "abhigoyal/vllm-medusa-llama-68m-random": {
    "architectures": [
      "MedusaModel"
    ],
    "model_type": "medusa",
    "text_model_type": "medusa",
    "hidden_size": 768,
    "total_num_hidden_layers": 1,
    "total_num_attention_heads": 0,
    "head_size": "Error: integer division or modulo by zero",
    "vocab_size": 32000,
    "total_num_kv_heads": 0,
    "num_experts": 0,
    "is_deepseek_mla": false,
    "is_multimodal_model": false,
    "dtype": "torch.float32"
  },
  "luccafong/deepseek_mtp_draft_random": {
    "architectures": [
      "DeepSeekMTPModel"
    ],
    "model_type": "deepseek_mtp",
    "text_model_type": "deepseek_mtp",
    "hidden_size": 2560,
    "total_num_hidden_layers": 1,
    "total_num_attention_heads": 32,
    "head_size": 576,
    "vocab_size": 129280,
    "total_num_kv_heads": 32,
    "num_experts": 72,
    "is_deepseek_mla": true,
    "is_multimodal_model": false,
    "dtype": "torch.bfloat16"
  },
  "eagle618/eagle-deepseek-v3-random": {
    "architectures": [
      "EagleDeepSeekMTPModel"
    ],
    "model_type": "eagle",
    "text_model_type": "deepseek_mtp",
    "hidden_size": 2560,
    "total_num_hidden_layers": 1,
    "total_num_attention_heads": 32,
    "head_size": 576,
    "vocab_size": 129280,
    "total_num_kv_heads": 32,
    "num_experts": 72,
    "is_deepseek_mla": true,
    "is_multimodal_model": false,
    "dtype": "bfloat16"
  },
  "yuhuili/EAGLE-LLaMA3-Instruct-8B": {
    "architectures": [
      "EagleLlamaForCausalLM"
    ],
    "model_type": "eagle",
    "text_model_type": "llama",
    "hidden_size": 4096,
    "total_num_hidden_layers": 1,
    "total_num_attention_heads": 32,
    "head_size": 128,
    "vocab_size": 128256,
    "total_num_kv_heads": 8,
    "num_experts": 0,
    "is_deepseek_mla": false,
    "is_multimodal_model": false,
    "dtype": "float16"
  },
  "yuhuili/EAGLE3-LLaMA3.1-Instruct-8B": {
    "architectures": [
      "Eagle3LlamaForCausalLM"
    ],
    "model_type": "eagle",
    "text_model_type": "llama",
    "hidden_size": 4096,
    "total_num_hidden_layers": 1,
    "total_num_attention_heads": 32,
    "head_size": 128,
    "vocab_size": 128256,
    "total_num_kv_heads": 8,
    "num_experts": 0,
    "is_deepseek_mla": false,
    "is_multimodal_model": false,
    "dtype": "float16"
  }
}