mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-04 00:49:10 +08:00
11 lines
423 B
Plaintext
11 lines
423 B
Plaintext
Meta-Llama-3-8B-Instruct.yaml
|
|
Meta-Llama-3-8B-Instruct-FP8.yaml
|
|
Meta-Llama-3-8B-Instruct-FP8-compressed-tensors.yaml
|
|
Meta-Llama-3-8B-Instruct-INT8-compressed-tensors.yaml
|
|
Meta-Llama-3-8B-Instruct-nonuniform-compressed-tensors.yaml
|
|
Meta-Llama-3-8B-Instruct-Channelwise-compressed-tensors.yaml
|
|
Minitron-4B-Base-FP8.yaml
|
|
Qwen2-1.5B-Instruct-INT8-compressed-tensors.yaml
|
|
Qwen2-1.5B-Instruct-FP8W8.yaml
|
|
Meta-Llama-3-8B-QQQ.yaml
|