mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-20 14:37:04 +08:00
[rocm] enable torchao quantization for rocm (#24400)
Signed-off-by: Lifan Shen <lifans@meta.com>
This commit is contained in:
parent
492196ed0e
commit
d6069887c6
@ -171,7 +171,7 @@ class RocmPlatform(Platform):
|
|||||||
|
|
||||||
supported_quantization: list[str] = [
|
supported_quantization: list[str] = [
|
||||||
"awq", "gptq", "fp8", "compressed-tensors", "fbgemm_fp8", "gguf",
|
"awq", "gptq", "fp8", "compressed-tensors", "fbgemm_fp8", "gguf",
|
||||||
"quark", "ptpc_fp8", "mxfp4", "petit_nvfp4"
|
"quark", "ptpc_fp8", "mxfp4", "petit_nvfp4", "torchao"
|
||||||
]
|
]
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user