mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-01 17:07:06 +08:00
Merge b6520e5ec6e0aad1bec5b7d142f1e05d26c7849c into 254f6b986720c92ddf97fbb1a6a6465da8e87e29
This commit is contained in:
commit
1ab2ef6ebc
@ -10,6 +10,10 @@ def is_quant_method_supported(quant_method: str) -> bool:
|
|||||||
if not (current_platform.is_cuda() or current_platform.is_rocm()):
|
if not (current_platform.is_cuda() or current_platform.is_rocm()):
|
||||||
return False
|
return False
|
||||||
|
|
||||||
|
# RTN quantization is currently not supported on ROCm
|
||||||
|
if current_platform.is_rocm() and quant_method == "rtn":
|
||||||
|
return False
|
||||||
|
|
||||||
capability = current_platform.get_device_capability()
|
capability = current_platform.get_device_capability()
|
||||||
assert capability is not None
|
assert capability is not None
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user