mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-20 11:17:00 +08:00
Fix torch version check for SM100 mxfp4 (#22535)
Signed-off-by: Zifei Tong <zifeitong@gmail.com> Signed-off-by: mgoin <mgoin64@gmail.com> Co-authored-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
parent
422f22e012
commit
6534d2fc97
@ -741,12 +741,14 @@ class FusedMoE(torch.nn.Module):
|
|||||||
|
|
||||||
# we padding globally so EP buffer allocation works
|
# we padding globally so EP buffer allocation works
|
||||||
if quant_config and quant_config.get_name() == "mxfp4":
|
if quant_config and quant_config.get_name() == "mxfp4":
|
||||||
if not is_torch_equal_or_newer("2.8.0"):
|
if not current_platform.is_device_capability(100):
|
||||||
raise RuntimeError("Mxfp4 on hopper requires torch >= 2.8.0")
|
if not is_torch_equal_or_newer("2.8.0"):
|
||||||
if current_platform.is_device_capability(
|
raise RuntimeError(
|
||||||
90) and not has_triton_kernels():
|
"Mxfp4 on non-blackwell requires torch >= 2.8.0")
|
||||||
raise NotImplementedError(
|
if not has_triton_kernels():
|
||||||
"Triton kernels must be installed for mxfp4 on hopper")
|
raise NotImplementedError(
|
||||||
|
"triton_kernels must be installed for "
|
||||||
|
"mxfp4 on non-blackwell")
|
||||||
if (current_platform.is_rocm()
|
if (current_platform.is_rocm()
|
||||||
or envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8
|
or envs.VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8
|
||||||
or envs.VLLM_USE_FLASHINFER_MOE_MXFP4_BF16):
|
or envs.VLLM_USE_FLASHINFER_MOE_MXFP4_BF16):
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user