mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-23 18:44:30 +08:00
[Bugfix] Move flashinfer kernel check into `__init__` function of `FusedMoE` (#29018)
Signed-off-by: Max Hu <hyoung2991@gmail.com>
This commit is contained in:
parent
8f4f77a727
commit
cb0a7b4bea
@@ -574,6 +574,9 @@ class FusedMoE(CustomOp):
|
||||
is_act_and_mul=is_act_and_mul,
|
||||
is_lora_enabled=vllm_config.lora_config is not None,
|
||||
)
|
||||
self.moe_config_use_flashinfer_cutlass_kernels = (
|
||||
self.moe_config.use_flashinfer_cutlass_kernels
|
||||
)
|
||||
|
||||
self.quant_config = quant_config
|
||||
|
||||
@@ -728,7 +731,7 @@ class FusedMoE(CustomOp):
|
||||
return (
|
||||
self.moe_quant_config is not None
|
||||
and self.moe_quant_config.quant_dtype == "nvfp4"
|
||||
and self.moe_config.use_flashinfer_cutlass_kernels
|
||||
and self.moe_config_use_flashinfer_cutlass_kernels
|
||||
)
|
||||
|
||||
@property
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user