mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-11 06:45:01 +08:00
[Bug] DeepGemm: Fix TypeError: per_block_cast_to_fp8() missing 1 required positional argument: 'use_ue8m0' for SM100 (#21187)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
468e2400fe
commit
37bd8d6e4c
@ -99,7 +99,7 @@ def fp8_m_grouped_gemm_nt_masked(*args, **kwargs):
|
||||
|
||||
def per_block_cast_to_fp8(x, *args, **kwargs):
    """Dispatch ``per_block_cast_to_fp8`` to the implementation in use.

    When ``_per_block_cast_impl`` is set and ``is_blackwell_deep_gemm_used()``
    is true, ``x`` is handed to that implementation with ``use_ue8m0=True``;
    ``*args`` and ``**kwargs`` are not forwarded on that path. Otherwise the
    call falls back to the helper in ``tests.kernels.quant_utils`` and
    forwards every argument unchanged.

    Args:
        x: Input forwarded to the selected implementation.
        *args: Extra positional arguments, used by the fallback path only.
        **kwargs: Extra keyword arguments, used by the fallback path only.

    Returns:
        Whatever the selected implementation returns.
    """
    if _per_block_cast_impl is not None and is_blackwell_deep_gemm_used():
        # The implementation requires `use_ue8m0`; calling it with `x` alone
        # raises "TypeError: per_block_cast_to_fp8() missing 1 required
        # positional argument: 'use_ue8m0'" on SM100.
        return _per_block_cast_impl(x, use_ue8m0=True)

    # TODO: refactor the `per_block_cast_to_fp8` from tests to vllm utils
    # Imported lazily so the tests package is only needed on the fallback path.
    from tests.kernels.quant_utils import per_block_cast_to_fp8 as _pbcf

    return _pbcf(x, *args, **kwargs)
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user