mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 05:25:00 +08:00
[Bugfix][W8A8] fixed cutlass block fp8 binding (#14796)
This commit is contained in:
parent
c77620d22d
commit
40253bab44
@@ -370,7 +370,7 @@ TORCH_LIBRARY_EXPAND(TORCH_EXTENSION_NAME, ops) {
|
|||||||
"cutlass_scaled_mm_supports_block_fp8(int cuda_device_capability) -> "
|
"cutlass_scaled_mm_supports_block_fp8(int cuda_device_capability) -> "
|
||||||
"bool");
|
"bool");
|
||||||
ops.impl("cutlass_scaled_mm_supports_block_fp8",
|
ops.impl("cutlass_scaled_mm_supports_block_fp8",
|
||||||
&cutlass_scaled_mm_supports_fp8);
|
&cutlass_scaled_mm_supports_block_fp8);
|
||||||
|
|
||||||
// Check if cutlass sparse scaled_mm is supported for CUDA devices of the
|
// Check if cutlass sparse scaled_mm is supported for CUDA devices of the
|
||||||
// given capability
|
// given capability
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user