mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 17:25:01 +08:00
Signed-off-by: Roger Wang <ywang@roblox.com>
This commit is contained in:
parent
78ac0f591d
commit
82e0d601fc
@ -31,7 +31,8 @@ void cutlass_scaled_fp4_mm(torch::Tensor& D, torch::Tensor const& A,
|
|||||||
#if defined ENABLE_NVFP4 && ENABLE_NVFP4
|
#if defined ENABLE_NVFP4 && ENABLE_NVFP4
|
||||||
return cutlass_scaled_fp4_mm_sm100a(D, A, B, A_sf, B_sf, alpha);
|
return cutlass_scaled_fp4_mm_sm100a(D, A, B, A_sf, B_sf, alpha);
|
||||||
#endif
|
#endif
|
||||||
TORCH_CHECK_NOT_IMPLEMENTED(false, "No compiled nvfp4 mm kernel, vLLM should "
|
TORCH_CHECK_NOT_IMPLEMENTED(false,
|
||||||
|
"No compiled nvfp4 mm kernel, vLLM should "
|
||||||
"be compiled using CUDA 12.8 and target "
|
"be compiled using CUDA 12.8 and target "
|
||||||
"compute capability 100 or above.");
|
"compute capability 100 or above.");
|
||||||
}
|
}
|
||||||
|
|||||||
@ -194,7 +194,8 @@ void runGemm(at::Tensor& D, at::Tensor const& A, at::Tensor const& B,
|
|||||||
at::Tensor const& A_sf, at::Tensor const& B_sf,
|
at::Tensor const& A_sf, at::Tensor const& B_sf,
|
||||||
at::Tensor const& alpha, int64_t m, int64_t n, int64_t k,
|
at::Tensor const& alpha, int64_t m, int64_t n, int64_t k,
|
||||||
cudaStream_t stream) {
|
cudaStream_t stream) {
|
||||||
TORCH_CHECK(false, "Unsupported CUTLASS version. Set VLLM_CUTLASS_SRC_DIR to "
|
TORCH_CHECK(false,
|
||||||
|
"Unsupported CUTLASS version. Set VLLM_CUTLASS_SRC_DIR to "
|
||||||
"a CUTLASS 3.8 source directory to enable support.");
|
"a CUTLASS 3.8 source directory to enable support.");
|
||||||
}
|
}
|
||||||
#endif // defined(CUTLASS_ARCH_MMA_SM100_SUPPORTED)
|
#endif // defined(CUTLASS_ARCH_MMA_SM100_SUPPORTED)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user