mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-09 21:15:41 +08:00
[Bugfix][kernels] Fix half2float conversion in gguf kernels (#15995)
Signed-off-by: Isotr0py <2037008807@qq.com>
This commit is contained in:
parent
0812d8dd41
commit
230b131b54
@ -1090,6 +1090,11 @@ __device__ __forceinline__ c10::BFloat16 convert_from_half<c10::BFloat16>(half v
|
|||||||
#endif // defined(__CUDA_ARCH__) && __CUDA_ARCH__ >= 800
|
#endif // defined(__CUDA_ARCH__) && __CUDA_ARCH__ >= 800
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template<>
|
||||||
|
__device__ __forceinline__ float convert_from_half<float>(half val) {
|
||||||
|
return __half2float(val);
|
||||||
|
}
|
||||||
|
|
||||||
#if defined(USE_ROCM)
|
#if defined(USE_ROCM)
|
||||||
|
|
||||||
#ifndef __has_builtin
|
#ifndef __has_builtin
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user