mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-26 12:57:13 +08:00
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
f38ee34a0a
commit
226b452a20
@ -20,7 +20,6 @@
|
|||||||
#include <ATen/cuda/CUDAContext.h>
|
#include <ATen/cuda/CUDAContext.h>
|
||||||
#include <c10/cuda/CUDAGuard.h>
|
#include <c10/cuda/CUDAGuard.h>
|
||||||
#include "../cuda_compat.h"
|
#include "../cuda_compat.h"
|
||||||
#include <cuda/std/functional>
|
|
||||||
|
|
||||||
#ifndef USE_ROCM
|
#ifndef USE_ROCM
|
||||||
#include <cub/util_type.cuh>
|
#include <cub/util_type.cuh>
|
||||||
@ -63,7 +62,7 @@ __launch_bounds__(TPB) __global__
|
|||||||
|
|
||||||
const int thread_row_offset = blockIdx.x * num_cols;
|
const int thread_row_offset = blockIdx.x * num_cols;
|
||||||
|
|
||||||
cuda::std::plus<float> sum;
|
cub::Sum sum;
|
||||||
float threadData(-FLT_MAX);
|
float threadData(-FLT_MAX);
|
||||||
|
|
||||||
// Don't touch finished rows.
|
// Don't touch finished rows.
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user