#pragma once #ifndef USE_ROCM #include #if CUB_VERSION >= 200800 #include using CubAddOp = cuda::std::plus<>; using CubMaxOp = cuda::maximum<>; #else // if CUB_VERSION < 200800 using CubAddOp = cub::Sum; using CubMaxOp = cub::Max; #endif // CUB_VERSION #else #include using CubAddOp = cub::Sum; using CubMaxOp = cub::Max; #endif // USE_ROCM