mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-23 16:04:27 +08:00
[MISC] replace c10::optional with std::optional (#25602)
Signed-off-by: Shiyan Deng <dsy842974287@meta.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
7319686692
commit
b95429c920
@ -6,11 +6,11 @@ torch::Tensor LLMM1(at::Tensor& in_a, at::Tensor& in_b,
|
|||||||
const int64_t rows_per_block);
|
const int64_t rows_per_block);
|
||||||
|
|
||||||
torch::Tensor wvSplitK(const at::Tensor& in_a, const at::Tensor& in_b,
|
torch::Tensor wvSplitK(const at::Tensor& in_a, const at::Tensor& in_b,
|
||||||
const c10::optional<at::Tensor>& in_bias,
|
const std::optional<at::Tensor>& in_bias,
|
||||||
const int64_t CuCount);
|
const int64_t CuCount);
|
||||||
|
|
||||||
void wvSplitKQ(const at::Tensor& in_a, const at::Tensor& in_b,
|
void wvSplitKQ(const at::Tensor& in_a, const at::Tensor& in_b,
|
||||||
const c10::optional<at::Tensor>& in_bias, at::Tensor& out_c,
|
const std::optional<at::Tensor>& in_bias, at::Tensor& out_c,
|
||||||
const at::Tensor& scale_a, const at::Tensor& scale_b,
|
const at::Tensor& scale_a, const at::Tensor& scale_b,
|
||||||
const int64_t CuCount);
|
const int64_t CuCount);
|
||||||
|
|
||||||
|
|||||||
@ -1271,7 +1271,7 @@ int mindiv(int N, int div1, int div2) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
torch::Tensor wvSplitK(const at::Tensor& in_a, const at::Tensor& in_b,
|
torch::Tensor wvSplitK(const at::Tensor& in_a, const at::Tensor& in_b,
|
||||||
const c10::optional<at::Tensor>& in_bias,
|
const std::optional<at::Tensor>& in_bias,
|
||||||
const int64_t CuCount) {
|
const int64_t CuCount) {
|
||||||
auto M_in = in_a.size(0);
|
auto M_in = in_a.size(0);
|
||||||
auto K_in = in_a.size(1);
|
auto K_in = in_a.size(1);
|
||||||
@ -1729,7 +1729,7 @@ __global__ void wvSplitKQ_hf_(const int K, const int Kp, const int M,
|
|||||||
#endif // defined(__HIP__MI3XX__) TODO: Add NAVI support
|
#endif // defined(__HIP__MI3XX__) TODO: Add NAVI support
|
||||||
|
|
||||||
void wvSplitKQ(const at::Tensor& in_a, const at::Tensor& in_b,
|
void wvSplitKQ(const at::Tensor& in_a, const at::Tensor& in_b,
|
||||||
const c10::optional<at::Tensor>& in_bias, at::Tensor& out_c,
|
const std::optional<at::Tensor>& in_bias, at::Tensor& out_c,
|
||||||
const at::Tensor& scale_a, const at::Tensor& scale_b,
|
const at::Tensor& scale_a, const at::Tensor& scale_b,
|
||||||
const int64_t CuCount) {
|
const int64_t CuCount) {
|
||||||
static c10::ScalarType kFp8Type = is_fp8_ocp()
|
static c10::ScalarType kFp8Type = is_fp8_ocp()
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user