mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-22 16:31:19 +08:00
potential hang fix
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
parent
33f6aaf972
commit
db77f9b3a2
@@ -582,7 +582,9 @@ struct Sm100FmhaMlaKernelTmaWarpspecialized {
   auto problem_shape = params.problem_shape;
   auto local_split_kv = params.split_kv;
   if (params.mainloop.ptr_seq != nullptr) {
-    get<1>(problem_shape) = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    auto seqlen = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    if (seqlen == 0) continue;
+    get<1>(problem_shape) = seqlen;
     if (params.ptr_split_kv != nullptr) {
       local_split_kv = params.ptr_split_kv[get<2>(blk_coord)];
     }
@@ -607,7 +609,9 @@ struct Sm100FmhaMlaKernelTmaWarpspecialized {
   auto problem_shape = params.problem_shape;
   auto local_split_kv = params.split_kv;
   if (params.mainloop.ptr_seq != nullptr) {
-    get<1>(problem_shape) = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    auto seqlen = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    if (seqlen == 0) continue;
+    get<1>(problem_shape) = seqlen;
     if (params.ptr_split_kv != nullptr) {
       local_split_kv = params.ptr_split_kv[get<2>(blk_coord)];
     }
@@ -636,7 +640,9 @@ struct Sm100FmhaMlaKernelTmaWarpspecialized {
   auto problem_shape = params.problem_shape;
   auto local_split_kv = params.split_kv;
   if (params.mainloop.ptr_seq != nullptr) {
-    get<1>(problem_shape) = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    auto seqlen = params.mainloop.ptr_seq[get<2>(blk_coord)];
+    if (seqlen == 0) continue;
+    get<1>(problem_shape) = seqlen;
     if (params.ptr_split_kv != nullptr) {
       local_split_kv = params.ptr_split_kv[get<2>(blk_coord)];
     }
|
|||||||
Loading…
x
Reference in New Issue
Block a user