mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 11:36:20 +08:00
[Hybrid] [Kernel] Fix chunk scan kernel when BLOCK_SIZE_DSTATE > 128 (#28295)
Signed-off-by: Thomas Parnell <tpa@zurich.ibm.com>
This commit is contained in:
parent
bf3ffb61e6
commit
e0c910bb89
@@ -245,7 +245,7 @@ def _chunk_scan_fwd_kernel(
 )
 if not HAS_INITSTATES and (seq_idx != seq_idx_prev):
     prev_states = tl.zeros(
-        (BLOCK_SIZE_DSTATE, BLOCK_SIZE_K), dtype=C_ptr.dtype.element_ty
+        (BLOCK_SIZE_K, BLOCK_SIZE_N), dtype=C_ptr.dtype.element_ty
     )
 else:
     prev_states = tl.load(
Loading…
x
Reference in New Issue
Block a user