mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-08 23:58:02 +08:00
[Bugfix][ROCm] Fix uninitialized prefix_scheduler_metadata variable
The prefix_scheduler_metadata variable was only initialized in the else branch of the use_cascade check, causing an UnboundLocalError when use_cascade was True. Move the initialization before the if/else block to ensure the variable is always defined. Signed-off-by: c0de128 <kevin.mckay@outlook.com>
This commit is contained in:
parent
19cc9468fd
commit
e85f4a3686
@@ -116,6 +116,7 @@ class RocmAttentionMetadataBuilder(AttentionMetadataBuilder[RocmAttentionMetadat
|
|||||||
slot_mapping = common_attn_metadata.slot_mapping
|
slot_mapping = common_attn_metadata.slot_mapping
|
||||||
|
|
||||||
use_cascade = common_prefix_len > 0
|
use_cascade = common_prefix_len > 0
|
||||||
|
prefix_scheduler_metadata = None
|
||||||
|
|
||||||
if use_cascade:
|
if use_cascade:
|
||||||
cu_prefix_query_lens = torch.tensor(
|
cu_prefix_query_lens = torch.tensor(
|
||||||
@@ -130,7 +131,6 @@ class RocmAttentionMetadataBuilder(AttentionMetadataBuilder[RocmAttentionMetadat
|
|||||||
cu_prefix_query_lens = None
|
cu_prefix_query_lens = None
|
||||||
prefix_kv_lens = None
|
prefix_kv_lens = None
|
||||||
suffix_kv_lens = None
|
suffix_kv_lens = None
|
||||||
prefix_scheduler_metadata = None
|
|
||||||
|
|
||||||
attn_metadata = RocmAttentionMetadata(
|
attn_metadata = RocmAttentionMetadata(
|
||||||
num_actual_tokens=num_actual_tokens,
|
num_actual_tokens=num_actual_tokens,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user