mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-20 04:54:26 +08:00
Merge 1c13c28087de72432b092836fa28694f0efbe801 into 254f6b986720c92ddf97fbb1a6a6465da8e87e29
This commit is contained in:
commit
de99c56dc5
@@ -1708,7 +1708,11 @@ class GPUModelRunner(
     _get_block_table_and_slot_mapping(kv_cache_gid)
 )

-if self.speculative_config and spec_decode_common_attn_metadata is None:
+if (
+    self.speculative_config
+    and spec_decode_common_attn_metadata is None
+    and hasattr(self, "drafter")
+):
     if isinstance(self.drafter, EagleProposer):
         if self.drafter.attn_layer_names[0] in kv_cache_group.layer_names:
             spec_decode_common_attn_metadata = cm
Loading…
x
Reference in New Issue
Block a user