mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-13 07:17:03 +08:00
[Bugfix] Fix typo in Pallas backend (#5558)
This commit is contained in:
parent
e2afb03c92
commit
28c145eb57
@@ -110,7 +110,7 @@ class PallasAttentionBackendImpl(AttentionImpl):
|
||||
raise NotImplementedError("TPU version must be 4 or higher.")
|
||||
|
||||
self.megacore_mode = None
|
||||
- tpu_type = torch_xla.tpu.get_tp_groupu_env()["TYPE"].lower()
|
||||
+ tpu_type = torch_xla.tpu.get_tpu_env()["TYPE"].lower()
|
||||
if not tpu_type.endswith("lite"):
|
||||
if self.num_kv_heads % 2 == 0:
|
||||
self.megacore_mode = "kv_head"
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user