mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 08:04:58 +08:00
fix stablelm.py tensor-parallel-size bug (#2482)
This commit is contained in:
parent
d10f8e1d43
commit
8a25d3a71a
@@ -99,7 +99,7 @@ class StablelmAttention(nn.Module):
|
||||
self.q_size = self.num_heads * self.head_dim
|
||||
self.kv_size = self.num_key_value_heads * self.head_dim
|
||||
|
||||
- if (self.head_dim * self.num_heads) != self.hidden_size:
|
||||
+ if (self.head_dim * self.num_heads * tp_size) != self.hidden_size:
|
||||
raise ValueError(
|
||||
f"hidden_size must be divisible by num_heads (got `hidden_size`: {self.hidden_size}"
|
||||
f" and `num_heads`: {self.num_heads}).")
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user