This commit is contained in:
Philipp Moritz 2024-02-13 18:01:15 -08:00 committed by GitHub
parent 7eacffd951
commit 0c48b37c31
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -175,7 +175,8 @@ class LlamaDecoderLayer(nn.Module):
self.self_attn = LlamaAttention(
hidden_size=self.hidden_size,
num_heads=config.num_attention_heads,
-num_kv_heads=config.num_key_value_heads,
+num_kv_heads=getattr(config, "num_key_value_heads",
+config.num_attention_heads),
rope_theta=rope_theta,
rope_scaling=rope_scaling,
max_position_embeddings=max_position_embeddings,