Unverified commit 0c48b37c, authored by Philipp Moritz, committed by GitHub
Browse files
parent 7eacffd9
...@@ -175,7 +175,8 @@ class LlamaDecoderLayer(nn.Module): ...@@ -175,7 +175,8 @@ class LlamaDecoderLayer(nn.Module):
self.self_attn = LlamaAttention( self.self_attn = LlamaAttention(
hidden_size=self.hidden_size, hidden_size=self.hidden_size,
num_heads=config.num_attention_heads, num_heads=config.num_attention_heads,
num_kv_heads=config.num_key_value_heads, num_kv_heads=getattr(config, "num_key_value_heads",
config.num_attention_heads),
rope_theta=rope_theta, rope_theta=rope_theta,
rope_scaling=rope_scaling, rope_scaling=rope_scaling,
max_position_embeddings=max_position_embeddings, max_position_embeddings=max_position_embeddings,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment