Fix bias in InternLM (#1501)

aa9af07c · Woosuk Kwon · GitHub · 69be658b · aa9af07c
Unverified commit aa9af07c, authored Oct 30, 2023 by Woosuk Kwon; committed by GitHub on Oct 29, 2023.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 4 additions and 2 deletions

vllm/model_executor/models/internlm.py (+4 -2)

No files found.
--- a/vllm/model_executor/models/internlm.py
+++ b/vllm/model_executor/models/internlm.py
@@ -62,6 +62,7 @@ class InternLMAttention(nn.Module):
        self,
        hidden_size: int,
        num_heads: int,
+        bias: bool,
        rope_theta: float = 10000,
        max_position_embeddings: int = 8192,
    ):
@@ -81,13 +82,13 @@ class InternLMAttention(nn.Module):
        self.qkv_proj = ColumnParallelLinear(
            hidden_size,
            3 * self.total_num_heads * self.head_dim,
-            bias=True,
+            bias=bias,
            gather_output=False,
        )
        self.o_proj = RowParallelLinear(
            self.total_num_heads * self.head_dim,
            hidden_size,
-            bias=True,
+            bias=bias,
            input_is_parallel=True,
        )
        self.attn = PagedAttentionWithRoPE(
@@ -126,6 +127,7 @@ class InternLMDecoderLayer(nn.Module):
        self.self_attn = InternLMAttention(
            hidden_size=self.hidden_size,
            num_heads=config.num_attention_heads,
+            bias=config.bias,
            rope_theta=rope_theta,
            max_position_embeddings=max_position_embeddings,
        )