[Bugfix] Gemma4: fix multimodal embedder norm order to match HF reference (#40411)

Signed-off-by: Luciano Martins <lucianommartins@users.noreply.github.com>
Co-authored-by: Luciano Martins <lucianommartins@users.noreply.github.com>

[Bugfix] Gemma4: fix multimodal embedder norm order to match HF reference (#40411)
Signed-off-by: Luciano Martins <lucianommartins@users.noreply.github.com>
Co-authored-by: Luciano Martins <lucianommartins@users.noreply.github.com>
20d37434 · Luciano Martins · GitHub · 18563f20 · 20d37434
Unverified commit 20d37434, authored Apr 20, 2026 by Luciano Martins; committed by GitHub on Apr 21, 2026.
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 9 additions and 8 deletions

vllm/model_executor/models/gemma4_mm.py vllm/model_executor/models/gemma4_mm.py +9 -8

No files found.
--- a/vllm/model_executor/models/gemma4_mm.py
+++ b/vllm/model_executor/models/gemma4_mm.py
@@ -849,22 +849,23 @@ class Gemma4MultimodalEmbedder(nn.Module):
            or multimodal_config.hidden_size
        )
-        self.embedding_projection = ReplicatedLinear(
+        self.embedding_pre_projection_norm = RMSNorm(
            embedding_dim,
-            self.text_hidden_size,
+            eps=self.eps,
-            bias=False,
+            has_weight=False,
        )
-        self.embedding_post_projection_norm = RMSNorm(
+        self.embedding_projection = ReplicatedLinear(
+            embedding_dim,
            self.text_hidden_size,
-            eps=self.eps,
+            bias=False,
-            has_weight=False,
        )
    def forward(self, inputs_embeds: torch.Tensor) -> torch.Tensor:
        """Project soft tokens from a multimodal tower into LM space."""
-        embs_proj, _ = self.embedding_projection(inputs_embeds)
+        embs_normed = self.embedding_pre_projection_norm(inputs_embeds)
-        return self.embedding_post_projection_norm(embs_proj)
+        embs_proj, _ = self.embedding_projection(embs_normed)
+        return embs_proj
 # ---------------------------------------------------------------------------