[Bugfix][Model] Make Olmo2Model weight loading return loaded weights (#18504)

Signed-off-by: Shane A <shanea@allenai.org>

[Bugfix][Model] Make Olmo2Model weight loading return loaded weights (#18504)
Signed-off-by: Shane A <shanea@allenai.org>
51797775 · Shane A · GitHub · cf5984b2 · 51797775
Unverified commit 51797775, authored May 21, 2025 by Shane A; committed by GitHub on May 21, 2025.
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 1 deletion

vllm/model_executor/models/olmo2.py vllm/model_executor/models/olmo2.py +5 -1

No files found.
--- a/vllm/model_executor/models/olmo2.py
+++ b/vllm/model_executor/models/olmo2.py
@@ -314,7 +314,8 @@ class Olmo2Model(nn.Module):
        hidden_states = self.norm(hidden_states)
        return hidden_states

-    def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]):
+    def load_weights(self, weights: Iterable[tuple[str,
+                                                   torch.Tensor]]) -> set[str]:
        stacked_params_mapping = [
            # (param_name, shard_name, shard_id)
            ("qkv_proj", "q_proj", "q"),
@@ -325,6 +326,7 @@ class Olmo2Model(nn.Module):
        ]

        params_dict = dict(self.named_parameters(remove_duplicate=False))
+        loaded_params: set[str] = set()
        for name, loaded_weight in weights:
            if is_pp_missing_parameter(name, self):
                continue
@@ -347,6 +349,8 @@ class Olmo2Model(nn.Module):
                weight_loader = getattr(param, "weight_loader",
                                        default_weight_loader)
                weight_loader(param, loaded_weight)
+            loaded_params.add(name)
+        return loaded_params


 class Olmo2ForCausalLM(nn.Module, SupportsPP):