[Minor] Add comment on skipping rope caches (#2004)

24cde76a · Woosuk Kwon · GitHub · 1aa13615 · 24cde76a
Unverified commit 24cde76a, authored Dec 10, 2023 by Woosuk Kwon; committed by GitHub on Dec 10, 2023.
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 4 additions and 3 deletions

vllm/model_executor/models/llama.py vllm/model_executor/models/llama.py +4 -3

No files found.
--- a/vllm/model_executor/models/llama.py
+++ b/vllm/model_executor/models/llama.py
@@ -322,9 +322,10 @@ class LlamaForCausalLM(nn.Module):
                model_name_or_path, cache_dir, load_format, revision):
            if "rotary_emb.inv_freq" in name:
                continue
-            if "rotary_emb.cos_cached" in name:
-                continue
-            if "rotary_emb.sin_cached" in name:
+            if ("rotary_emb.cos_cached" in name
+                    or "rotary_emb.sin_cached" in name):
+                # Models trained using ColossalAI may include these tensors in
+                # the checkpoint. Skip them.
                continue
            for (param_name, weight_name, shard_id) in stacked_params_mapping:
                if weight_name not in name: