Unverified commit 4729b908, authored by Aaron Hao and committed by GitHub
Browse files

[Bug] Add e_score_correction_bias to SKIP_TENSORS (#38746)


Signed-off-by: ahao-anyscale <ahao@anyscale.com>
parent 8b141ed8
...@@ -14,6 +14,7 @@ from vllm.model_executor.layers.quantization.base_config import QuantizeMethodBa ...@@ -14,6 +14,7 @@ from vllm.model_executor.layers.quantization.base_config import QuantizeMethodBa
from vllm.model_executor.model_loader.weight_utils import default_weight_loader from vllm.model_executor.model_loader.weight_utils import default_weight_loader
from .meta import ( from .meta import (
SKIP_TENSORS,
capture_layer_to_meta, capture_layer_to_meta,
get_numel_loaded, get_numel_loaded,
materialize_layer, materialize_layer,
...@@ -124,6 +125,8 @@ def initialize_online_processing(layer: torch.nn.Module): ...@@ -124,6 +125,8 @@ def initialize_online_processing(layer: torch.nn.Module):
# Wrap each parameter's weight loader # Wrap each parameter's weight loader
# Note that nested wrapping will occur for shared tensors # Note that nested wrapping will occur for shared tensors
for name, tensor in get_layer_tensors(layer).items(): for name, tensor in get_layer_tensors(layer).items():
if name in SKIP_TENSORS:
continue
if _get_weight_loader(tensor).__name__ != "online_process_loader": if _get_weight_loader(tensor).__name__ != "online_process_loader":
tensor.weight_loader = make_online_process_loader(layer, name) tensor.weight_loader = make_online_process_loader(layer, name)
......
...@@ -27,6 +27,7 @@ SKIP_TENSORS: set[str] = { ...@@ -27,6 +27,7 @@ SKIP_TENSORS: set[str] = {
"expert_global_to_physical", "expert_global_to_physical",
"expert_physical_to_global", "expert_physical_to_global",
"expert_local_to_global", "expert_local_to_global",
"e_score_correction_bias",
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment