update mlp

741dbbbb · zhuwenwen · 9d5e4dd9 · 741dbbbb
Commit 741dbbbb authored Jul 31, 2025 by zhuwenwen
Show whitespace changes
Inline Side-by-side

Showing with 2 additions and 1 deletion

vllm/model_executor/models/mlp_speculator.py +2 -1

No files found.
--- a/vllm/model_executor/models/mlp_speculator.py
+++ b/vllm/model_executor/models/mlp_speculator.py
@@ -19,6 +19,7 @@ from vllm.model_executor.layers.linear import ColumnParallelLinear
 from vllm.model_executor.model_loader.weight_utils import default_weight_loader
 from vllm import _custom_ops as ops
 from vllm.distributed import tensor_model_parallel_all_gather, tensor_model_parallel_gather
+from vllm import envs

 SQRT2 = 2**0.5

@@ -215,7 +216,7 @@ class MLPSpeculator(nn.Module):
                weight_loader(param, loaded_weight)
                loaded_params.add(name)

-                if self.use_llama_nn:
+                if self.use_llama_nn or envs.VLLM_USE_NN:
                    if (os.environ['LM_NN'] == '1' and "head" in name) or "proj" in name:
                        _weight = torch.zeros_like(param.data)
                        ori_shape =_weight.shape