[Bug Fix] Fix `naive_block_assignment` always defaulting to False due to arg misalignment (#33848)

Signed-off-by: Runkai Tao <rt572@physics.rutgers.edu>

[Bug Fix] Fix `naive_block_assignment` always defaulting to False due to arg misalignment (#33848)
Signed-off-by: Runkai Tao <rt572@physics.rutgers.edu>
e1d97c38 · Runkai Tao · GitHub · ec12d39d · e1d97c38 · e1d97c38
Unverified commit e1d97c38, authored Feb 11, 2026 by Runkai Tao; committed by GitHub on Feb 12, 2026
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 2 additions and 1 deletion

vllm/lora/layers/fused_moe.py vllm/lora/layers/fused_moe.py +1 -1

vllm/lora/punica_wrapper/punica_base.py vllm/lora/punica_wrapper/punica_base.py +1 -0

No files found.
--- a/vllm/lora/layers/fused_moe.py
+++ b/vllm/lora/layers/fused_moe.py
@@ -219,7 +219,7 @@ class FusedMoEWithLoRA(BaseLayerWithLoRA):
                    self.max_loras,
                    self.adapter_enabled,
                    expert_map,
-                    naive_block_assignment,
+                    naive_block_assignment=naive_block_assignment,
                )
                moe_state_dict["sorted_token_ids_lora"] = sorted_token_ids_lora

--- a/vllm/lora/punica_wrapper/punica_base.py
+++ b/vllm/lora/punica_wrapper/punica_base.py
@@ -458,6 +458,7 @@ class PunicaWrapperBase(PunicaWrapperABC):
        adapter_enabled: torch.Tensor,
        expert_map: torch.Tensor | None = None,
        pad_sorted_ids: bool = False,
+        naive_block_assignment: bool = False,
    ) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor]:
        """
        Aligns tokens and experts into block-sized chunks for LoRA-based