update vdim pad

1d57ec3d · zhuwenwen · 4564b2f5 · 1d57ec3d
Commit 1d57ec3d authored Apr 14, 2025 by zhuwenwen
Show whitespace changes
Inline Side-by-side

Showing with 1 addition and 1 deletion

vllm/attention/backends/mla/utils.py +1 -1

No files found.
--- a/vllm/attention/backends/mla/utils.py
+++ b/vllm/attention/backends/mla/utils.py
@@ -535,7 +535,7 @@ class MLACommonImpl(MLAAttentionImpl[T], Generic[T]):
        # v with 0s to match the qk head dim
        # v_padded = torch.nn.functional.pad(v, [0, q.shape[-1] - v.shape[-1]],
        #                                    value=0)
-        v_padded = torch.nn.functional.pad(v, [0, (q.shape[-1] - v.shape[-1]-32)],
+        v_padded = torch.nn.functional.pad(v, [0, q.shape[-1] - v.shape[-1]],
                                           value=0)
        if torch.cuda.get_device_properties(torch.cuda.current_device()).multi_processor_count == 120: