Unverified commit 5d8e1c92, authored by Antonio Gómez, committed by GitHub
Browse files

[Bugfix] Support triton==3.3.0+git95326d9f for RTX 5090 (Unsloth + vLLM compatibility) (#15471)


Co-authored-by: ServerAI <ai@exc-mad-ai.com>
parent 0a049c7d
...@@ -130,7 +130,7 @@ def do_expand_kernel( ...@@ -130,7 +130,7 @@ def do_expand_kernel(
# Identify A and B block pointers # Identify A and B block pointers
offset_k = tl.arange(0, BLOCK_K) offset_k = tl.arange(0, BLOCK_K)
a_ptr = (cur_input_ptr + ram[:, None] * input_d1_stride + a_ptr = (cur_input_ptr + ram[:, None] * input_d1_stride +
offset_k[None, :] * input_d2_stride, ) offset_k[None, :] * input_d2_stride)
b_ptr = (cur_lora_ptr + cur_lora_d0_stride * lora_index + b_ptr = (cur_lora_ptr + cur_lora_d0_stride * lora_index +
offset_k[:, None] * cur_lora_d2_stride + offset_k[:, None] * cur_lora_d2_stride +
rbn[None, :] * cur_lora_d1_stride) rbn[None, :] * cur_lora_d1_stride)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment