Commit 085c3454 authored by zhuwenwen
Browse files

update triton_decode_attention.py

parent 8b5a09f6
......@@ -1602,7 +1602,7 @@ def decode_attention_fwd(
logit_cap=logit_cap,
)
elif best_config['kernel_kind'] == 'v2_tc':
- decode_attention_v1(
+ decode_attention_v2(
q,
k_buffer,
v_buffer,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment