"tests/vscode:/vscode.git/clone" did not exist on "0a08d41961220887c97074dcd585e52bba9f6220"
Commit 25e10153 authored by Po Yen Chen
Browse files

Re-arrange V tile move_tile_window() statement

parent b102083b
...@@ -448,6 +448,7 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS ...@@ -448,6 +448,7 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
}); });
} }
} }
__builtin_amdgcn_sched_barrier(0); __builtin_amdgcn_sched_barrier(0);
// move K tile window // move K tile window
i_page_block_k = k_page_block_navigator.move_tile_window( i_page_block_k = k_page_block_navigator.move_tile_window(
...@@ -466,6 +467,12 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS ...@@ -466,6 +467,12 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
tile_elementwise_inout( tile_elementwise_inout(
[](auto& e0, auto e1, auto e2) { e0 = max(e1, e2); }, m, m_old, m_local); // m{j} [](auto& e0, auto e1, auto e2) { e0 = max(e1, e2); }, m, m_old, m_local); // m{j}
__builtin_amdgcn_sched_barrier(0);
// move V tile window
i_page_block_v = v_page_block_navigator.move_tile_window(
i_page_block_v, v_dram_block_window, {0, kN0});
__builtin_amdgcn_sched_barrier(0);
auto p_compute = make_static_distributed_tensor<SMPLComputeDataType>( auto p_compute = make_static_distributed_tensor<SMPLComputeDataType>(
s.get_tile_distribution()); // Pcompute{j} s.get_tile_distribution()); // Pcompute{j}
...@@ -565,12 +572,6 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS ...@@ -565,12 +572,6 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
const auto p = const auto p =
cast_tile<PDataType>(tile_elementwise_in(p_compute_element_func, p_compute)); cast_tile<PDataType>(tile_elementwise_in(p_compute_element_func, p_compute));
__builtin_amdgcn_sched_barrier(0);
// move V tile window
i_page_block_v = v_page_block_navigator.move_tile_window(
i_page_block_v, v_dram_block_window, {0, kN0});
__builtin_amdgcn_sched_barrier(0);
// STAGE 3, KV gemm // STAGE 3, KV gemm
if constexpr(k1_loops > 1) if constexpr(k1_loops > 1)
{ {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment