Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
25e10153
"tests/vscode:/vscode.git/clone" did not exist on "0a08d41961220887c97074dcd585e52bba9f6220"
Commit
25e10153
authored
Jan 01, 2025
by
Po Yen Chen
Browse files
Re-arrange V tile move_tile_window() statement
parent
b102083b
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
7 additions
and
6 deletions
+7
-6
include/ck_tile/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_qr_ks_vs.hpp
...mha/pipeline/block_fmha_fwd_splitkv_pipeline_qr_ks_vs.hpp
+7
-6
No files found.
include/ck_tile/ops/fmha/pipeline/block_fmha_fwd_splitkv_pipeline_qr_ks_vs.hpp
View file @
25e10153
...
@@ -448,6 +448,7 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
...
@@ -448,6 +448,7 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
});
});
}
}
}
}
__builtin_amdgcn_sched_barrier
(
0
);
__builtin_amdgcn_sched_barrier
(
0
);
// move K tile window
// move K tile window
i_page_block_k
=
k_page_block_navigator
.
move_tile_window
(
i_page_block_k
=
k_page_block_navigator
.
move_tile_window
(
...
@@ -466,6 +467,12 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
...
@@ -466,6 +467,12 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
tile_elementwise_inout
(
tile_elementwise_inout
(
[](
auto
&
e0
,
auto
e1
,
auto
e2
)
{
e0
=
max
(
e1
,
e2
);
},
m
,
m_old
,
m_local
);
// m{j}
[](
auto
&
e0
,
auto
e1
,
auto
e2
)
{
e0
=
max
(
e1
,
e2
);
},
m
,
m_old
,
m_local
);
// m{j}
__builtin_amdgcn_sched_barrier
(
0
);
// move V tile window
i_page_block_v
=
v_page_block_navigator
.
move_tile_window
(
i_page_block_v
,
v_dram_block_window
,
{
0
,
kN0
});
__builtin_amdgcn_sched_barrier
(
0
);
auto
p_compute
=
make_static_distributed_tensor
<
SMPLComputeDataType
>
(
auto
p_compute
=
make_static_distributed_tensor
<
SMPLComputeDataType
>
(
s
.
get_tile_distribution
());
// Pcompute{j}
s
.
get_tile_distribution
());
// Pcompute{j}
...
@@ -565,12 +572,6 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
...
@@ -565,12 +572,6 @@ struct BlockFmhaFwdSplitKVPipelineQRKSVS
const
auto
p
=
const
auto
p
=
cast_tile
<
PDataType
>
(
tile_elementwise_in
(
p_compute_element_func
,
p_compute
));
cast_tile
<
PDataType
>
(
tile_elementwise_in
(
p_compute_element_func
,
p_compute
));
__builtin_amdgcn_sched_barrier
(
0
);
// move V tile window
i_page_block_v
=
v_page_block_navigator
.
move_tile_window
(
i_page_block_v
,
v_dram_block_window
,
{
0
,
kN0
});
__builtin_amdgcn_sched_barrier
(
0
);
// STAGE 3, KV gemm
// STAGE 3, KV gemm
if
constexpr
(
k1_loops
>
1
)
if
constexpr
(
k1_loops
>
1
)
{
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment