Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
aca0c9e5
Commit
aca0c9e5
authored
Oct 21, 2024
by
rocking
Browse files
Support Repeat_M in distribution
parent
d7110645
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
6 additions
and
6 deletions
+6
-6
include/ck_tile/ops/layernorm2d/kernel/layernorm2d_fwd_shape.hpp
.../ck_tile/ops/layernorm2d/kernel/layernorm2d_fwd_shape.hpp
+2
-2
include/ck_tile/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_default_policy.hpp
...rm2d/pipeline/layernorm2d_fwd_pipeline_default_policy.hpp
+4
-4
No files found.
include/ck_tile/ops/layernorm2d/kernel/layernorm2d_fwd_shape.hpp
View file @
aca0c9e5
...
@@ -15,9 +15,9 @@ namespace ck_tile {
...
@@ -15,9 +15,9 @@ namespace ck_tile {
+<----------------------< Repeat_N(2)>--------------------->+
+<----------------------< Repeat_N(2)>--------------------->+
| |
| |
+<-- <WarpPerBlock_N(2)> -->+
+<-- <WarpPerBlock_N(2)> -->+
Warp_
M
Warp_
N
+--------------+--------------+--------------+--------------+----+----------------+
+--------------+--------------+--------------+--------------+----+----------------+
Warp_
N
| wrap_0 | wrap_1 | | ^ ^
Warp_
M
| wrap_0 | wrap_1 | | ^ ^
+--------------+--------------+ | <WarpPerBlock_M(2)> |
+--------------+--------------+ | <WarpPerBlock_M(2)> |
| wrap_2 | wrap_3 | | v
| wrap_2 | wrap_3 | | v
+--------------+--------------+--------------+--------------+----+ Block_M
+--------------+--------------+--------------+--------------+----+ Block_M
...
...
include/ck_tile/ops/layernorm2d/pipeline/layernorm2d_fwd_pipeline_default_policy.hpp
View file @
aca0c9e5
...
@@ -19,12 +19,12 @@ struct Layernorm2dFwdPipelineDefaultPolicy
...
@@ -19,12 +19,12 @@ struct Layernorm2dFwdPipelineDefaultPolicy
return
make_static_tile_distribution
(
return
make_static_tile_distribution
(
tile_distribution_encoding
<
tile_distribution_encoding
<
sequence
<>
,
sequence
<>
,
tuple
<
sequence
<
S
::
WarpPerBlock_M
,
S
::
ThreadPerWarp_M
,
S
::
Vector_M
>
,
tuple
<
sequence
<
S
::
Repeat_M
,
S
::
WarpPerBlock_M
,
S
::
ThreadPerWarp_M
,
S
::
Vector_M
>
,
sequence
<
S
::
Repeat_N
,
S
::
WarpPerBlock_N
,
S
::
ThreadPerWarp_N
,
S
::
Vector_N
>>
,
sequence
<
S
::
Repeat_N
,
S
::
WarpPerBlock_N
,
S
::
ThreadPerWarp_N
,
S
::
Vector_N
>>
,
tuple
<
sequence
<
1
,
2
>
,
sequence
<
1
,
2
>>
,
tuple
<
sequence
<
1
,
2
>
,
sequence
<
1
,
2
>>
,
tuple
<
sequence
<
0
,
1
>
,
sequence
<
1
,
2
>>
,
tuple
<
sequence
<
1
,
1
>
,
sequence
<
2
,
2
>>
,
sequence
<
1
,
2
,
2
>
,
sequence
<
1
,
1
,
2
,
2
>
,
sequence
<
2
,
0
,
3
>>
{});
sequence
<
0
,
3
,
0
,
3
>>
{});
}
}
template
<
typename
Problem
>
template
<
typename
Problem
>
CK_TILE_DEVICE
static
constexpr
auto
MakeGammaBetaBlockTileDistribution
()
CK_TILE_DEVICE
static
constexpr
auto
MakeGammaBetaBlockTileDistribution
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment