Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
d846292c
"...composable_kernel.git" did not exist on "642d5e9155a16c96b01eee7b8ef0e9d558fc2e16"
Commit
d846292c
authored
Dec 12, 2024
by
letaoqin
Browse files
rewrite save o code
parent
15e76415
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
15 additions
and
16 deletions
+15
-16
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
...ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
+6
-8
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
...ed_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
+9
-8
No files found.
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
View file @
d846292c
...
...
@@ -306,25 +306,23 @@ struct FusedMoeGemmPipeline_General
make_tuple
(
number
<
32
>
{},
number
<
32
>
{}),
{
0
,
0
},
Policy
::
template
MakeGlobalTileDistribution_O
<
Problem
>());
ignore
=
o_alds_win
;
auto
save_o
=
[
&
]()
{
if
(
blockIdx
.
x
==
0
&&
(
blockIdx
.
y
==
0
||
blockIdx
.
y
==
1
)
&&
blockIdx
.
z
==
0
)
{
if
(
threadIdx
.
x
<
64
)
{
auto
o0
=
load_tile
(
o_olds_win
);
for
(
int
step
=
1
;
step
<
4
;
step
++
)
{
auto
o0
=
load_tile
(
o_olds_win
);
constexpr
index_t
thread_buffer_size
=
decltype
(
o0
)
::
get_thread_buffer_size
();
static_for
<
1
,
BlockShape
::
Repeat_K1
,
1
>
{}([
&
](
auto
)
{
move_tile_window
(
o_olds_win
,
{
32
,
0
});
auto
o1
=
load_tile
(
o_olds_win
);
for
(
int
i
=
0
;
i
<
16
;
i
++
)
{
static_for
<
0
,
thread_buffer_size
,
1
>
{}([
&
](
auto
i
)
{
o0
.
get_thread_buffer
()(
i
)
=
type_convert
<
ODataType
>
(
type_convert
<
float
>
(
o0
.
get_thread_buffer
()[
i
])
+
type_convert
<
float
>
(
o1
.
get_thread_buffer
()[
i
]));
}
}
}
);
}
);
update_tile
(
o_window_
,
o0
);
}
}
...
...
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
View file @
d846292c
...
...
@@ -216,14 +216,15 @@ struct FusedMoeGemmPipelineGeneralPolicy
typename
S_
::
WarpTile_0
>>
;
constexpr
auto
warp_gemm
=
GetWarpGemm0
<
Problem
>
();
using
BlockGemmPolicy
=
BlockGemmASmemBSmemCRegV1CustomPolicy
<
typename
Problem
::
ADataType
,
// using BlockGemmPolicy =
// BlockGemmASmemBRegCRegV1CustomPolicy<typename
// Problem::ADataType,
typename
Problem
::
GDataType
,
typename
Problem
::
AccDataType
,
typename
S_
::
WarpPerBlock_0
,
decltype
(
warp_gemm
)
>
;
using
BlockGemmPolicy
=
BlockGemmASmemBSmemCRegV1CustomPolicy
<
typename
Problem
::
ADataType
,
// using BlockGemmPolicy =
// BlockGemmASmemBRegCRegV1CustomPolicy<typename
// Problem::ADataType,
typename
Problem
::
GDataType
,
typename
Problem
::
AccDataType
,
typename
S_
::
WarpPerBlock_0
,
decltype
(
warp_gemm
)
>
;
return
BlockGemmASmemBSmemCRegV1
<
GemmProblem
,
BlockGemmPolicy
>
{};
// return BlockGemmASmemBRegCRegV1<GemmProblem, BlockGemmPolicy>{};
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment