Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
28252273
Commit
28252273
authored
Dec 17, 2024
by
letaoqin
Browse files
first version right
parent
580d93dc
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
5 additions
and
3 deletions
+5
-3
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
...ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
+3
-1
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
...ed_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
+2
-2
No files found.
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general.hpp
View file @
28252273
...
@@ -323,7 +323,7 @@ struct FusedMoeGemmPipeline_General
...
@@ -323,7 +323,7 @@ struct FusedMoeGemmPipeline_General
Policy
::
template
MakeGlobalTileDistribution_O
<
Problem
>());
Policy
::
template
MakeGlobalTileDistribution_O
<
Problem
>());
auto
save_o
=
[
&
]()
{
auto
save_o
=
[
&
]()
{
//if(blockIdx.x == 0 && (blockIdx.y == 0 || blockIdx.y == 1) && blockIdx.z == 0)
//
if(blockIdx.x == 0 && (blockIdx.y == 0 || blockIdx.y == 1) && blockIdx.z == 0)
{
{
if
(
threadIdx
.
x
<
64
)
if
(
threadIdx
.
x
<
64
)
{
{
...
@@ -339,6 +339,8 @@ struct FusedMoeGemmPipeline_General
...
@@ -339,6 +339,8 @@ struct FusedMoeGemmPipeline_General
});
});
});
});
update_tile
(
o_window_
,
o0
);
update_tile
(
o_window_
,
o0
);
// restore pos
move_tile_window
(
o_olds_win
,
{
-
32
*
(
BlockShape
::
Repeat_K1
-
1
),
0
});
}
}
}
}
};
};
...
...
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_general_policy.hpp
View file @
28252273
...
@@ -24,7 +24,7 @@ struct FusedMoeGemmPipelineGeneralPolicy
...
@@ -24,7 +24,7 @@ struct FusedMoeGemmPipelineGeneralPolicy
CK_TILE_HOST_DEVICE
static
constexpr
index_t
GetAsyncCopyDwords
()
CK_TILE_HOST_DEVICE
static
constexpr
index_t
GetAsyncCopyDwords
()
{
{
// TODO: always 1 dword
// TODO: always 1 dword
return
1
;
return
2
;
}
}
template
<
typename
Problem
>
template
<
typename
Problem
>
...
@@ -196,7 +196,7 @@ struct FusedMoeGemmPipelineGeneralPolicy
...
@@ -196,7 +196,7 @@ struct FusedMoeGemmPipelineGeneralPolicy
{
{
return
make_static_tile_distribution
(
return
make_static_tile_distribution
(
tile_distribution_encoding
<
sequence
<
1
>
,
tile_distribution_encoding
<
sequence
<
1
>
,
tuple
<
sequence
<
1
,
2
,
16
>
,
sequence
<
4
,
8
>>
,
tuple
<
sequence
<
1
,
1
,
32
>
,
sequence
<
2
,
16
>>
,
tuple
<
sequence
<
0
,
1
>
,
sequence
<
1
,
2
>>
,
tuple
<
sequence
<
0
,
1
>
,
sequence
<
1
,
2
>>
,
tuple
<
sequence
<
0
,
0
>
,
sequence
<
2
,
0
>>
,
tuple
<
sequence
<
0
,
0
>
,
sequence
<
2
,
0
>>
,
sequence
<
1
,
2
>
,
sequence
<
1
,
2
>
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment