Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
b5e35626
Commit
b5e35626
authored
Jan 16, 2025
by
coderfeli
Browse files
fix typo
parent
d12c3c6f
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
3 deletions
+4
-3
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_flatmm_uk.hpp
...s/fused_moe/pipeline/fused_moegemm_pipeline_flatmm_uk.hpp
+4
-3
No files found.
include/ck_tile/ops/fused_moe/pipeline/fused_moegemm_pipeline_flatmm_uk.hpp
View file @
b5e35626
...
@@ -187,7 +187,7 @@ struct FusedMoeGemmPipeline_FlatmmUk
...
@@ -187,7 +187,7 @@ struct FusedMoeGemmPipeline_FlatmmUk
const
IndexDataType
expert_id
=
__builtin_amdgcn_readfirstlane
(
const
IndexDataType
expert_id
=
__builtin_amdgcn_readfirstlane
(
reinterpret_cast
<
const
IndexDataType
*>
(
kargs
.
sorted_expert_ids_ptr
)[
sorted_tile_id
]);
reinterpret_cast
<
const
IndexDataType
*>
(
kargs
.
sorted_expert_ids_ptr
)[
sorted_tile_id
]);
const
IndexDataType
expert_first_token
=
__builtin_amdgcn_readfirstlane
(
const
IndexDataType
expert_first_token
=
__builtin_amdgcn_readfirstlane
(
reinterpret_cast
<
const
IndexDataType
*>
(
kargs
.
sorted_token_ids_ptr
)[
sorted_tile_id
*
32
]);
reinterpret_cast
<
const
IndexDataType
*>
(
kargs
.
sorted_token_ids_ptr
)[
sorted_tile_id
*
BlockShape
::
Block_M0
]);
index_t
expert_stride_0
=
shared_intermediate_size_0
*
kargs
.
hidden_size
;
index_t
expert_stride_0
=
shared_intermediate_size_0
*
kargs
.
hidden_size
;
index_t
expert_stride_1
=
shared_intermediate_size_1
*
kargs
.
hidden_size
;
index_t
expert_stride_1
=
shared_intermediate_size_1
*
kargs
.
hidden_size
;
...
@@ -209,9 +209,10 @@ struct FusedMoeGemmPipeline_FlatmmUk
...
@@ -209,9 +209,10 @@ struct FusedMoeGemmPipeline_FlatmmUk
threadIdx
.
x
%
(
BlockShape
::
Block_K0
/
kAlignmentA
)
*
kAlignmentA
;
threadIdx
.
x
%
(
BlockShape
::
Block_K0
/
kAlignmentA
)
*
kAlignmentA
;
},
},
number
<
row_ids_a
.
size
()
>
{});
number
<
row_ids_a
.
size
()
>
{});
if
(
expert_first_token
&
0xffffff
>=
kargs
.
num_tokens
)
if
(
(
expert_first_token
&
0xffffff
)
>=
kargs
.
num_tokens
)
return
;
return
;
// printf("tid %d %d, first %d\n", blockIdx.x, threadIdx.x,expert_first_token&0xffffff);
// if (threadIdx.x %32==0)
// printf("block %d %d thread %d, expert %d firstt %x %d, sorted_tile_id %d\n", blockIdx.x,blockIdx.y, threadIdx.x,expert_id, expert_first_token,(expert_first_token&0xffffff), sorted_tile_id);
// for (int i = 0; i < row_ids_a.size(); i++) {
// for (int i = 0; i < row_ids_a.size(); i++) {
// printf("%d bid %d tid %d rowid %d\n", i, blockIdx.x, threadIdx.x, row_ids_a[i]);
// printf("%d bid %d tid %d rowid %d\n", i, blockIdx.x, threadIdx.x, row_ids_a[i]);
// }
// }
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment