Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
0f49ce23
Commit
0f49ce23
authored
Jun 30, 2023
by
Jing Zhang
Committed by
root
Jun 30, 2023
Browse files
void data pointers
parent
a74cbab8
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
28 additions
and
12 deletions
+28
-12
include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_xdl_splitk_cshuffle.hpp
...u/device/impl/device_grouped_gemm_xdl_splitk_cshuffle.hpp
+28
-12
No files found.
include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_xdl_splitk_cshuffle.hpp
View file @
0f49ce23
...
...
@@ -25,6 +25,9 @@ namespace device {
template
<
typename
GridwiseGemm
,
typename
GemmDesc
,
typename
FloatA
,
typename
FloatB
,
typename
FloatC
,
bool
HasMainKBlockLoop
,
InMemoryDataOperationEnum
CGlobalMemoryDataOperation
>
__global__
void
...
...
@@ -77,9 +80,10 @@ __global__ void
}
#endif
const
auto
p_a_grid
=
gemm_desc_ptr
[
group_id
].
p_a_grid
;
const
auto
p_b_grid
=
gemm_desc_ptr
[
group_id
].
p_b_grid
;
const
auto
p_c_grid
=
gemm_desc_ptr
[
group_id
].
p_c_grid
;
const
auto
p_a_grid
=
reinterpret_cast
<
const
FloatA
*>
(
gemm_desc_ptr
[
group_id
].
p_a_grid
);
const
auto
p_b_grid
=
reinterpret_cast
<
const
FloatB
*>
(
gemm_desc_ptr
[
group_id
].
p_b_grid
);
const
auto
p_c_grid
=
reinterpret_cast
<
FloatC
*>
(
gemm_desc_ptr
[
group_id
].
p_c_grid
);
const
auto
M
=
gemm_desc_ptr
[
group_id
].
M
;
const
auto
N
=
gemm_desc_ptr
[
group_id
].
N
;
const
auto
K
=
gemm_desc_ptr
[
group_id
].
K
;
...
...
@@ -400,9 +404,9 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
{
struct
SimpleGemmArgument
{
const
ADataType
*
p_a_grid
;
const
BDataType
*
p_b_grid
;
EDataType
*
p_c_grid
;
const
void
*
p_a_grid
;
const
void
*
p_b_grid
;
void
*
p_c_grid
;
index_t
M
;
index_t
N
;
...
...
@@ -517,6 +521,9 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
const
auto
kernel
=
kernel_grouped_gemm_xdl_splitk
<
GridwiseGemm
,
GemmArgumentType
,
ADataType
,
BDataType
,
EDataType
,
true
,
InMemoryDataOperationEnum
::
AtomicAdd
>
;
...
...
@@ -527,6 +534,9 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
const
auto
kernel
=
kernel_grouped_gemm_xdl_splitk
<
GridwiseGemm
,
GemmArgumentType
,
ADataType
,
BDataType
,
EDataType
,
true
,
InMemoryDataOperationEnum
::
Set
>
;
...
...
@@ -540,6 +550,9 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
const
auto
kernel
=
kernel_grouped_gemm_xdl_splitk
<
GridwiseGemm
,
GemmArgumentType
,
ADataType
,
BDataType
,
EDataType
,
false
,
InMemoryDataOperationEnum
::
AtomicAdd
>
;
...
...
@@ -550,6 +563,9 @@ struct DeviceGroupedGemmXdlSplitKCShuffle : public DeviceGroupedGemmSplitK<ALayo
const
auto
kernel
=
kernel_grouped_gemm_xdl_splitk
<
GridwiseGemm
,
GemmArgumentType
,
ADataType
,
BDataType
,
EDataType
,
false
,
InMemoryDataOperationEnum
::
Set
>
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment