Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
822856e1
Commit
822856e1
authored
Jun 01, 2021
by
Jing Zhang
Browse files
rename kperwave to kpack
parent
5ac70ce0
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
8 additions
and
8 deletions
+8
-8
composable_kernel/include/driver/driver_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
...tion_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
+2
-2
composable_kernel/include/driver/driver_dynamic_gemm_xdlops_v1.hpp
...e_kernel/include/driver/driver_dynamic_gemm_xdlops_v1.hpp
+2
-2
driver/include/device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
...tion_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
+4
-4
No files found.
composable_kernel/include/driver/driver_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
View file @
822856e1
...
@@ -16,7 +16,7 @@ template <typename FloatAB,
...
@@ -16,7 +16,7 @@ template <typename FloatAB,
index_t
GemmNPerBlock
,
index_t
GemmNPerBlock
,
index_t
GemmMPerWave
,
index_t
GemmMPerWave
,
index_t
GemmNPerWave
,
index_t
GemmNPerWave
,
index_t
GemmKP
erWave
,
index_t
GemmKP
ack
,
typename
...
Wei
,
typename
...
Wei
,
typename
...
In
,
typename
...
In
,
typename
...
Out
,
typename
...
Out
,
...
@@ -110,7 +110,7 @@ transform_forward_convolution_into_gemm_v4r4_xdlops_nchw_kcyx_nkhw_pad(
...
@@ -110,7 +110,7 @@ transform_forward_convolution_into_gemm_v4r4_xdlops_nchw_kcyx_nkhw_pad(
assert
(
GemmM
%
GemmMPerBlock
==
0
&&
GemmN
%
GemmNPerBlock
==
0
&&
GemmK
%
GemmKPerBlock
==
0
);
assert
(
GemmM
%
GemmMPerBlock
==
0
&&
GemmN
%
GemmNPerBlock
==
0
&&
GemmK
%
GemmKPerBlock
==
0
);
constexpr
auto
xdlops_gemm
=
XdlopsGemm
<
FloatAB
,
GemmMPerWave
,
GemmNPerWave
,
GemmKP
erWave
>
{};
constexpr
auto
xdlops_gemm
=
XdlopsGemm
<
FloatAB
,
GemmMPerWave
,
GemmNPerWave
,
GemmKP
ack
>
{};
constexpr
auto
CLayout
=
xdlops_gemm
.
GetCLayout
();
constexpr
auto
CLayout
=
xdlops_gemm
.
GetCLayout
();
...
...
composable_kernel/include/driver/driver_dynamic_gemm_xdlops_v1.hpp
View file @
822856e1
...
@@ -23,7 +23,7 @@ template <index_t BlockSize,
...
@@ -23,7 +23,7 @@ template <index_t BlockSize,
index_t
KPerBlock
,
index_t
KPerBlock
,
index_t
MPerWave
,
index_t
MPerWave
,
index_t
NPerWave
,
index_t
NPerWave
,
index_t
KP
erWave
,
index_t
KP
ack
,
index_t
MRepeat
,
index_t
MRepeat
,
index_t
NRepeat
,
index_t
NRepeat
,
typename
ABlockTransferThreadSliceLengths_K_M
,
typename
ABlockTransferThreadSliceLengths_K_M
,
...
@@ -100,7 +100,7 @@ __host__ float launch_kernel_dynamic_gemm_xdlops_v1(const FloatAB* p_a_global,
...
@@ -100,7 +100,7 @@ __host__ float launch_kernel_dynamic_gemm_xdlops_v1(const FloatAB* p_a_global,
KPerBlock
,
KPerBlock
,
MPerWave
,
MPerWave
,
NPerWave
,
NPerWave
,
KP
erWave
,
KP
ack
,
MRepeat
,
MRepeat
,
NRepeat
,
NRepeat
,
ABlockTransferThreadSliceLengths_K_M
,
ABlockTransferThreadSliceLengths_K_M
,
...
...
driver/include/device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw.hpp
View file @
822856e1
...
@@ -88,7 +88,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
...
@@ -88,7 +88,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
constexpr index_t GemmMPerWave = 64;
constexpr index_t GemmMPerWave = 64;
constexpr index_t GemmNPerWave = 64;
constexpr index_t GemmNPerWave = 64;
constexpr index_t GemmKP
erWave
= 1;
constexpr index_t GemmKP
ack
= 1;
using GemmABlockTransferThreadSliceLengths_GemmK_GemmM = Sequence<4, 2>;
using GemmABlockTransferThreadSliceLengths_GemmK_GemmM = Sequence<4, 2>;
using GemmABlockTransferThreadClusterLengths_GemmK_GemmM = Sequence<2, 32>;
using GemmABlockTransferThreadClusterLengths_GemmK_GemmM = Sequence<2, 32>;
...
@@ -112,7 +112,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
...
@@ -112,7 +112,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
constexpr
index_t
GemmMPerWave
=
64
;
constexpr
index_t
GemmMPerWave
=
64
;
constexpr
index_t
GemmNPerWave
=
64
;
constexpr
index_t
GemmNPerWave
=
64
;
constexpr
index_t
GemmKP
erWave
=
4
;
constexpr
index_t
GemmKP
ack
=
4
;
constexpr
index_t
MRepeat
=
1
;
constexpr
index_t
MRepeat
=
1
;
constexpr
index_t
NRepeat
=
1
;
constexpr
index_t
NRepeat
=
1
;
...
@@ -138,7 +138,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
...
@@ -138,7 +138,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
GemmNPerBlock
,
GemmNPerBlock
,
GemmMPerWave
,
GemmMPerWave
,
GemmNPerWave
,
GemmNPerWave
,
GemmKP
erWave
>
(
GemmKP
ack
>
(
wei_k_c_y_x_desc
,
wei_k_c_y_x_desc
,
in_n_c_hi_wi_desc
,
in_n_c_hi_wi_desc
,
out_n_k_ho_wo_desc
,
out_n_k_ho_wo_desc
,
...
@@ -164,7 +164,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
...
@@ -164,7 +164,7 @@ void device_dynamic_convolution_forward_implicit_gemm_v4r4_xdlops_nchw_kcyx_nkhw
GemmKPerBlock
,
GemmKPerBlock
,
GemmMPerWave
,
GemmMPerWave
,
GemmNPerWave
,
GemmNPerWave
,
GemmKP
erWave
,
GemmKP
ack
,
MRepeat
,
MRepeat
,
NRepeat
,
NRepeat
,
GemmABlockTransferThreadSliceLengths_GemmK_GemmM
,
GemmABlockTransferThreadSliceLengths_GemmK_GemmM
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment