Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
d2490b49
Commit
d2490b49
authored
Nov 19, 2019
by
Chao Liu
Browse files
rename
parent
d78fe365
Changes
3
Show whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
29 additions
and
31 deletions
+29
-31
composable_kernel/include/kernel_algorithm/gridwise_convolution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw_lds_double_buffer.hpp
...a_implicit_gemm_v4r4_nchw_kcyx_nkhw_lds_double_buffer.hpp
+3
-3
driver/include/device_convolution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw.hpp
...ution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw.hpp
+13
-13
driver/src/conv_bwd_data_driver.cpp
driver/src/conv_bwd_data_driver.cpp
+13
-15
No files found.
composable_kernel/include/kernel_algorithm/gridwise_convolution_backward_data_implicit_gemm_v1_nchw_kcyx_nkhw_lds_double_buffer.hpp → composable_kernel/include/kernel_algorithm/gridwise_convolution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw_lds_double_buffer.hpp
View file @
d2490b49
#ifndef CK_GRIDWISE_CONVOLUTION_BACKWARD_DATA_IMPLICIT_GEMM_V
1
_NCHW_KCYX_NKHW_LDS_DOUBLE_BUFFER_HPP
#define CK_GRIDWISE_CONVOLUTION_BACKWARD_DATA_IMPLICIT_GEMM_V
1
_NCHW_KCYX_NKHW_LDS_DOUBLE_BUFFER_HPP
#ifndef CK_GRIDWISE_CONVOLUTION_BACKWARD_DATA_IMPLICIT_GEMM_V
4R4
_NCHW_KCYX_NKHW_LDS_DOUBLE_BUFFER_HPP
#define CK_GRIDWISE_CONVOLUTION_BACKWARD_DATA_IMPLICIT_GEMM_V
4R4
_NCHW_KCYX_NKHW_LDS_DOUBLE_BUFFER_HPP
#include "common_header.hpp"
#include "tensor_descriptor.hpp"
...
...
@@ -41,7 +41,7 @@ template <index_t GridSize,
typename
WeiBlockCopyClusterLengths_K_E
,
index_t
WeiBlockCopyDataPerAccess_E
,
index_t
InThreadCopyDataPerAccess_B
>
struct
GridwiseConvolutionBackwardDataImplicitGemm_v
1
_nchw_kcyx_nkhw_lds_double_buffer
struct
GridwiseConvolutionBackwardDataImplicitGemm_v
4r4
_nchw_kcyx_nkhw_lds_double_buffer
{
__device__
void
Run
(
Float
*
const
__restrict__
p_in_global
,
const
Float
*
const
__restrict__
p_wei_global
,
...
...
driver/include/device_convolution_bwd_data_implicit_gemm_v1_nchw_kcyx_nkhw.hpp → driver/include/device_convolution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw.hpp
View file @
d2490b49
...
...
@@ -3,7 +3,7 @@
#include "device.hpp"
#include "tensor.hpp"
#include "gridwise_operation_wrapper.hpp"
#include "gridwise_convolution_backward_data_implicit_gemm_v
1
_nchw_kcyx_nkhw_lds_double_buffer.hpp"
#include "gridwise_convolution_backward_data_implicit_gemm_v
4r4
_nchw_kcyx_nkhw_lds_double_buffer.hpp"
template
<
typename
T
,
typename
InDesc
,
...
...
@@ -13,7 +13,7 @@ template <typename T,
typename
ConvDilations
,
typename
LeftPads
,
typename
RightPads
>
void
device_convolution_b
w
d_data_implicit_gemm_v
1
_nchw_kcyx_nkhw
(
InDesc
in_nchw_desc
,
void
device_convolution_b
ackwar
d_data_implicit_gemm_v
4r4
_nchw_kcyx_nkhw
(
InDesc
in_nchw_desc
,
Tensor
<
T
>&
in_nchw
,
WeiDesc
wei_kcyx_desc
,
const
Tensor
<
T
>&
wei_kcyx
,
...
...
@@ -85,7 +85,7 @@ void device_convolution_bwd_data_implicit_gemm_v1_nchw_kcyx_nkhw(InDesc in_nchw_
printf
(
"%s: BlockSize %u, GridSize %u
\n
"
,
__func__
,
BlockSize
,
GridSize
);
constexpr
auto
gridwise_conv
=
GridwiseConvolutionBackwardDataImplicitGemm_v
1
_nchw_kcyx_nkhw_lds_double_buffer
<
GridwiseConvolutionBackwardDataImplicitGemm_v
4r4
_nchw_kcyx_nkhw_lds_double_buffer
<
GridSize
,
BlockSize
,
T
,
...
...
driver/src/conv_bwd_data_driver.cpp
View file @
d2490b49
...
...
@@ -13,7 +13,7 @@
#include "device_tensor.hpp"
#include "conv_common.hpp"
#include "host_conv_bwd_data.hpp"
#include "device_convolution_b
w
d_data_implicit_gemm_v
1
_nchw_kcyx_nkhw.hpp"
#include "device_convolution_b
ackwar
d_data_implicit_gemm_v
4r4
_nchw_kcyx_nkhw.hpp"
int
main
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -96,7 +96,7 @@ int main(int argc, char* argv[])
using
LeftPads
=
Sequence
<
0
,
0
>
;
using
RightPads
=
Sequence
<
0
,
0
>
;
#elif
0
#elif
1
// 1x1 filter, 8x8 image
// cudnn@V100 83%, ck@V100 75%, ck@P100 78%, ck@VII 65%
constexpr
index_t
N
=
128
;
...
...
@@ -344,8 +344,7 @@ int main(int argc, char* argv[])
#endif
}
#if 1
device_convolution_bwd_data_implicit_gemm_v1_nchw_kcyx_nkhw
(
in_nchw_desc
,
device_convolution_backward_data_implicit_gemm_v4r4_nchw_kcyx_nkhw
(
in_nchw_desc
,
in_nchw_device
,
wei_kcyx_desc
,
wei_kcyx
,
...
...
@@ -356,7 +355,6 @@ int main(int argc, char* argv[])
LeftPads
{},
RightPads
{},
nrepeat
);
#endif
if
(
do_verification
)
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment