Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
yangql
composable_kernel-1
Commits
c39c573e
Commit
c39c573e
authored
Jan 24, 2019
by
Chao Liu
Browse files
refactor
parent
c9af4dec
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
8 deletions
+8
-8
driver/device_implicit_gemm_convolution_2_cnhw_srck_knhw.cuh
driver/device_implicit_gemm_convolution_2_cnhw_srck_knhw.cuh
+4
-4
src/include/gridwise_implicit_gemm_convolution_3_cnhw_srck_knhw.cuh
...e/gridwise_implicit_gemm_convolution_3_cnhw_srck_knhw.cuh
+4
-4
No files found.
driver/device_implicit_gemm_convolution_2_cnhw_srck_knhw.cuh
View file @
c39c573e
...
...
@@ -102,8 +102,8 @@ void device_implicit_gemm_convolution_2_cnhw_srck_knhw(InDesc,
constexpr
unsigned
KPerThread
=
8
;
constexpr
unsigned
CPerThread
=
1
;
constexpr
unsigned
GemmThreadPerCluster
Row
=
4
;
constexpr
unsigned
GemmThreadPerCluster
Column
=
4
;
constexpr
unsigned
Gemm
Row
ThreadPerCluster
=
4
;
constexpr
unsigned
Gemm
Column
ThreadPerCluster
=
4
;
constexpr
unsigned
InBlockCopyThreadPerDim0
=
2
;
constexpr
unsigned
InBlockCopyThreadPerDim1
=
64
;
...
...
@@ -149,8 +149,8 @@ void device_implicit_gemm_convolution_2_cnhw_srck_knhw(InDesc,
BPerThread
,
KPerThread
,
CPerThread
,
GemmThreadPerCluster
Row
,
GemmThreadPerCluster
Column
,
Gemm
Row
ThreadPerCluster
,
Gemm
Column
ThreadPerCluster
,
InBlockCopyThreadPerDim0
,
InBlockCopyThreadPerDim1
>
<<<
grid_dim
,
block_dim
>>>
(
in_cnhw_desc
,
...
...
src/include/gridwise_implicit_gemm_convolution_3_cnhw_srck_knhw.cuh
View file @
c39c573e
...
...
@@ -20,8 +20,8 @@ template <unsigned GridSize,
unsigned
BPerThread
,
unsigned
KPerThread
,
unsigned
CPerThread
,
unsigned
GemmThreadPerCluster
Row
,
unsigned
GemmThreadPerCluster
Column
,
unsigned
Gemm
Row
ThreadPerCluster
,
unsigned
Gemm
Column
ThreadPerCluster
,
unsigned
InBlockCopyThreadPerDim0
,
unsigned
InBlockCopyThreadPerDim1
>
__global__
void
...
...
@@ -177,8 +177,8 @@ gridwise_implicit_gemm_convolution_3_cnhw_srck_knhw(InGlobalDesc,
false
,
false
,
CPerThread
,
GemmThreadPerCluster
Row
,
GemmThreadPerCluster
Column
,
Gemm
Row
ThreadPerCluster
,
Gemm
Column
ThreadPerCluster
,
true
>
{};
// LDS
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment