Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
yangql
composable_kernel-1
Commits
05e04665
Commit
05e04665
authored
Jun 11, 2019
by
Chao Liu
Browse files
remove .hip extension
parent
a68b16a5
Changes
57
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
101 additions
and
101 deletions
+101
-101
src/include/blockwise_4d_tensor_op.hpp
src/include/blockwise_4d_tensor_op.hpp
+2
-2
src/include/blockwise_batched_gemm.hpp
src/include/blockwise_batched_gemm.hpp
+1
-1
src/include/blockwise_gemm.hpp
src/include/blockwise_gemm.hpp
+2
-2
src/include/blockwise_generic_tensor_slice_op.hpp
src/include/blockwise_generic_tensor_slice_op.hpp
+1
-1
src/include/blockwise_tensor_slice_op.hpp
src/include/blockwise_tensor_slice_op.hpp
+1
-1
src/include/common.hip.hpp
src/include/common.hip.hpp
+0
-13
src/include/common.hpp
src/include/common.hpp
+13
-0
src/include/conv_common.hpp
src/include/conv_common.hpp
+1
-1
src/include/functional.hpp
src/include/functional.hpp
+2
-2
src/include/functional2.hpp
src/include/functional2.hpp
+2
-2
src/include/functional3.hpp
src/include/functional3.hpp
+4
-4
src/include/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
...include/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
+6
-6
src/include/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
+8
-8
src/include/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
+9
-9
src/include/gridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.hpp
+9
-9
src/include/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
+8
-8
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.hpp
...n_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.hpp
+8
-8
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.hpp
...n_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.hpp
+8
-8
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.hpp
...n_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.hpp
+8
-8
src/include/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.hpp
+8
-8
No files found.
src/include/blockwise_4d_tensor_op.
hip.
hpp
→
src/include/blockwise_4d_tensor_op.hpp
View file @
05e04665
#pragma once
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
#include "threadwise_tensor_slice_op.hpp"
template
<
index_t
BlockSize
,
class
Float
,
class
DstDesc
,
class
F
>
__device__
void
...
...
src/include/blockwise_batched_gemm.
hip.
hpp
→
src/include/blockwise_batched_gemm.hpp
View file @
05e04665
#pragma once
#include "threadwise_gemm.
hip.
hpp"
#include "threadwise_gemm.hpp"
template
<
index_t
BlockSize
,
class
BlockMatrixA
,
...
...
src/include/blockwise_gemm.
hip.
hpp
→
src/include/blockwise_gemm.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "threadwise_gemm.
hip.
hpp"
#include "common.hpp"
#include "threadwise_gemm.hpp"
// if following number are power of 2, index calculation shall be greatly reduced:
// MPerThreadSubC, NPerThreadSubC, MLevel0Cluster, NLevel0Cluster, MLevel1Cluster, NLevel1Cluster
...
...
src/include/blockwise_generic_tensor_slice_op.
hip.
hpp
→
src/include/blockwise_generic_tensor_slice_op.hpp
View file @
05e04665
#pragma once
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.hpp"
// slice a (normal or merged) tensor, and copy it into another (normal or merged) tensor
// memory layout (ordering of dimensions) can be different between src and dst
...
...
src/include/blockwise_tensor_slice_op.
hip.
hpp
→
src/include/blockwise_tensor_slice_op.hpp
View file @
05e04665
#pragma once
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.hpp"
template
<
index_t
BlockSize
,
class
Float
,
...
...
src/include/common.hip.hpp
deleted
100644 → 0
View file @
a68b16a5
#pragma once
#include "base.hip.hpp"
#include "vector_type.hip.hpp"
#include "integral_constant.hip.hpp"
#include "Sequence.hip.hpp"
#include "Array.hip.hpp"
#include "functional.hip.hpp"
#include "functional2.hip.hpp"
#include "functional3.hip.hpp"
#if USE_AMD_INLINE_ASM
#include "amd_inline_asm.hip.hpp"
#endif
src/include/common.hpp
0 → 100644
View file @
05e04665
#pragma once
#include "base.hpp"
#include "vector_type.hpp"
#include "integral_constant.hpp"
#include "Sequence.hpp"
#include "Array.hpp"
#include "functional.hpp"
#include "functional2.hpp"
#include "functional3.hpp"
#if USE_AMD_INLINE_ASM
#include "amd_inline_asm.hpp"
#endif
src/include/conv_common.
hip.
hpp
→
src/include/conv_common.hpp
View file @
05e04665
#pragma once
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
// this is ugly, only for 4d
template
<
class
InDesc
,
class
WeiDesc
>
...
...
src/include/functional.
hip.
hpp
→
src/include/functional.hpp
View file @
05e04665
#pragma once
#include "integral_constant.
hip.
hpp"
#include "Sequence.
hip.
hpp"
#include "integral_constant.hpp"
#include "Sequence.hpp"
struct
forwarder
{
...
...
src/include/functional2.
hip.
hpp
→
src/include/functional2.hpp
View file @
05e04665
#pragma once
#include "functional.
hip.
hpp"
#include "Sequence.
hip.
hpp"
#include "functional.hpp"
#include "Sequence.hpp"
template
<
class
>
struct
static_for_impl
;
...
...
src/include/functional3.
hip.
hpp
→
src/include/functional3.hpp
View file @
05e04665
#pragma once
#include "functional.
hip.
hpp"
#include "functional2.
hip.
hpp"
#include "Sequence.
hip.
hpp"
#include "Array.
hip.
hpp"
#include "functional.hpp"
#include "functional2.hpp"
#include "Sequence.hpp"
#include "Array.hpp"
// RemainLengths: Sequence<...>
template
<
class
RemainLengths
>
...
...
src/include/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.
hip.
hpp
→
src/include/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_4d_tensor_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_direct_convolution.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_direct_convolution.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_3d_tensor_op.
hip.
hpp"
#include "blockwise_4d_tensor_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_3d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_3d_tensor_op.
hip.
hpp"
#include "blockwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_3d_tensor_op.hpp"
#include "blockwise_tensor_slice_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_4d_tensor_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_4d_tensor_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_tensor_slice_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_tensor_slice_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
src/include/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.
hip.
hpp
→
src/include/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#include "common.
hip.
hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantMatrixDescriptor.
hip.
hpp"
#include "blockwise_2d_tensor_op.
hip.
hpp"
#include "blockwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_tensor_slice_op.
hip.
hpp"
#include "threadwise_4d_tensor_op.
hip.
hpp"
#include "blockwise_batched_gemm.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "blockwise_tensor_slice_op.hpp"
#include "threadwise_tensor_slice_op.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
template
<
index_t
GridSize
,
index_t
BlockSize
,
...
...
Prev
1
2
3
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment