Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
yangql
composable_kernel-1
Commits
05e04665
"...resnet50_tensorflow.git" did not exist on "fb35d6bef6eecc640fb865dd2fc73d8fee2a93b6"
Commit
05e04665
authored
Jun 11, 2019
by
Chao Liu
Browse files
remove .hip extension
parent
a68b16a5
Changes
57
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
41 additions
and
41 deletions
+41
-41
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
+2
-2
driver/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
...er/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
+5
-5
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_khwn.hpp
...er/device_convolution_implicit_gemm_v1_nchw_cyxk_khwn.hpp
+4
-4
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
...er/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
+3
-3
driver/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
...er/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
+3
-3
driver/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
...er/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
+3
-3
driver/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
...er/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
+3
-3
driver/device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
...device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
+1
-1
driver/device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
...ice_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
+1
-1
driver/driver.cpp
driver/driver.cpp
+2
-2
driver/driver.cu
driver/driver.cu
+1
-1
src/include/Array.hpp
src/include/Array.hpp
+2
-2
src/include/ConstantMatrixDescriptor.hpp
src/include/ConstantMatrixDescriptor.hpp
+1
-1
src/include/ConstantMergedTensorDescriptor.hpp
src/include/ConstantMergedTensorDescriptor.hpp
+2
-2
src/include/ConstantTensorDescriptor.hpp
src/include/ConstantTensorDescriptor.hpp
+1
-1
src/include/Sequence.hpp
src/include/Sequence.hpp
+2
-2
src/include/amd_inline_asm.hpp
src/include/amd_inline_asm.hpp
+1
-1
src/include/base.hpp
src/include/base.hpp
+0
-0
src/include/blockwise_2d_tensor_op.hpp
src/include/blockwise_2d_tensor_op.hpp
+2
-2
src/include/blockwise_3d_tensor_op.hpp
src/include/blockwise_3d_tensor_op.hpp
+2
-2
No files found.
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_direct_v2_nchw_kcyx_nkhw.
hip.
hpp"
#include "gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_direct_v2_nchw_kcyx_nkhw
(
InDesc
,
void
device_convolution_direct_v2_nchw_kcyx_nkhw
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_chwn_cyxk_khwn.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v1_chwn_cyxk_khwn
(
InDesc
,
void
device_convolution_implicit_gemm_v1_chwn_cyxk_khwn
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r2_nchw_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_khwn.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v1_nchw_cyxk_khwn
(
InDesc
,
void
device_convolution_implicit_gemm_v1_nchw_cyxk_khwn
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_lds_double_buffer_nchw_cyxk_nkhw.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw
(
InDesc
,
void
device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v2_chwn_cyxk_khwn
(
InDesc
,
void
device_convolution_implicit_gemm_v2_chwn_cyxk_khwn
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v3_lds_double_buffer_nchw_cyxk_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v3_lds_double_buffer_nchw_cyxk_nkhw.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw
(
InDesc
,
void
device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw
(
InDesc
,
...
...
driver/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_wrapper.
hip.
hpp"
#include "gridwise_convolution_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v4_lds_double_buffer_nchw_kcyx_nkhw.
hip.
hpp"
#include "gridwise_convolution_implicit_gemm_v4_lds_double_buffer_nchw_kcyx_nkhw.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw
(
InDesc
,
void
device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw
(
InDesc
,
...
...
driver/device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.
hip.
hpp"
#include "gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
template
<
class
TInWei
,
class
TOut
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
template
<
class
TInWei
,
class
TOut
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
>
void
device_direct_convolution_2_vectorized_nchw_kcyx_nkhw
(
InDesc
,
void
device_direct_convolution_2_vectorized_nchw_kcyx_nkhw
(
InDesc
,
...
...
driver/device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
View file @
05e04665
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.
hip.
hpp"
#include "gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp"
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
,
class
LowerPads
,
class
UpperPads
>
template
<
class
T
,
class
InDesc
,
class
WeiDesc
,
class
OutDesc
,
class
LowerPads
,
class
UpperPads
>
void
device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded
(
InDesc
,
void
device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded
(
InDesc
,
...
...
driver/driver.
hip.
cpp
→
driver/driver.cpp
View file @
05e04665
...
@@ -5,8 +5,8 @@
...
@@ -5,8 +5,8 @@
#include <stdlib.h>
#include <stdlib.h>
#include "config.h"
#include "config.h"
#include "tensor.hpp"
#include "tensor.hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
#include "conv_common.
hip.
hpp"
#include "conv_common.hpp"
#include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
#include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
//#include "device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
//#include "device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
#include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp"
#include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp"
...
...
driver/driver.cu
View file @
05e04665
driver
.
hip
.
cpp
driver
.
cpp
\ No newline at end of file
\ No newline at end of file
src/include/Array.
hip.
hpp
→
src/include/Array.hpp
View file @
05e04665
#pragma once
#pragma once
#include "Sequence.
hip.
hpp"
#include "Sequence.hpp"
#include "functional2.
hip.
hpp"
#include "functional2.hpp"
template
<
class
TData
,
index_t
NSize
>
template
<
class
TData
,
index_t
NSize
>
struct
Array
struct
Array
...
...
src/include/ConstantMatrixDescriptor.
hip.
hpp
→
src/include/ConstantMatrixDescriptor.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
template
<
index_t
NRow_
,
index_t
NCol_
,
index_t
RowStride_
>
template
<
index_t
NRow_
,
index_t
NCol_
,
index_t
RowStride_
>
struct
ConstantMatrixDescriptor
struct
ConstantMatrixDescriptor
...
...
src/include/ConstantMergedTensorDescriptor.
hip.
hpp
→
src/include/ConstantMergedTensorDescriptor.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
// OriginalTensorDesc : ConstantTensorDescriptor<...>
// OriginalTensorDesc : ConstantTensorDescriptor<...>
// it's the tensor whose dimensions are to be merged
// it's the tensor whose dimensions are to be merged
...
...
src/include/ConstantTensorDescriptor.
hip.
hpp
→
src/include/ConstantTensorDescriptor.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
template
<
class
Lengths
>
template
<
class
Lengths
>
__host__
__device__
constexpr
auto
calculate_tensor_strides_packed
(
Lengths
)
__host__
__device__
constexpr
auto
calculate_tensor_strides_packed
(
Lengths
)
...
...
src/include/Sequence.
hip.
hpp
→
src/include/Sequence.hpp
View file @
05e04665
#pragma once
#pragma once
#include "integral_constant.
hip.
hpp"
#include "integral_constant.hpp"
#include "functional.
hip.
hpp"
#include "functional.hpp"
template
<
class
Seq
>
template
<
class
Seq
>
struct
is_valid_sequence_map
;
struct
is_valid_sequence_map
;
...
...
src/include/amd_inline_asm.
hip.
hpp
→
src/include/amd_inline_asm.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
#define NO_VM_WAIT 0
#define NO_VM_WAIT 0
#define NO_LGKM_WAIT 0
#define NO_LGKM_WAIT 0
...
...
src/include/base.
hip.
hpp
→
src/include/base.hpp
View file @
05e04665
File moved
src/include/blockwise_2d_tensor_op.
hip.
hpp
→
src/include/blockwise_2d_tensor_op.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
template
<
index_t
BlockSize
,
class
Float
,
class
DstDesc
,
class
F
>
template
<
index_t
BlockSize
,
class
Float
,
class
DstDesc
,
class
F
>
__device__
void
__device__
void
...
...
src/include/blockwise_3d_tensor_op.
hip.
hpp
→
src/include/blockwise_3d_tensor_op.hpp
View file @
05e04665
#pragma once
#pragma once
#include "common.
hip.
hpp"
#include "common.hpp"
#include "ConstantTensorDescriptor.
hip.
hpp"
#include "ConstantTensorDescriptor.hpp"
template
<
index_t
BlockSize
,
template
<
index_t
BlockSize
,
class
Float
,
class
Float
,
...
...
Prev
1
2
3
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment