Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
yangql
composable_kernel-1
Commits
81497a93
Commit
81497a93
authored
Jun 11, 2019
by
Chao Liu
Browse files
reorganize files
parent
88b77181
Changes
59
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
95 additions
and
92 deletions
+95
-92
CMakeLists.txt
CMakeLists.txt
+4
-1
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
+1
-1
driver/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
...er/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
+4
-4
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
...er/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
+2
-2
driver/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
...er/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
+2
-2
driver/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
...er/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
+2
-2
driver/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
...er/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
+2
-2
driver/device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
...device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
+1
-1
driver/device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
...ice_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
+1
-1
driver/driver.cpp
driver/driver.cpp
+2
-2
include/composable_kernel/kernel_algorithm/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
...gorithm/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
+6
-6
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
+8
-8
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
+9
-9
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
...ridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
+8
-8
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp
...n_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp
+8
-8
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp
...ridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp
+8
-8
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp
...n_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp
+8
-8
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
.../gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
+6
-6
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp
...ion_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp
+7
-7
include/composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
.../gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
+6
-6
No files found.
CMakeLists.txt
View file @
81497a93
...
@@ -45,6 +45,9 @@ elseif(DEVICE_BACKEND STREQUAL "CUDA")
...
@@ -45,6 +45,9 @@ elseif(DEVICE_BACKEND STREQUAL "CUDA")
endif
()
endif
()
#
#
include_directories
(
BEFORE src/include
${
PROJECT_BINARY_DIR
}
/src/include
)
include_directories
(
BEFORE
include
${
PROJECT_BINARY_DIR
}
/include
)
add_subdirectory
(
src
)
add_subdirectory
(
src
)
add_subdirectory
(
driver
)
add_subdirectory
(
driver
)
driver/device_convolution_direct_v2_nchw_kcyx_nkhw.hpp
View file @
81497a93
...
@@ -2,7 +2,7 @@
...
@@ -2,7 +2,7 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp
View file @
81497a93
...
@@ -2,10 +2,10 @@
...
@@ -2,10 +2,10 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_convolution_implicit_gemm_v1_nchw_cyxk_nkhw.hpp
View file @
81497a93
...
@@ -2,8 +2,8 @@
...
@@ -2,8 +2,8 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
View file @
81497a93
...
@@ -2,8 +2,8 @@
...
@@ -2,8 +2,8 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp"
#include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
View file @
81497a93
...
@@ -2,8 +2,8 @@
...
@@ -2,8 +2,8 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp
View file @
81497a93
...
@@ -2,8 +2,8 @@
...
@@ -2,8 +2,8 @@
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp"
#include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp"
#include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw_lds_double_buffer.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw_lds_double_buffer.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp
View file @
81497a93
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/device_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp
View file @
81497a93
#pragma once
#pragma once
#include <unistd.h>
#include <unistd.h>
#include "device.hpp"
#include "device.hpp"
#include "gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp"
#include "
composable_kernel/kernel_algorithm/
gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp"
using
namespace
ck
;
using
namespace
ck
;
...
...
driver/driver.cpp
View file @
81497a93
...
@@ -3,9 +3,9 @@
...
@@ -3,9 +3,9 @@
#include <initializer_list>
#include <initializer_list>
#include <cstdlib>
#include <cstdlib>
#include <stdlib.h>
#include <stdlib.h>
#include "config.hpp"
#include "composable_kernel/utility/config.hpp"
#include "composable_kernel/tensor_description/ConstantTensorDescriptor.hpp"
#include "tensor.hpp"
#include "tensor.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "conv_common.hpp"
#include "conv_common.hpp"
#include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
#include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
#include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp"
#include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp"
...
...
src/
include/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_DIRECT_V2_NCHW_KCYX_NKHW
#ifndef CK_GRIDWISE_CONVOLUTION_DIRECT_V2_NCHW_KCYX_NKHW
#define CK_GRIDWISE_CONVOLUTION_DIRECT_V2_NCHW_KCYX_NKHW
#define CK_GRIDWISE_CONVOLUTION_DIRECT_V2_NCHW_KCYX_NKHW
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_direct_convolution.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_direct_convolution.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R1_CHWN_CYXK_KHWN
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R1_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R1_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R1_CHWN_CYXK_KHWN
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R2_CHWN_CYXK_KHWN
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R2_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R2_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R2_CHWN_CYXK_KHWN
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_3d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_3d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_4d_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_tensor_slice_copy.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_generic_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_generic_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW_LDS_DOUBLE_BUFFER
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V1R3_NCHW_CYXK_NKHW_LDS_DOUBLE_BUFFER
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_tensor_slice_copy.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "threadwise_generic_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_generic_tensor_op.hpp"
#include "blockwise_batched_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_batched_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "blockwise_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V2_CHWN_CYXK_KHWN_LDS_DOUBLE_BUFFER
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_4d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_4d_tensor_op.hpp"
#include "blockwise_2d_tensor_op.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_2d_tensor_op.hpp"
#include "threadwise_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
threadwise_tensor_slice_copy.hpp"
#include "blockwise_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
src/
include/gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
→
include/
composable_kernel/kernel_algorithm/
gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp
View file @
81497a93
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V3_NCHW_CYXK_NKHW
#ifndef CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V3_NCHW_CYXK_NKHW
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V3_NCHW_CYXK_NKHW
#define CK_GRIDWISE_CONVOLUTION_IMPLICIT_GEMM_V3_NCHW_CYXK_NKHW
#include "common.hpp"
#include "
composable_kernel/utility/
common.hpp"
#include "ConstantTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantTensorDescriptor.hpp"
#include "ConstantMergedTensorDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMergedTensorDescriptor.hpp"
#include "ConstantMatrixDescriptor.hpp"
#include "
composable_kernel/tensor_description/
ConstantMatrixDescriptor.hpp"
#include "blockwise_generic_tensor_slice_copy.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_generic_tensor_slice_copy.hpp"
#include "blockwise_gemm.hpp"
#include "
composable_kernel/tensor_operation/
blockwise_gemm.hpp"
namespace
ck
{
namespace
ck
{
...
...
Prev
1
2
3
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment