Commit 1566b317 authored by Chao Liu
Browse files

reorganized files

parent c82b833d
#ifndef CK_FUNCTIONAL2_HPP #ifndef CK_FUNCTIONAL2_HPP
#define CK_FUNCTIONAL2_HPP #define CK_FUNCTIONAL2_HPP
#include "composable_kernel/utility/functional.hpp" #include "functional.hpp"
#include "composable_kernel/utility/Sequence.hpp" #include "Sequence.hpp"
namespace ck { namespace ck {
......
#ifndef CK_FUNCTIONAL3_HPP #ifndef CK_FUNCTIONAL3_HPP
#define CK_FUNCTIONAL3_HPP #define CK_FUNCTIONAL3_HPP
#include "composable_kernel/utility/functional.hpp" #include "functional.hpp"
#include "composable_kernel/utility/functional2.hpp" #include "functional2.hpp"
#include "composable_kernel/utility/Sequence.hpp" #include "Sequence.hpp"
#include "composable_kernel/utility/Array.hpp" #include "Array.hpp"
namespace ck { namespace ck {
......
#ifndef CK_UTILITY_HPP #ifndef CK_UTILITY_HPP
#define CK_UTILITY_HPP #define CK_UTILITY_HPP
#include "config.hpp"
namespace ck { namespace ck {
__device__ index_t get_thread_local_1d_id() { return threadIdx.x; } __device__ index_t get_thread_local_1d_id() { return threadIdx.x; }
......
#ifndef CK_VECTOR_TYPE_HPP #ifndef CK_VECTOR_TYPE_HPP
#define CK_VECTOR_TYPE_HPP #define CK_VECTOR_TYPE_HPP
#include "composable_kernel/utility/config.hpp" #include "config.hpp"
#include "composable_kernel/utility/integral_constant.hpp" #include "integral_constant.hpp"
namespace ck { namespace ck {
......
set(TENSOR_SOURCE
src/tensor.cpp;
src/device.cpp;
)
add_library(tensor SHARED ${TENSOR_SOURCE})
target_compile_features(tensor PUBLIC)
set_target_properties(tensor PROPERTIES POSITION_INDEPENDENT_CODE ON)
if(DEVICE_BACKEND STREQUAL "NVIDIA")
target_link_libraries(tensor nvToolsExt cudart)
endif()
install(TARGETS tensor LIBRARY DESTINATION lib)
if(DEVICE_BACKEND STREQUAL "AMD") if(DEVICE_BACKEND STREQUAL "AMD")
set(DRIVER_SOURCE driver.cpp) set(DRIVER_SOURCE src/driver.cpp)
elseif(DEVICE_BACKEND STREQUAL "NVIDIA") elseif(DEVICE_BACKEND STREQUAL "NVIDIA")
set(DRIVER_SOURCE driver.cu) set(DRIVER_SOURCE src/driver.cu)
endif() endif()
add_executable(driver ${DRIVER_SOURCE}) add_executable(driver ${DRIVER_SOURCE})
......
#ifndef CK_CONV_COMMON_HPP #ifndef CK_CONV_COMMON_HPP
#define CK_CONV_COMMON_HPP #define CK_CONV_COMMON_HPP
#include "composable_kernel/tensor_description/ConstantTensorDescriptor.hpp" #include "ConstantTensorDescriptor.hpp"
using namespace ck; using namespace ck;
......
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
#define CK_DEVICE_HPP #define CK_DEVICE_HPP
#include <memory> #include <memory>
#include "composable_kernel/utility/config.hpp" #include "config.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp" #include "gridwise_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp" #include "gridwise_convolution_implicit_gemm_v1r1_chwn_cyxk_khwn.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp" #include "gridwise_convolution_implicit_gemm_v1r2_chwn_cyxk_khwn.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp" #include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp" #include "gridwise_convolution_implicit_gemm_v1r3_chwn_cyxk_khwn_lds_double_buffer.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp" #include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp" #include "gridwise_convolution_implicit_gemm_v1r3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp" #include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp" #include "gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp" #include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw_lds_double_buffer.hpp" #include "gridwise_convolution_implicit_gemm_v3_nchw_cyxk_nkhw_lds_double_buffer.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "tensor.hpp"
#include "gridwise_convolution_kernel_wrapper.hpp" #include "gridwise_convolution_kernel_wrapper.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp" #include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw_lds_double_buffer.hpp" #include "gridwise_convolution_implicit_gemm_v4_nchw_kcyx_nkhw_lds_double_buffer.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp" #include "tensor.hpp"
#include "gridwise_direct_convolution_2_vectorized_nchw_kcyx_nkhw.hpp"
using namespace ck; using namespace ck;
......
#pragma once #pragma once
#include <unistd.h> #include <unistd.h>
#include "device.hpp" #include "device.hpp"
#include "composable_kernel/kernel_algorithm/gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp" #include "tensor.hpp"
#include "gridwise_implicit_gemm_convolution_1_chwn_cyxk_khwn_padded.hpp"
using namespace ck; using namespace ck;
......
#include "composable_kernel/utility/config.hpp" #include "config.hpp"
#include "device.hpp" #include "device.hpp"
DeviceMem::DeviceMem(std::size_t mem_size) : mMemSize(mem_size) DeviceMem::DeviceMem(std::size_t mem_size) : mMemSize(mem_size)
......
...@@ -3,9 +3,9 @@ ...@@ -3,9 +3,9 @@
#include <initializer_list> #include <initializer_list>
#include <cstdlib> #include <cstdlib>
#include <stdlib.h> #include <stdlib.h>
#include "composable_kernel/utility/config.hpp" #include "config.hpp"
#include "composable_kernel/tensor_description/ConstantTensorDescriptor.hpp" #include "ConstantTensorDescriptor.hpp"
#include "tensor.hpp" #include "device.hpp"
#include "conv_common.hpp" #include "conv_common.hpp"
#include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp" #include "device_convolution_direct_v2_nchw_kcyx_nkhw.hpp"
#include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp" #include "device_convolution_implicit_gemm_v1_chwn_cyxk_khwn.hpp"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment