gridwise_convolution_kernel_wrapper.hpp 488 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
#ifndef CK_GRIDWISE_CONVOLUTION_KERNEL_WRAPPER
#define CK_GRIDWISE_CONVOLUTION_KERNEL_WRAPPER

// Generic kernel entry point for a gridwise convolution functor.
//
// The body value-initializes a GridwiseConvolution object and forwards the
// three pointers, unchanged and in the same order, to its Run() member.
// All of the actual work is delegated to GridwiseConvolution::Run.
//
// Template parameters:
//   GridwiseConvolution - type that can be value-initialized with `{}` and
//                         exposes Run(const T*, const T*, T*).
//   T                   - element type shared by the three buffers.
//
// Parameters:
//   p_in_global  - read-only input buffer.
//   p_wei_global - read-only second input buffer (presumably the convolution
//                  weights, judging by the name; confirm against the
//                  GridwiseConvolution implementation).
//   p_out_global - writable output buffer.
//
// Every pointer is qualified __restrict__, so callers must not pass buffers
// that alias one another.
// NOTE(review): the `_global` suffix suggests the buffers are expected to
// live in device global memory; nothing in this wrapper enforces that.
template <typename GridwiseConvolution, typename T>
__global__ void run_gridwise_convolution_kernel(const T* const __restrict__ p_in_global,
                                                const T* const __restrict__ p_wei_global,
                                                T* const __restrict__ p_out_global)
{
    GridwiseConvolution gridwise_conv{};
    gridwise_conv.Run(p_in_global, p_wei_global, p_out_global);
}

#endif