// direct_convolution.cuh
#pragma once
#include "device_tensor.cuh"

// Kernel entry point for direct convolution.
//
// Template parameters:
//   TFloat    - element type pointed to by p_in, p_wei and p_out.
//   NBlockDim - compile-time integer; not referenced by the current body.
//               NOTE(review): presumably the thread-block dimension — confirm
//               against the launch site.
//
// Parameters (roles inferred from the names only — TODO confirm with callers):
//   in_desc,  p_in  - descriptor and data pointer, presumably the input tensor.
//   wei_desc, p_wei - descriptor and data pointer, presumably the weight tensor.
//   out_desc, p_out - descriptor and data pointer, presumably the output tensor.
//
// The body is currently empty: launching this kernel reads and writes nothing.
template <class TFloat, int NBlockDim>
__global__ void direct_convolution(DeviceTensorDescriptor in_desc,
                                   TFloat* const p_in,
                                   DeviceTensorDescriptor wei_desc,
                                   TFloat* const p_wei,
                                   DeviceTensorDescriptor out_desc,
                                   TFloat* p_out)
{
    // Intentionally empty: no convolution logic is implemented yet.
}