// gridwise_convolution_wrapper.hip.hpp
#pragma once

template <class GridwiseConvolution, class T>
4
__global__ void run_gridwise_convolution(const T* const __restrict__ p_in_global,
5
6
7
8
9
                                         const T* const __restrict__ p_wei_global,
                                         T* const __restrict__ p_out_global)
{
    GridwiseConvolution{}.Run(p_in_global, p_wei_global, p_out_global);
}