#pragma once

// Kernel entry point that forwards to a gridwise convolution functor.
//
// A GridwiseConvolution object is value-initialized inside the kernel and its
// Run() member is called with the three pointers, unchanged. All of the actual
// work happens inside GridwiseConvolution::Run; this wrapper adds no indexing,
// bounds checks or synchronization of its own.
//
// Template parameters:
//   GridwiseConvolution - functor type. It must be value-initializable in
//                         device code and provide a Run(const T*, const T*, T*)
//                         member callable from device code.
//   T                   - element type of the three buffers.
//
// Parameters:
//   (unnamed)     - tag argument used only so GridwiseConvolution can be
//                   deduced at the launch site; its value is never read.
//   p_in_global   - read-only pointer passed as the first argument to Run().
//   p_wei_global  - read-only pointer passed as the second argument to Run().
//   p_out_global  - writable pointer passed as the third argument to Run().
//
// The pointers are declared __restrict__, so the caller promises they do not
// alias each other.
// NOTE(review): the "_global" suffix suggests device global-memory buffers for
// the convolution input, weights and output - confirm against the launch site
// and the concrete GridwiseConvolution type.
// NOTE(review): the template parameter order <GridwiseConvolution, T> was
// reconstructed; both parameters are deducible from the call arguments, but
// confirm the order if any caller passes explicit template arguments.
template <class GridwiseConvolution, class T>
__global__ void run_gridwise_convolution(GridwiseConvolution,
                                         const T* const __restrict__ p_in_global,
                                         const T* const __restrict__ p_wei_global,
                                         T* const __restrict__ p_out_global)
{
    // The functor is rebuilt here rather than taken from the tag argument.
    GridwiseConvolution{}.Run(p_in_global, p_wei_global, p_out_global);
}