#pragma once
#include "constant_tensor_descriptor.cuh"

// Device function named for a blockwise Winograd transform of the input.
//
// What the body actually does: it stores the value 1 into element 0 of
// `p_in_transform` and returns. `p_in` is never read, and no thread or block
// index is consulted, so every thread that calls this performs the same store.
// NOTE(review): this looks like a placeholder/stub rather than a finished
// transform - confirm before relying on its output.
//
// Parameters:
//   p_in            - const pointer (the pointee itself is not const-qualified),
//                     marked __restrict__; unused in the body.
//   p_in_transform  - output pointer, marked __restrict__; only element 0 is
//                     written.
//
// NOTE(review): in this view the `template` keyword is not followed by a
// `<...>` parameter list, although `TFloat` is used below. Presumably the list
// was lost when the text was extracted - restore it from the original source
// before compiling.
template __device__ void blockwise_winograd_transform_input(TFloat* const __restrict__ p_in,
                                                            TFloat* __restrict__ p_in_transform)
{
    // Only the first output element is touched; the integer literal 1 is
    // converted to TFloat by the assignment.
    p_in_transform[0] = 1;
}

// Device function named for a blockwise Winograd transform of the weights.
//
// What the body actually does: it stores the value 1 into element 0 of
// `p_wei_transform` and returns. `p_wei` is never read, and no thread or block
// index is consulted, so every thread that calls this performs the same store.
// NOTE(review): this looks like a placeholder/stub rather than a finished
// transform - confirm before relying on its output.
//
// Parameters:
//   p_wei            - const pointer (the pointee itself is not const-qualified),
//                      marked __restrict__; unused in the body.
//   p_wei_transform  - output pointer, marked __restrict__; only element 0 is
//                      written.
//
// NOTE(review): as with the input variant, the `template` keyword has no
// visible `<...>` parameter list here even though `TFloat` is used - presumably
// lost in extraction; restore it from the original source before compiling.
template __device__ void blockwise_winograd_transform_weight(TFloat* const __restrict__ p_wei,
                                                             TFloat* __restrict__ p_wei_transform)
{
    // Only the first output element is touched; the integer literal 1 is
    // converted to TFloat by the assignment.
    p_wei_transform[0] = 1;
}