#include #include #include #include #include "data_type.hpp" #include "element_wise_operation.hpp" #include "conv_fwd_util.hpp" #include "conv_util.hpp" #include "host_tensor.hpp" #include "tensor_layout.hpp" #include "check_err.hpp" // Forward declarations for conv instances. using DeviceConvFwdNoOpPtr = ck::tensor_operation::device::DeviceConvFwdPtr; namespace ck { namespace tensor_operation { namespace device { namespace device_conv1d_fwd_instance { void add_device_conv1d_fwd_xdl_nwc_kxc_nwk_bf16_instances(std::vector&); void add_device_conv1d_fwd_xdl_nwc_kxc_nwk_f16_instances(std::vector&); void add_device_conv1d_fwd_xdl_nwc_kxc_nwk_f32_instances(std::vector&); void add_device_conv1d_fwd_xdl_nwc_kxc_nwk_int8_instances(std::vector&); } // namespace device_conv1d_fwd_instance } // namespace device } // namespace tensor_operation } // namespace ck namespace { bool test_conv1D_nwc() { bool res{true}; ck::utils::conv::ConvParams params; params.num_dim_spatial = 1; params.N = 2; params.K = 16; params.C = 4; params.filter_spatial_lengths = std::vector{3}; params.input_spatial_lengths = std::vector{16}; params.conv_filter_strides = std::vector{1}; params.conv_filter_dilations = std::vector{1}; params.input_left_pads = std::vector{1}; params.input_right_pads = std::vector{1}; auto host_tensors = ck::utils::conv::get_host_tensors(params); const Tensor& input = std::get<0>(host_tensors); const Tensor& weights = std::get<1>(host_tensors); Tensor& host_output = std::get<2>(host_tensors); Tensor& device_output = std::get<3>(host_tensors); ck::utils::conv::run_reference_convolution_forward<1>(params, input, weights, host_output); test::conv::RunConv<1>(params, input, weights, device_output); res = res && ck::utils::check_err( device_output.mData, host_output.mData, "Error: incorrect results!", 1e-5f, 1e-4f); return res; } template bool test_conv1d_nwc_instances(const std::vector& conv_ptrs) { ck::utils::conv::ConvParams params; params.num_dim_spatial = 1; params.filter_spatial_lengths = std::vector{3}; params.input_spatial_lengths = std::vector{71}; params.conv_filter_strides = std::vector{2}; params.conv_filter_dilations = std::vector{1}; params.input_left_pads = std::vector{1}; params.input_right_pads = std::vector{1}; auto host_tensors = ck::utils::conv::get_host_tensors(params); const Tensor& input = std::get<0>(host_tensors); const Tensor& weights = std::get<1>(host_tensors); Tensor& host_output = std::get<2>(host_tensors); Tensor& device_output = std::get<3>(host_tensors); ck::utils::conv::run_reference_convolution_forward<1>(params, input, weights, host_output); return ck::utils::conv::run_convolution_forward_instances<1>( params, conv_ptrs, input, weights, device_output, host_output); } bool test_conv1d_nwc_bf16_instances() { std::vector conv_ptrs; ck::tensor_operation::device::device_conv1d_fwd_instance:: add_device_conv1d_fwd_xdl_nwc_kxc_nwk_bf16_instances(conv_ptrs); return test_conv1d_nwc_instances(conv_ptrs); } bool test_conv1d_nwc_f16_instances() { std::vector conv_ptrs; ck::tensor_operation::device::device_conv1d_fwd_instance:: add_device_conv1d_fwd_xdl_nwc_kxc_nwk_f16_instances(conv_ptrs); return test_conv1d_nwc_instances(conv_ptrs); } bool test_conv1d_nwc_f32_instances() { std::vector conv_ptrs; ck::tensor_operation::device::device_conv1d_fwd_instance:: add_device_conv1d_fwd_xdl_nwc_kxc_nwk_f32_instances(conv_ptrs); return test_conv1d_nwc_instances(conv_ptrs); } bool test_conv1d_nwc_int8_instances() { std::vector conv_ptrs; ck::tensor_operation::device::device_conv1d_fwd_instance:: add_device_conv1d_fwd_xdl_nwc_kxc_nwk_int8_instances(conv_ptrs); return test_conv1d_nwc_instances(conv_ptrs); } } // anonymous namespace int main() { bool res{true}; res = test_conv1D_nwc(); std::cout << "test_conv1D_nwc ..... " << (res ? "SUCCESS" : "FAILURE") << std::endl; res = test_conv1d_nwc_bf16_instances(); std::cout << "\nTestConv1DNWCBF16Instances ..... " << (res ? "SUCCESS" : "FAILURE") << std::endl; res = test_conv1d_nwc_f16_instances(); std::cout << "\ntest_conv1d_nwc_f16_instances ..... " << (res ? "SUCCESS" : "FAILURE") << std::endl; res = test_conv1d_nwc_f32_instances(); std::cout << "\ntest_conv1d_nwc_f32_instances ..... " << (res ? "SUCCESS" : "FAILURE") << std::endl; res = test_conv1d_nwc_int8_instances(); std::cout << "\ntes_tconv1_dnw_cint_8instances ..... " << (res ? "SUCCESS" : "FAILURE") << std::endl; return res ? 0 : 1; }