#include #include #include #include #include "utils.hpp" int main() { using InputType = float; const int64_t n = 4; // Batch size // Input const int64_t c = 64; // Number of channels const int64_t h = 16; // Height const int64_t w = 16; // Width // Filter const int64_t k = 64; // Number of filters const int64_t r = 1; // Height const int64_t s = 1; // Width // Conv param const int64_t strideH = 1; // Height stride const int64_t strideW = 1; // Width stride const int64_t padH = 0; // Height padding const int64_t padW = 0; // Width padding const int64_t dilH = 1; // Height dilation const int64_t dilW = 1; // Width dilation const int64_t outH = ((h + 2 * padH - (dilH * (r - 1) + 1)) / strideH) + 1; const int64_t outW = ((w + 2 * padW - (dilW * (s - 1) + 1)) / strideW) + 1; const int64_t g = 1; // Number of groups auto buildDeformConvBackwardGraph = [=](hipdnnHandle_t handle) { auto graph = std::make_shared(); graph->set_name("deform_conv_backward_graph") .set_io_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_intermediate_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_compute_data_type(hipdnn_frontend::DataType::FLOAT); auto image = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("image") .set_dim({n, c, h, w}) .set_stride({c * h * w, 1, c * w, c})); auto filter = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("filter") .set_dim({k, c / g, r, s}) .set_stride({c / g * r * s, 1, c / g * s, c / g})); auto loss = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("loss") .set_dim({n, k, outH, outW}) .set_stride({k * outH * outW, 1, k * outW, k})); auto offset = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("offset") .set_dim({n, 2 * g * r * s, outH, outW}) .set_stride({2 * g * r * s * outH * outW, 1, 2 * g * r * s * outW, 2 * g * r * s})); auto mask = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("mask") .set_dim({n, g * r * s, outH, outW}) .set_stride({g * r * s * outH * outW, 1, g * r * s * outW, g * r * s})); auto deformConvBwdAttributes = hipdnn_frontend::graph::DeformConvDgradAttributes() .set_name("deform_conv_backward_node") .set_padding({padH, padW}) .set_stride({strideH, strideW}) .set_dilation({dilH, dilW}) .set_x(image) .set_mask(mask); auto [dx, doffset, dmask] = graph->deform_conv_dgrad(loss, filter, offset, deformConvBwdAttributes); dx->set_output(true); doffset->set_output(true); dmask->set_output(true); // build graph HIPDNN_FE_CHECK(graph->build(handle)); return std::make_tuple(graph, image, filter, loss, offset, mask, dx, doffset, dmask); }; auto backend = hipdnn_frontend::detail::hipdnnBackend(); if(!backend) { std::cout << "Creat backend failed. \n"; return 1; } hipdnnHandle_t handle; HIPDNN_CHECK(backend->create(&handle)); auto [graph, image, filter, loss, offset, mask, dx, doffset, dmask] = buildDeformConvBackwardGraph(handle); hipdnn_data_sdk::utilities::Tensor lossTensor(loss->get_dim(), loss->get_stride()); hipdnn_data_sdk::utilities::Tensor inputTensor(image->get_dim(), image->get_stride()); hipdnn_data_sdk::utilities::Tensor filterTensor(filter->get_dim(), filter->get_stride()); hipdnn_data_sdk::utilities::Tensor offsetTensor(offset->get_dim(), offset->get_stride()); hipdnn_data_sdk::utilities::Tensor maskTensor(mask->get_dim(), mask->get_stride()); hipdnn_data_sdk::utilities::Tensor dxTensor(dx->get_dim(), dx->get_stride()); hipdnn_data_sdk::utilities::Tensor doffsetTensor(doffset->get_dim(), doffset->get_stride()); hipdnn_data_sdk::utilities::Tensor dmaskTensor(dmask->get_dim(), dmask->get_stride()); // Pixel-level offset values for each sampling point of the convolution kernel offsetTensor.fillWithRandomValues(static_cast(0.0f), static_cast(1.0f)); std::unordered_map variantPack; variantPack[loss->get_uid()] = lossTensor.memory().deviceData(); variantPack[image->get_uid()] = inputTensor.memory().deviceData(); variantPack[filter->get_uid()] = filterTensor.memory().deviceData(); variantPack[offset->get_uid()] = offsetTensor.memory().deviceData(); variantPack[mask->get_uid()] = maskTensor.memory().deviceData(); variantPack[dx->get_uid()] = dxTensor.memory().deviceData(); variantPack[doffset->get_uid()] = doffsetTensor.memory().deviceData(); variantPack[dmask->get_uid()] = dmaskTensor.memory().deviceData(); int64_t workspaceSize = 0; HIPDNN_FE_CHECK(graph->get_workspace_size(workspaceSize)); const hipdnn_data_sdk::utilities::Workspace workspace(static_cast(workspaceSize)); HIPDNN_FE_CHECK(graph->execute(handle, variantPack, workspace.get())); std::cout << "Deformable convolution backward graph execution complete.\n\n"; HIPDNN_CHECK(backend->destroy(handle)); return 0; }