#include #include "utils.hpp" #include #include #include int main() { using InputType = hipdnn_data_sdk::types::half; const int64_t n = 2; // Batch size // Input const int64_t c = 32; // Number of channels const int64_t h = 32; // Height const int64_t w = 32; // Width std::vector blockSize = {1, 32}; const int64_t scaleW = w / blockSize[1]; auto buildBlockScaleDequantizeGraph = [=](hipdnnHandle_t handle) { auto graph = std::make_shared(); graph->set_name("block_scale_dequantize_graph") .set_io_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_intermediate_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_compute_data_type(hipdnn_frontend::DataType::FLOAT); auto x = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("x") .set_dim({n, c, h, w}) .set_stride({c * h * w, 1, c * w, c})); auto scale = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("scale") .set_dim({n, c, h, scaleW}) .set_stride({c * h * scaleW, 1, c * scaleW, c})); auto blockScaleDequantizeAttributes = hipdnn_frontend::graph::BlockScaleDequantizeAttributes() .set_name("block_scale_dequantize_node") .set_block_size(blockSize) .set_is_negative_scale(true); auto y = graph->block_scale_dequantize(x, scale, blockScaleDequantizeAttributes); y->set_output(true); // build graph HIPDNN_FE_CHECK(graph->build(handle)); return std::make_tuple(graph, x, scale, y); }; auto backend = hipdnn_frontend::detail::hipdnnBackend(); if(!backend) { std::cout << "Creat backend failed. \n"; return 1; } hipdnnHandle_t handle; HIPDNN_CHECK(backend->create(&handle)); auto [graph, x, scale, y] = buildBlockScaleDequantizeGraph(handle); hipdnn_data_sdk::utilities::Tensor xTensor(x->get_dim(), x->get_stride()); hipdnn_data_sdk::utilities::Tensor scaleTensor(scale->get_dim(), scale->get_stride()); hipdnn_data_sdk::utilities::Tensor yTensor(y->get_dim(), y->get_stride()); int64_t workspaceSize = 0; HIPDNN_FE_CHECK(graph->get_workspace_size(workspaceSize)); const hipdnn_data_sdk::utilities::Workspace workspace(static_cast(workspaceSize)); std::unordered_map variantPack; variantPack[x->get_uid()] = xTensor.memory().deviceData(); variantPack[scale->get_uid()] = scaleTensor.memory().deviceData(); variantPack[y->get_uid()] = yTensor.memory().deviceData(); HIPDNN_FE_CHECK(graph->execute(handle, variantPack, workspace.get())); std::cout << "\nBlockScaleDequantize graph execution complete. \n"; HIPDNN_CHECK(backend->destroy(handle)); return 0; }