#include #include "hipdnn_frontend/attributes/MatmulAttributes.hpp" #include "utils.hpp" #include #include #include int main() { using InputType = hipdnn_data_sdk::types::half; const int64_t b = 2; // Batch size // Input const int64_t n = 16; // Height const int64_t m = 32; // Width auto buildMatmulBiasGraph = [=](hipdnnHandle_t handle) { auto graph = std::make_shared(); graph->set_name("matmul_bias_graph") .set_io_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_intermediate_data_type(hipdnn_frontend::getDataTypeEnumFromType()) .set_compute_data_type(hipdnn_frontend::DataType::FLOAT); // create matmul auto inputA = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("input_a") .set_dim({b, n, m}) .set_stride({n * m, m, 1})); auto inputB = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("input_b") .set_dim({b, m, n}) .set_stride({n * m, n, 1})); auto matmulAttributes = hipdnn_frontend::graph::MatmulAttributes().set_name("matmul_node"); auto matmulOutput = graph->matmul(inputA, inputB, matmulAttributes); // create bias auto bias = std::make_shared( hipdnn_frontend::graph::Tensor_attributes() .set_name("bias") .set_dim({1, 1, n}) .set_stride({n, n, 1})); auto biasAttributes = hipdnn_frontend::graph::PointwiseAttributes() .set_name("bias_node") .set_mode(hipdnn_frontend::PointwiseMode_t::ADD); auto biasOutput = graph->pointwise(matmulOutput, bias, biasAttributes); // create swish auto swishAttributes = hipdnn_frontend::graph::PointwiseAttributes() .set_name("swish_node") .set_mode(hipdnn_frontend::PointwiseMode_t::SWISH_FWD) .set_swish_beta(1.0f); auto output = graph->pointwise(biasOutput, swishAttributes); output->set_output(true); // build graph HIPDNN_FE_CHECK(graph->build(handle)); return std::make_tuple(graph, inputA, inputB, bias, output); }; auto backend = hipdnn_frontend::detail::hipdnnBackend(); if(!backend) { std::cout << "Creat backend failed. \n"; return 1; } hipdnnHandle_t handle; HIPDNN_CHECK(backend->create(&handle)); auto [graph, inputA, inputB, bias, output] = buildMatmulBiasGraph(handle); // Allocate DCU memory hipdnn_data_sdk::utilities::Tensor inputATensor(inputA->get_dim(), inputA->get_stride()); hipdnn_data_sdk::utilities::Tensor inputBTensor(inputB->get_dim(), inputB->get_stride()); hipdnn_data_sdk::utilities::Tensor biasTensor(bias->get_dim(), bias->get_stride()); hipdnn_data_sdk::utilities::Tensor outTensor(output->get_dim(), output->get_stride()); std::unordered_map variantPack; variantPack[inputA->get_uid()] = inputATensor.memory().deviceData(); variantPack[inputB->get_uid()] = inputBTensor.memory().deviceData(); variantPack[bias->get_uid()] = biasTensor.memory().deviceData(); variantPack[output->get_uid()] = outTensor.memory().deviceData(); int64_t workspaceSize = 0; HIPDNN_FE_CHECK(graph->get_workspace_size(workspaceSize)); const hipdnn_data_sdk::utilities::Workspace workspace(static_cast(workspaceSize)); HIPDNN_FE_CHECK(graph->execute(handle, variantPack, workspace.get())); std::cout << "Matmul_bias_swish graph execution complete. \n"; HIPDNN_CHECK(backend->destroy(handle)); return 0; }