/* * The MIT License (MIT) * * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * in the Software without restriction, including without limitation the rights * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN * THE SOFTWARE. */ #include #include #include #include namespace migraphx { inline namespace MIGRAPHX_INLINE_NS { namespace onnx { struct parse_gemm : op_parser { std::vector operators() const { return {{"Gemm"}}; } instruction_ref parse(const op_desc& /*opd*/, const onnx_parser& parser, onnx_parser::node_info info, std::vector args) const { auto A = args[0]; auto B = args[1]; if(A->get_shape().ndim() != 2 or B->get_shape().ndim() != 2) { MIGRAPHX_THROW("PARSE_GEMM: A and B should be rank 2, A is rank " + std::to_string(A->get_shape().ndim()) + "B is rank " + std::to_string(B->get_shape().ndim())); } float alpha = 1.0f; float beta = 1.0f; bool transa = false; bool transb = false; if(contains(info.attributes, "alpha")) { alpha = parser.parse_value(info.attributes.at("alpha")).at(); } if(contains(info.attributes, "beta")) { beta = parser.parse_value(info.attributes.at("beta")).at(); } if(contains(info.attributes, "transA")) { transa = parser.parse_value(info.attributes.at("transA")).at(); } if(contains(info.attributes, "transB")) { transb = parser.parse_value(info.attributes.at("transB")).at(); } std::vector perm(2); std::iota(perm.begin(), perm.end(), int64_t{0}); // swap the last two elements std::swap(*perm.rbegin(), *(perm.rbegin() + 1)); auto dot_type = A->get_shape().type(); if(alpha != 1.0f) { auto alpha_literal = info.add_literal(alpha); A = info.add_broadcastable_binary_op("mul", alpha_literal, A); if(A->get_shape().type() != dot_type) { A = info.add_instruction(make_op("convert", {{"target_type", dot_type}}), A); } } A = (transa) ? info.add_instruction(make_op("transpose", {{"permutation", perm}}), A) : A; B = (transb) ? info.add_instruction(make_op("transpose", {{"permutation", perm}}), args[1]) : args[1]; auto ret = info.add_instruction(make_op("dot"), A, B); if(args.size() == 3) { // TODO: support dynamic C input if(std::any_of(args.cbegin(), args.cend(), [](auto in_arg) { return in_arg->get_shape().dynamic(); })) { MIGRAPHX_THROW("PARSE_GEMM: C input not handled for dynamic input shapes"); } if(not float_equal(beta, 0.0f) and args[2]->get_shape().elements() > 0) { auto out_lens = A->get_shape().lens(); out_lens.back() = B->get_shape().lens().back(); auto C = args[2]; auto C_lens = C->get_shape().lens(); if(not std::equal(out_lens.begin(), out_lens.end(), C_lens.begin(), C_lens.end())) { C = info.add_instruction(make_op("multibroadcast", {{"out_lens", out_lens}}), args[2]); } auto beta_literal = info.add_literal(beta); auto beta_C = info.add_broadcastable_binary_op("mul", C, beta_literal); if(beta_C->get_shape().type() != dot_type) { beta_C = info.add_instruction(make_op("convert", {{"target_type", dot_type}}), beta_C); } return info.add_instruction(make_op("add"), ret, beta_C); } } return ret; } }; } // namespace onnx } // namespace MIGRAPHX_INLINE_NS } // namespace migraphx