parse_gemm.cpp 3.27 KB
Newer Older
Paul Fultz II's avatar
Paul Fultz II committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
#include <migraphx/onnx/op_parser.hpp>
#include <migraphx/ranges.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/make_op.hpp>

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
namespace onnx {

struct parse_gemm : op_parser<parse_gemm>
{
    std::vector<op_desc> operators() const { return {{"Gemm"}}; }

    instruction_ref parse(const op_desc& /*opd*/,
                          const onnx_parser& parser,
                          onnx_parser::node_info info,
                          std::vector<instruction_ref> args) const
    {
        float alpha = 1.0f;
        float beta  = 1.0f;
        bool transa = false;
        bool transb = false;
        if(contains(info.attributes, "alpha"))
        {
            alpha = parser.parse_value(info.attributes.at("alpha")).at<float>();
        }
        if(contains(info.attributes, "beta"))
        {
            beta = parser.parse_value(info.attributes.at("beta")).at<float>();
        }
        if(contains(info.attributes, "transA"))
        {
            transa = parser.parse_value(info.attributes.at("transA")).at<bool>();
        }
        if(contains(info.attributes, "transB"))
        {
            transb = parser.parse_value(info.attributes.at("transB")).at<bool>();
        }

        std::vector<int64_t> perm(args[0]->get_shape().lens().size());
        std::iota(perm.begin(), perm.end(), int64_t{0});
        // swap the last two elements
        std::swap(*perm.rbegin(), *(perm.rbegin() + 1));

45
46
47
48
49
50
51
52
53
54
55
        auto l1 = args[0];

        if(alpha != 1.0f)
        {
            auto alpha_literal = info.add_literal(alpha);
            auto alpha_l1      = info.add_broadcastable_binary_op("mul", alpha_literal, l1);
            l1 = info.add_instruction(make_op("convert", {{"target_type", l1->get_shape().type()}}),
                                      alpha_l1);
        }

        l1      = (transa) ? info.add_instruction(make_op("transpose", {{"dims", perm}}), l1) : l1;
Paul Fultz II's avatar
Paul Fultz II committed
56
57
        auto l2 = (transb) ? info.add_instruction(make_op("transpose", {{"dims", perm}}), args[1])
                           : args[1];
58

Paul Fultz II's avatar
Paul Fultz II committed
59
60
        if(args.size() == 3)
        {
61
            if(beta != 0.0f && args[2]->get_shape().elements() > 0)
Paul Fultz II's avatar
Paul Fultz II committed
62
63
64
65
66
67
68
69
70
71
            {
                auto out_lens   = l1->get_shape().lens();
                out_lens.back() = l2->get_shape().lens().back();
                auto l3         = args[2];
                auto l3_lens    = l3->get_shape().lens();
                if(!std::equal(out_lens.begin(), out_lens.end(), l3_lens.begin(), l3_lens.end()))
                {
                    l3 = info.add_instruction(
                        make_op("multibroadcast", {{"output_lens", out_lens}}), args[2]);
                }
72
73
74
75
76
                auto beta_literal   = info.add_literal(beta);
                auto beta_broadcast = info.add_instruction(
                    make_op("multibroadcast", {{"output_lens", out_lens}}), beta_literal);
                l3 = info.add_instruction(make_op("mul"), l3, beta_broadcast);

Paul Fultz II's avatar
Paul Fultz II committed
77
                return info.add_instruction(
78
                    make_op("dot", {{"alpha", 1.0f}, {"beta", 1.0f}}), l1, l2, l3);
Paul Fultz II's avatar
Paul Fultz II committed
79
80
81
            }
        }

82
        return info.add_instruction(make_op("dot", {{"alpha", 1.0f}, {"beta", 1.0f}}), l1, l2);
Paul Fultz II's avatar
Paul Fultz II committed
83
84
85
86
87
88
    }
};

} // namespace onnx
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx