parse_gemm.cpp 3.51 KB
Newer Older
Paul Fultz II's avatar
Paul Fultz II committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
#include <migraphx/onnx/op_parser.hpp>
#include <migraphx/ranges.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/make_op.hpp>

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
namespace onnx {

struct parse_gemm : op_parser<parse_gemm>
{
    std::vector<op_desc> operators() const { return {{"Gemm"}}; }

    instruction_ref parse(const op_desc& /*opd*/,
                          const onnx_parser& parser,
                          onnx_parser::node_info info,
                          std::vector<instruction_ref> args) const
    {
        float alpha = 1.0f;
        float beta  = 1.0f;
        bool transa = false;
        bool transb = false;
        if(contains(info.attributes, "alpha"))
        {
            alpha = parser.parse_value(info.attributes.at("alpha")).at<float>();
        }
        if(contains(info.attributes, "beta"))
        {
            beta = parser.parse_value(info.attributes.at("beta")).at<float>();
        }
        if(contains(info.attributes, "transA"))
        {
            transa = parser.parse_value(info.attributes.at("transA")).at<bool>();
        }
        if(contains(info.attributes, "transB"))
        {
            transb = parser.parse_value(info.attributes.at("transB")).at<bool>();
        }

        std::vector<int64_t> perm(args[0]->get_shape().lens().size());
        std::iota(perm.begin(), perm.end(), int64_t{0});
        // swap the last two elements
        std::swap(*perm.rbegin(), *(perm.rbegin() + 1));

Shucai Xiao's avatar
Shucai Xiao committed
45
46
        auto l1       = args[0];
        auto dot_type = l1->get_shape().type();
47
48
49
50

        if(alpha != 1.0f)
        {
            auto alpha_literal = info.add_literal(alpha);
Shucai Xiao's avatar
Shucai Xiao committed
51
52
53
54
55
            l1                 = info.add_broadcastable_binary_op("mul", alpha_literal, l1);
            if(l1->get_shape().type() != dot_type)
            {
                l1 = info.add_instruction(make_op("convert", {{"target_type", dot_type}}), l1);
            }
56
57
        }

58
59
60
61
62
        l1 =
            (transa) ? info.add_instruction(make_op("transpose", {{"permutation", perm}}), l1) : l1;
        auto l2 = (transb)
                      ? info.add_instruction(make_op("transpose", {{"permutation", perm}}), args[1])
                      : args[1];
63

64
        auto ret = info.add_instruction(make_op("dot", {{"alpha", 1.0f}, {"beta", 0.0f}}), l1, l2);
turneram's avatar
turneram committed
65

Paul Fultz II's avatar
Paul Fultz II committed
66
67
        if(args.size() == 3)
        {
turneram's avatar
turneram committed
68
            if(not float_equal(beta, 0.0f) && args[2]->get_shape().elements() > 0)
Paul Fultz II's avatar
Paul Fultz II committed
69
70
71
72
73
74
75
            {
                auto out_lens   = l1->get_shape().lens();
                out_lens.back() = l2->get_shape().lens().back();
                auto l3         = args[2];
                auto l3_lens    = l3->get_shape().lens();
                if(!std::equal(out_lens.begin(), out_lens.end(), l3_lens.begin(), l3_lens.end()))
                {
76
77
                    l3 = info.add_instruction(make_op("multibroadcast", {{"out_lens", out_lens}}),
                                              args[2]);
Paul Fultz II's avatar
Paul Fultz II committed
78
                }
Shucai Xiao's avatar
Shucai Xiao committed
79
80
81
82
83
84
85
                auto beta_literal = info.add_literal(beta);
                auto beta_l3      = info.add_broadcastable_binary_op("mul", l3, beta_literal);
                if(beta_l3->get_shape().type() != dot_type)
                {
                    beta_l3 = info.add_instruction(make_op("convert", {{"target_type", dot_type}}),
                                                   beta_l3);
                }
86

turneram's avatar
turneram committed
87
                return info.add_instruction(make_op("add"), ret, beta_l3);
Paul Fultz II's avatar
Paul Fultz II committed
88
89
90
            }
        }

turneram's avatar
turneram committed
91
        return ret;
Paul Fultz II's avatar
Paul Fultz II committed
92
93
94
95
96
97
    }
};

} // namespace onnx
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx