fuse_ck.cpp 4.24 KB
Newer Older
Paul's avatar
Paul committed
1
2
3
4
5
#include <migraphx/gpu/fuse_ck.hpp>
#include <migraphx/matcher.hpp>
#include <migraphx/pass_manager.hpp>
#include <migraphx/make_op.hpp>
#include <migraphx/register_op.hpp>
Paul's avatar
Paul committed
6
#include <migraphx/env.hpp>
Paul's avatar
Paul committed
7
8
9
10

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {

Paul's avatar
Paul committed
11
12
13
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_CK_GEMM);
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_CK_GEMM_FUSION);

Paul's avatar
Paul committed
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
struct module;

namespace gpu {

struct ck_gemm
{
    operation op = make_op("dot");

    template <class Self, class F>
    static auto reflect(Self& self, F f)
    {
        return pack(f(self.op, "op"));
    }

    std::string name() const { return "gpu::ck_gemm"; }
Paul's avatar
Paul committed
29
30
31

    void check_gemm_shape(const shape& s) const
    {
Paul's avatar
Format  
Paul committed
32
        if(not contains(range(s.strides().rbegin(), s.strides().rbegin() + 3), 1))
Paul's avatar
Paul committed
33
34
35
            MIGRAPHX_THROW("Invalid shape for ck_gemm");
    }

Paul's avatar
Paul committed
36
37
    shape compute_shape(std::vector<shape> inputs, const std::vector<module_ref>& mods) const
    {
Paul's avatar
Paul committed
38
        check_shapes{inputs, *this}.same_ndims();
Paul's avatar
Paul committed
39
40
41
42
        // if(mods.size() != 1)
        //     MIGRAPHX_THROW("should have one submodule.");
        if(inputs.size() < 2)
            MIGRAPHX_THROW("should have at least two inputs.");
Paul's avatar
Paul committed
43
44
        auto a = inputs[0];
        auto b = inputs[1];
Paul's avatar
Format  
Paul committed
45
        for(const auto& input : inputs)
Paul's avatar
Paul committed
46
            check_gemm_shape(input);
Paul's avatar
Paul committed
47
        auto r = op.compute_shape({a, b});
Paul's avatar
Format  
Paul committed
48
        if(mods.empty())
Paul's avatar
Paul committed
49
50
            return r;
        return r.with_type(mods.front()->get_output_shapes().front().type());
Paul's avatar
Paul committed
51
52
53
54
55
56
57
58
59
60
61
62
    }
};
MIGRAPHX_REGISTER_OP(ck_gemm);

namespace {

MIGRAPHX_PRED_MATCHER(is_ck_gemm, instruction_ref ins)
{
    if(ins->name() != "dot")
        return false;
    auto a = ins->inputs().front()->get_shape();
    auto b = ins->inputs().back()->get_shape();
Paul's avatar
Paul committed
63
    if(a.lens().back() > 2048)
Paul's avatar
Paul committed
64
        return false;
Paul's avatar
Paul committed
65
    return true;
Paul's avatar
Paul committed
66
67
}

Paul's avatar
Paul committed
68
struct find_ck_gemm_pointwise
Paul's avatar
Paul committed
69
{
Paul's avatar
Paul committed
70
    // Find a gemm followed by a pointwise operation.
Paul's avatar
Format  
Paul committed
71
72
73
74
    auto matcher() const
    {
        auto gemm =
            match::skip(match::name("contiguous"))(match::name("dot")(is_ck_gemm().bind("gemm")));
Paul's avatar
Paul committed
75
76
        return match::name("pointwise")(match::any_of[match::inputs()](gemm.bind("x")));
    }
Paul's avatar
Paul committed
77
78
79

    void apply(module_pass_manager& mpm, const match::matcher_result& r) const
    {
Paul's avatar
Paul committed
80
81
82
83
84
85
        auto ins      = r.result;
        auto gemm_ins = r.instructions["gemm"];
        auto x_ins    = r.instructions["x"]; // input after contiguous
        auto* pm      = ins->module_inputs().front();
        auto names    = pm->get_parameter_names();
        std::sort(names.begin(), names.end());
Paul's avatar
Format  
Paul committed
86
87
        auto inputs   = ins->inputs();
        auto gemm_it  = std::find(inputs.begin(), inputs.end(), x_ins);
Paul's avatar
Paul committed
88
89
        auto gemm_idx = gemm_it - inputs.begin();
        assert(gemm_it != inputs.end());
Paul's avatar
Format  
Paul committed
90
        if(ins->get_shape().type() != shape::half_type)
Paul's avatar
Paul committed
91
            return;
Paul's avatar
Format  
Paul committed
92
        if(gemm_idx != 0)
Paul's avatar
Paul committed
93
        {
Paul's avatar
Format  
Paul committed
94
95
            auto first_param    = pm->get_parameter(names[0]);
            auto gemm_param     = pm->get_parameter(names[gemm_idx]);
Paul's avatar
Paul committed
96
            auto new_gemm_param = pm->add_parameter(names[0] + ".0", gemm_param->get_shape());
Paul's avatar
Format  
Paul committed
97
98
            auto new_first_param =
                pm->add_parameter(names[gemm_idx] + ".0", first_param->get_shape());
Paul's avatar
Paul committed
99
100
101
102
103
104
105
106
107
            pm->replace_instruction(gemm_param, new_gemm_param);
            pm->replace_instruction(first_param, new_first_param);
            pm->remove_instruction(first_param);
            pm->remove_instruction(gemm_param);
        }
        inputs.erase(gemm_it);
        inputs.insert(inputs.begin(), gemm_ins->inputs().begin(), gemm_ins->inputs().end());

        mpm.get_module().replace_instruction(ins, ck_gemm{}, inputs, {pm});
Paul's avatar
Paul committed
108
109
110
    }
};

Paul's avatar
Paul committed
111
112
113
114
115
116
117
118
119
120
121
struct find_ck_gemm
{
    auto matcher() const { return match::name("dot")(is_ck_gemm().bind("gemm")); }

    void apply(module_pass_manager& mpm, const match::matcher_result& r) const
    {
        auto ins = r.result;
        mpm.get_module().replace_instruction(ins, ck_gemm{ins->get_operator()}, ins->inputs());
    }
};

Paul's avatar
Paul committed
122
123
} // namespace

Paul's avatar
Format  
Paul committed
124
125
void fuse_ck::apply(module_pass_manager& mpm) const
{
Paul's avatar
Format  
Paul committed
126
    if(not enabled(MIGRAPHX_DISABLE_CK_GEMM_FUSION{}))
Paul's avatar
Paul committed
127
        match::find_matches(mpm, find_ck_gemm_pointwise{});
Paul's avatar
Format  
Paul committed
128
    if(not enabled(MIGRAPHX_DISABLE_CK_GEMM{}))
Paul's avatar
Paul committed
129
        match::find_matches(mpm, find_ck_gemm{});
Paul's avatar
Paul committed
130
}
Paul's avatar
Paul committed
131
132
133
134
135

} // namespace gpu

} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx