// ck_gemm_softmax_gemm.cpp
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

#include "verify_program.hpp"
#include <migraphx/program.hpp>
#include <migraphx/generate.hpp>
#include <migraphx/make_op.hpp>

#include <cstddef>
#include <vector>

/// Verification program for the GEMM -> scale -> bias -> softmax -> GEMM pattern.
///
/// One packed half-precision input of shape {batch, 384, 2304} is reshaped to
/// {batch, 384, 36, 64}, transposed to {batch, 36, 384, 64} and sliced along axis 1
/// into three 12-wide operands `a`, `b` and `b1`. The program then computes
///
///     dot(softmax(dot(a, transpose(b)) * 0.125 + 0, axis = -1), b1)
///
/// NOTE(review): the constant names below (seq_len / num_heads / head_dim) assume the
/// attention-style layout this pattern resembles; the values are what matter.
struct ck_gemm_softmax_gemm : verify_program<ck_gemm_softmax_gemm>
{
    /// Builds the program described on the struct.
    ///
    /// @return A program whose main module takes a single parameter named "1" and whose
    ///         last instruction is the second `dot`.
    migraphx::program create_program() const
    {
        const std::size_t batch     = 2;
        const std::size_t seq_len   = 384;
        const std::size_t num_heads = 12;
        const std::size_t head_dim  = 64;

        migraphx::program p;
        auto* mm = p.get_main_module();

        // Packed input: the three operands are laid out side by side in the last
        // dimension (3 * 12 * 64 == 2304).
        migraphx::shape packed_shape{migraphx::shape::half_type,
                                     {batch, seq_len, 3 * num_heads * head_dim}};
        // Shape of the first GEMM's output, used for the scale and bias literals.
        migraphx::shape scores_shape{migraphx::shape::half_type,
                                     {batch, num_heads, seq_len, seq_len}};
        const std::size_t scores_elements = batch * num_heads * seq_len * seq_len;

        auto g = mm->add_parameter("1", packed_shape);

        // Element-wise scale of 0.125 (equal to 1 / sqrt(64); presumably chosen to match
        // the 64-wide inner dimension) and an all-zero bias.
        std::vector<float> eights(scores_elements, 0.125f);
        auto eight = mm->add_literal(migraphx::literal{scores_shape, eights});
        std::vector<float> zeros(scores_elements, 0.0f);
        auto zero = mm->add_literal(migraphx::literal{scores_shape, zeros});

        // {batch, 384, 2304} -> {batch, 384, 36, 64} -> {batch, 36, 384, 64}
        g = mm->add_instruction(
            migraphx::make_op("reshape", {{"dims", {batch, seq_len, 3 * num_heads, head_dim}}}),
            g);
        g = mm->add_instruction(migraphx::make_op("transpose", {{"permutation", {0, 2, 1, 3}}}), g);

        // Split axis 1 (size 36) into three consecutive 12-wide operands.
        auto a = mm->add_instruction(
            migraphx::make_op("slice", {{"axes", {1}}, {"starts", {0}}, {"ends", {num_heads}}}),
            g);
        auto b = mm->add_instruction(
            migraphx::make_op(
                "slice", {{"axes", {1}}, {"starts", {num_heads}}, {"ends", {2 * num_heads}}}),
            g);
        auto b1 = mm->add_instruction(
            migraphx::make_op(
                "slice", {{"axes", {1}}, {"starts", {2 * num_heads}}, {"ends", {3 * num_heads}}}),
            g);

        // Swap the last two axes of b so that dot(a, b) yields {batch, 12, 384, 384}.
        b = mm->add_instruction(migraphx::make_op("transpose", {{"permutation", {0, 1, 3, 2}}}), b);

        auto gemm1   = mm->add_instruction(migraphx::make_op("dot"), a, b);
        auto scale   = mm->add_instruction(migraphx::make_op("mul"), gemm1, eight);
        auto bias    = mm->add_instruction(migraphx::make_op("add"), scale, zero);
        auto softmax = mm->add_instruction(migraphx::make_op("softmax", {{"axis", -1}}), bias);
        mm->add_instruction(migraphx::make_op("dot"), softmax, b1);

        return p;
    }
};