"vscode:/vscode.git/clone" did not exist on "5f202fe5c1d63a5e3a1598690877eccff2ad4640"
quantization.cpp 4.92 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
Shucai Xiao's avatar
Shucai Xiao committed
24
25
#include <iostream>
#include <vector>
26
#include <migraphx/gpu/fuse_mlir.hpp>
27
#include <migraphx/make_op.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
28
#include <migraphx/instruction.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
29
#include <migraphx/quantization.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
30
#include <migraphx/generate.hpp>
31
#include <migraphx/register_target.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
32
33
34
35
36
#include <migraphx/verify.hpp>
#include <migraphx/dead_code_elimination.hpp>
#include <migraphx/propagate_constant.hpp>
#include <migraphx/pass_manager.hpp>
#include <migraphx/onnx.hpp>
37
#include <test.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
38
39
#include <migraphx/half.hpp>

Shucai Xiao's avatar
Shucai Xiao committed
40
TEST_CASE(gpu_target_copy)
Shucai Xiao's avatar
Shucai Xiao committed
41
{
42
43
    migraphx::target gpu_t = migraphx::make_target("gpu");
    migraphx::target ref_t = migraphx::make_target("ref");
Shucai Xiao's avatar
Shucai Xiao committed
44
    migraphx::shape s{migraphx::shape::int8_type, {2, 3, 4, 5}};
Shucai Xiao's avatar
Shucai Xiao committed
45

46
47
48
    auto ref_arg_orig  = migraphx::generate_argument(s, 0x123456L);
    auto gpu_arg       = gpu_t.copy_to(ref_arg_orig);
    auto ref_arg_final = gpu_t.copy_from(gpu_arg);
Shucai Xiao's avatar
Shucai Xiao committed
49

Shucai Xiao's avatar
Shucai Xiao committed
50
    std::vector<int8_t> val_orig;
51
    ref_arg_orig.visit([&](auto v) { val_orig.assign(v.begin(), v.end()); });
Shucai Xiao's avatar
Shucai Xiao committed
52
    std::vector<int8_t> val_final;
53
    ref_arg_final.visit([&](auto v) { val_final.assign(v.begin(), v.end()); });
Shucai Xiao's avatar
Shucai Xiao committed
54

Umang Yadav's avatar
Umang Yadav committed
55
    EXPECT(migraphx::verify::verify_range(val_orig, val_final));
Shucai Xiao's avatar
Shucai Xiao committed
56
57
}

Shucai Xiao's avatar
Shucai Xiao committed
58
59
60
61
TEST_CASE(int8_quantization)
{
    auto run_prog = [](migraphx::program p,
                       const migraphx::target& t,
62
                       migraphx::parameter_map& m_in,
Shucai Xiao's avatar
Shucai Xiao committed
63
                       std::vector<float>& res) {
64
        std::vector<migraphx::parameter_map> cali_data;
Shucai Xiao's avatar
Shucai Xiao committed
65
66
67
        cali_data.push_back(m_in);
        migraphx::quantize_int8(p, t, cali_data);
        p.compile(t);
68
        migraphx::parameter_map m;
Shucai Xiao's avatar
Shucai Xiao committed
69
70
71
72
73
74
75
76
77
78
79
80
        for(auto&& x : p.get_parameter_shapes())
        {
            if(m_in.count(x.first) > 0)
            {
                m[x.first] = t.copy_to(m_in[x.first]);
            }
            else
            {
                m[x.first] = t.allocate(x.second);
            }
        }

81
        auto result = t.copy_from(p.eval(m).back());
Shucai Xiao's avatar
Shucai Xiao committed
82
83
84
85
86
        result.visit([&](auto v) { res.assign(v.begin(), v.end()); });
    };

    auto create_program = [] {
        migraphx::program p;
87
        auto* mm = p.get_main_module();
Shucai Xiao's avatar
Shucai Xiao committed
88
        migraphx::shape sa{migraphx::shape::float_type, {5, 16}};
Shucai Xiao's avatar
Shucai Xiao committed
89
        migraphx::shape sb{migraphx::shape::float_type, {16, 8}};
Shucai Xiao's avatar
Shucai Xiao committed
90
        migraphx::shape sc{migraphx::shape::float_type, {5, 8}};
91
92
        auto pa = mm->add_parameter("a", sa);
        auto pb = mm->add_parameter("b", sb);
93
        mm->add_instruction(migraphx::make_op("dot"), pa, pb);
Shucai Xiao's avatar
Shucai Xiao committed
94
95
96
97
98
99

        return p;
    };

    {
        auto p = create_program();
100
        migraphx::parameter_map m;
Shucai Xiao's avatar
Shucai Xiao committed
101
        migraphx::shape sa{migraphx::shape::float_type, {5, 16}};
Shucai Xiao's avatar
Shucai Xiao committed
102
        migraphx::shape sb{migraphx::shape::float_type, {16, 8}};
Shucai Xiao's avatar
Shucai Xiao committed
103
        migraphx::shape sc{migraphx::shape::float_type, {5, 8}};
Shucai Xiao's avatar
Shucai Xiao committed
104
        m["a"] = migraphx::generate_argument(sa);
Shucai Xiao's avatar
Shucai Xiao committed
105
        m["b"] = migraphx::generate_argument(sb);
106
        std::vector<float> ref_result;
107
        migraphx::target ref_t = migraphx::make_target("ref");
108
        run_prog(p, ref_t, m, ref_result);
Shucai Xiao's avatar
Shucai Xiao committed
109
110

        std::vector<float> gpu_result;
111
        migraphx::target gpu_t = migraphx::make_target("gpu");
Shucai Xiao's avatar
Shucai Xiao committed
112
113
        run_prog(p, gpu_t, m, gpu_result);

114
115
116
117
118
119
120
        // Note: the tolerance for mlir_enabled result is temporarily bumped
        // higher because the lowering pipeline between mlir fallback and
        // regular non-mlir pipeline diverged. MLIR fallback uses the
        // rewrite_quantization at the very end of the pipeline, whereas
        // the regular pipeline uses the rewrite_quantization in the much
        // earlier stage.
        if(migraphx::gpu::mlir_enabled())
Umang Yadav's avatar
Umang Yadav committed
121
            EXPECT(migraphx::verify::verify_range(ref_result, gpu_result, 1e5));
122
        else
Umang Yadav's avatar
Umang Yadav committed
123
            EXPECT(migraphx::verify::verify_range(ref_result, gpu_result));
Shucai Xiao's avatar
Shucai Xiao committed
124
125
126
    }
}

Shucai Xiao's avatar
Shucai Xiao committed
127
int main(int argc, const char* argv[]) { test::run(argc, argv); }