target.cpp 7.23 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
#include <migraphx/adjust_allocation.hpp>
Paul's avatar
Paul committed
25
#include <migraphx/auto_contiguous.hpp>
26
#include <migraphx/check_context.hpp>
Paul's avatar
Paul committed
27
#include <migraphx/dead_code_elimination.hpp>
28
#include <migraphx/eliminate_allocation.hpp>
Paul's avatar
Paul committed
29
#include <migraphx/eliminate_concat.hpp>
30
#include <migraphx/eliminate_contiguous.hpp>
31
#include <migraphx/eliminate_data_type.hpp>
32
#include <migraphx/eliminate_identity.hpp>
33
#include <migraphx/eliminate_pad.hpp>
34
#include <migraphx/fuse_pointwise.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
35
#include <migraphx/fuse_reduce.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
36
#include <migraphx/inline_module.hpp>
kahmed10's avatar
kahmed10 committed
37
#include <migraphx/insert_pad.hpp>
38
#include <migraphx/layout_nhwc.hpp>
39
#include <migraphx/memory_coloring.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
40
#include <migraphx/normalize_ops.hpp>
41
#include <migraphx/optimize_module.hpp>
42
#include <migraphx/preallocate_param.hpp>
Charlie Lin's avatar
Charlie Lin committed
43
#include <migraphx/promote_literals.hpp>
44
#include <migraphx/register_target.hpp>
45
#include <migraphx/replace_allocate.hpp>
46
#include <migraphx/rewrite_gelu.hpp>
47
#include <migraphx/rewrite_pooling.hpp>
turneram's avatar
turneram committed
48
#include <migraphx/rewrite_quantization.hpp>
49
#include <migraphx/rewrite_rnn.hpp>
Paul's avatar
Paul committed
50
#include <migraphx/schedule.hpp>
51
#include <migraphx/simplify_dyn_ops.hpp>
turneram's avatar
turneram committed
52
#include <migraphx/simplify_qdq.hpp>
53
#include <migraphx/simplify_reshapes.hpp>
54
#include <migraphx/split_single_dyn_dim.hpp>
55
#include <migraphx/gpu/allocation_model.hpp>
56
#include <migraphx/ck.hpp>
57
#include <migraphx/gpu/compile_miopen.hpp>
58
#include <migraphx/gpu/compile_ops.hpp>
59
60
#include <migraphx/gpu/concat_gpu_opt.hpp>
#include <migraphx/gpu/context.hpp>
61
#include <migraphx/gpu/device_name.hpp>
62
#include <migraphx/gpu/fuse_ck.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
63
#include <migraphx/gpu/fuse_mlir.hpp>
64
#include <migraphx/gpu/fuse_ops.hpp>
65
#include <migraphx/gpu/prefuse_ops.hpp>
66
67
68
69
70
71
#include <migraphx/gpu/lowering.hpp>
#include <migraphx/gpu/pack_int8_args.hpp>
#include <migraphx/gpu/schedule_model.hpp>
#include <migraphx/gpu/sync_device.hpp>
#include <migraphx/gpu/target.hpp>
#include <migraphx/gpu/write_literals.hpp>
Paul's avatar
Paul committed
72

Paul's avatar
Paul committed
73
namespace migraphx {
Paul's avatar
Paul committed
74
inline namespace MIGRAPHX_INLINE_NS {
Paul's avatar
Paul committed
75
namespace gpu {
mei-ye's avatar
mei-ye committed
76

77
// Environment flag read in target::get_passes: the negation of enabled(...) for this flag is
// passed as the second argument when constructing the schedule pass.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_SCHEDULE_PASS)
Paul Fultz II's avatar
Paul Fultz II committed
78
// Environment flag read in target::get_passes: fuse_reduce is only kept in the pass list when
// this flag is not enabled.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_REDUCE_FUSION)
79
// Environment flag read in target::get_passes: layout_nhwc is only kept in the pass list when
// this flag is enabled.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_NHWC)
80

81
82
83
84
85
86
87
88
89
90
91
92
// Placeholder pass that does nothing. enable_pass returns it in place of a pass that has been
// switched off, so the pass list keeps the same shape either way.
struct id_pass
{
    // Name reported for this pass.
    std::string name() const { return "id"; }
    // Intentionally empty: the module is left untouched.
    // (Previously spelled `apple`, which never matched the pass `apply` hook by name.)
    void apply(const module&) const {}
};

// Conditionally keeps a pass.
//
// enabled : when true, `p` is returned unchanged.
// p       : the pass to keep or drop.
//
// Returns `p` if `enabled` is true; otherwise a default-constructed id_pass converted to `pass`.
pass enable_pass(bool enabled, pass p)
{
    if(not enabled)
        return id_pass{};
    return p;
}
Paul's avatar
Paul committed
93

94
// Assembles the ordered sequence of passes used to compile a program for the gpu target.
//
// gctx    : type-erased context; it is cast to the gpu `context` and its address is also
//           handed to compile_miopen.
// options : compile options; this function reads exhaustive_tune, fast_math and offload_copy.
//
// Returns the pass list in exactly the order the initializer below spells out. Several entries
// are wrapped in enable_pass, which substitutes an id_pass when its condition is false:
//   - rewrite_quantization : kept only when mlir_enabled() is false
//   - rewrite_gelu         : kept only when options.fast_math is true
//   - layout_nhwc          : kept only when MIGRAPHX_ENABLE_NHWC is enabled
//   - fuse_reduce          : kept unless MIGRAPHX_DISABLE_REDUCE_FUSION is enabled
//   - fuse_ck              : kept only when MIGRAPHX_ENABLE_CK is enabled; the entry is
//                            compiled out entirely when _WIN32 is defined
//   - fuse_mlir            : kept only when mlir_enabled() is true
std::vector<pass> target::get_passes(migraphx::context& gctx, const compile_options& options) const
Paul's avatar
Paul committed
95
{
Paul's avatar
Paul committed
96
    // Recover the gpu context from the type-erased one and record the tuning option on it.
    auto& ctx = any_cast<context>(gctx);
97
    ctx.set_exhaustive_tune_flag(options.exhaustive_tune);
98
99
100
101
102
103
    // Start from every entry of shape::types() and remove the ones listed below; whatever
    // remains is passed to eliminate_data_type together with float_type.
    std::set<shape::type_t> unsupported_types(shape::types().begin(), shape::types().end());
    unsupported_types.erase(shape::type_t::float_type);
    unsupported_types.erase(shape::type_t::half_type);
    unsupported_types.erase(shape::type_t::bool_type);
    unsupported_types.erase(shape::type_t::int8_type);
    unsupported_types.erase(shape::type_t::uint8_type);
104
    unsupported_types.erase(shape::type_t::int32_type);
Shucai Xiao's avatar
Shucai Xiao committed
105
    unsupported_types.erase(shape::type_t::tuple_type);
Paul's avatar
Paul committed
106
107
108
    // The pass order below is significant; most passes are followed by dead_code_elimination.
    // clang-format off
    return
    {
109
110
        split_single_dyn_dim{},
        dead_code_elimination{},
111
112
        simplify_dyn_ops{},
        dead_code_elimination{},
Shucai Xiao's avatar
Shucai Xiao committed
113
        normalize_ops{},
114
        dead_code_elimination{},
turneram's avatar
turneram committed
115
        simplify_qdq{},
116
        // Replaced by an id_pass when mlir_enabled() returns true.
        enable_pass(not mlir_enabled(), rewrite_quantization{}),
turneram's avatar
turneram committed
117
        dead_code_elimination{},
118
        eliminate_data_type{unsupported_types, shape::type_t::float_type},
119
        simplify_reshapes{},
120
        eliminate_identity{},
121
        eliminate_pad{},
122
        dead_code_elimination{},
kahmed10's avatar
kahmed10 committed
123
124
        insert_pad{},
        dead_code_elimination{},
Shucai Xiao's avatar
Shucai Xiao committed
125
        rewrite_rnn{},
Shucai Xiao's avatar
Shucai Xiao committed
126
        dead_code_elimination{},
Shucai Xiao's avatar
Shucai Xiao committed
127
        inline_module{},
128
        rewrite_pooling{},
Shucai Xiao's avatar
Shucai Xiao committed
129
        dead_code_elimination{},
130
        enable_pass(options.fast_math, rewrite_gelu{}),
131
        optimize_module{},
132
133
        enable_pass(enabled(MIGRAPHX_ENABLE_NHWC{}), layout_nhwc{}),
        dead_code_elimination{},
134
135
        prefuse_ops{},
        dead_code_elimination{},
Paul's avatar
Paul committed
136
        auto_contiguous{},
137
        optimize_module{},
138
        fuse_pointwise{},
139
        dead_code_elimination{},
Paul Fultz II's avatar
Paul Fultz II committed
140
141
        enable_pass(not enabled(MIGRAPHX_DISABLE_REDUCE_FUSION{}), fuse_reduce{}),
        dead_code_elimination{},
turneram's avatar
turneram committed
142
#ifndef _WIN32
143
        enable_pass(enabled(MIGRAPHX_ENABLE_CK{}), fuse_ck{}),
144
#endif
145
        dead_code_elimination{},
146
        enable_pass(mlir_enabled(), fuse_mlir{&ctx}),
Paul Fultz II's avatar
Paul Fultz II committed
147
        dead_code_elimination{},
148
        lowering{&ctx, options.offload_copy},
149
        eliminate_contiguous{"gpu::contiguous"},
Paul's avatar
Paul committed
150
        dead_code_elimination{},
151
152
        eliminate_concat{concat_gpu_optimization{}},
        dead_code_elimination{},
153
154
        compile_miopen{&gctx},
        dead_code_elimination{},
155
156
        pack_int8_args{},
        dead_code_elimination{},
kahmed10's avatar
kahmed10 committed
157
        fuse_ops{&ctx, options.fast_math},
Paul's avatar
Paul committed
158
        dead_code_elimination{},
159
160
        replace_allocate{gpu_allocation_model{}, options.offload_copy},
        dead_code_elimination{},
161
162
        adjust_allocation{gpu_allocation_model{}},
        dead_code_elimination{},
163
        compile_ops{&ctx, options.exhaustive_tune},
164
        dead_code_elimination{},
Charlie Lin's avatar
Charlie Lin committed
165
166
        promote_literals{},
        dead_code_elimination{},
Paul's avatar
Paul committed
167
        write_literals{&ctx},
168
        schedule{gpu::schedule_model{ctx.get_current_device().nstreams()}, not enabled(MIGRAPHX_DISABLE_SCHEDULE_PASS{})},
Paul's avatar
Paul committed
169
        memory_coloring{"hip::allocate"},
170
        sync_device{},
171
        preallocate_param{"scratch", gpu_allocation_model{}},
Paul's avatar
Paul committed
172
        dead_code_elimination{},
Paul's avatar
Paul committed
173
        eliminate_allocation{"hip::allocate"},
174
        check_context<context>{},
175
        normalize_ops{},
176
177
        dead_code_elimination{},
        eliminate_identity{}
Paul's avatar
Paul committed
178
179
    };
    // clang-format on
Paul's avatar
Paul committed
180
}
Paul's avatar
Paul committed
181

182
// Returns the identifier string of this target, "gpu".
std::string target::name() const
{
    return "gpu";
}
Paul's avatar
Paul committed
183

184
// Builds a gpu context from the device id reported by gpu::get_device_id() and returns it
// as a migraphx::context.
migraphx::context target::get_context() const
{
    const auto device_id = gpu::get_device_id();
    return context(device_id);
}
185

Shucai Xiao's avatar
Shucai Xiao committed
186
// Forwards `arg` to gpu::to_gpu and returns its result.
argument target::copy_to(const argument& arg) const
{
    return gpu::to_gpu(arg);
}
187

Shucai Xiao's avatar
Shucai Xiao committed
188
// Forwards `arg` to gpu::from_gpu and returns its result.
argument target::copy_from(const argument& arg) const
{
    return gpu::from_gpu(arg);
}
189

Shucai Xiao's avatar
Shucai Xiao committed
190
// Forwards the shape `s` to gpu::allocate_gpu and returns the resulting argument.
argument target::allocate(const shape& s) const
{
    return gpu::allocate_gpu(s);
}
191

192
193
// Registers gpu::target through the MIGRAPHX_REGISTER_TARGET macro.
MIGRAPHX_REGISTER_TARGET(target);

Paul's avatar
Paul committed
194
} // namespace gpu
Paul's avatar
Paul committed
195
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
196
} // namespace migraphx