target.cpp 7.06 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
#include <migraphx/adjust_allocation.hpp>
Paul's avatar
Paul committed
25
#include <migraphx/auto_contiguous.hpp>
26
#include <migraphx/check_context.hpp>
Paul's avatar
Paul committed
27
#include <migraphx/dead_code_elimination.hpp>
28
#include <migraphx/eliminate_allocation.hpp>
Paul's avatar
Paul committed
29
#include <migraphx/eliminate_concat.hpp>
30
#include <migraphx/eliminate_contiguous.hpp>
31
#include <migraphx/eliminate_data_type.hpp>
32
#include <migraphx/eliminate_identity.hpp>
33
#include <migraphx/eliminate_pad.hpp>
34
#include <migraphx/fuse_pointwise.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
35
#include <migraphx/fuse_reduce.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
36
#include <migraphx/inline_module.hpp>
kahmed10's avatar
kahmed10 committed
37
#include <migraphx/insert_pad.hpp>
38
#include <migraphx/layout_nhwc.hpp>
39
#include <migraphx/memory_coloring.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
40
#include <migraphx/normalize_ops.hpp>
41
#include <migraphx/optimize_module.hpp>
42
#include <migraphx/preallocate_param.hpp>
Charlie Lin's avatar
Charlie Lin committed
43
#include <migraphx/promote_literals.hpp>
44
#include <migraphx/register_target.hpp>
45
#include <migraphx/replace_allocate.hpp>
46
#include <migraphx/rewrite_gelu.hpp>
47
#include <migraphx/rewrite_pooling.hpp>
turneram's avatar
turneram committed
48
#include <migraphx/rewrite_quantization.hpp>
49
#include <migraphx/rewrite_rnn.hpp>
Paul's avatar
Paul committed
50
#include <migraphx/schedule.hpp>
turneram's avatar
turneram committed
51
#include <migraphx/simplify_qdq.hpp>
52
#include <migraphx/simplify_reshapes.hpp>
53
#include <migraphx/split_single_dyn_dim.hpp>
54
#include <migraphx/gpu/allocation_model.hpp>
55
#include <migraphx/gpu/compile_miopen.hpp>
56
#include <migraphx/gpu/compile_ops.hpp>
57
58
#include <migraphx/gpu/concat_gpu_opt.hpp>
#include <migraphx/gpu/context.hpp>
59
#include <migraphx/gpu/device_name.hpp>
Paul's avatar
Paul committed
60
#include <migraphx/gpu/fuse_ck.hpp>
Alan Turner's avatar
Alan Turner committed
61
#include <migraphx/gpu/fuse_ck_gemm_softmax_gemm.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
62
#include <migraphx/gpu/fuse_mlir.hpp>
63
#include <migraphx/gpu/fuse_ops.hpp>
64
#include <migraphx/gpu/prefuse_ops.hpp>
65
66
67
68
69
70
#include <migraphx/gpu/lowering.hpp>
#include <migraphx/gpu/pack_int8_args.hpp>
#include <migraphx/gpu/schedule_model.hpp>
#include <migraphx/gpu/sync_device.hpp>
#include <migraphx/gpu/target.hpp>
#include <migraphx/gpu/write_literals.hpp>
Paul's avatar
Paul committed
71

Paul's avatar
Paul committed
72
namespace migraphx {
Paul's avatar
Paul committed
73
inline namespace MIGRAPHX_INLINE_NS {
Paul's avatar
Paul committed
74
namespace gpu {
mei-ye's avatar
mei-ye committed
75

76
// Environment switch read in target::get_passes(): its negated enabled() state
// is passed as the second field of the `schedule` pass.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_SCHEDULE_PASS)
Paul Fultz II's avatar
Paul Fultz II committed
77
// Environment switch read in target::get_passes(): when it is enabled the
// `fuse_reduce` entry is replaced by the no-op pass via enable_pass().
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_REDUCE_FUSION)
78
// Environment switch read in target::get_passes(): the `layout_nhwc` entry is
// only kept when this is enabled; otherwise enable_pass() substitutes a no-op.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_NHWC)
79
80
81
82
83
84
85
86
87
88
89
90
/// Placeholder pass that leaves the module untouched.
///
/// enable_pass() returns this in place of a real pass when that pass is
/// switched off, so the pass list keeps the same shape either way.
struct id_pass
{
    /// Name reported for this pass.
    std::string name() const { return "id"; }

    /// Intentionally empty: the module is not modified.
    /// (Previously spelled `apple`, so the struct never actually provided the
    /// `apply` hook it was meant to implement.)
    void apply(const module&) const {}
};

/// Select between a real pass and a do-nothing stand-in.
///
/// @param enabled  when true, `p` is returned as given
/// @param p        the pass to use when enabled
/// @return `p` if `enabled`, otherwise an `id_pass`
pass enable_pass(bool enabled, pass p)
{
    if(not enabled)
        return id_pass{};
    return p;
}
Paul's avatar
Paul committed
91

92
/// Assemble the list of passes for the GPU target.
///
/// @param gctx     type-erased context; it is any_cast to gpu `context`
/// @param options  compile options; `exhaustive_tune` is stored on the context,
///                 `offload_copy` and `fast_math` are forwarded to individual passes
/// @return the passes in the order they are listed below
std::vector<pass> target::get_passes(migraphx::context& gctx, const compile_options& options) const
{
    auto& gpu_ctx = any_cast<context>(gctx);
    gpu_ctx.set_exhaustive_tune_flag(options.exhaustive_tune);

    // Begin with every shape type, then remove the ones that are kept as-is.
    // Whatever remains is handed to eliminate_data_type together with float_type.
    const auto& all_types = shape::types();
    std::set<shape::type_t> unsupported_types(all_types.begin(), all_types.end());
    for(auto kept : {shape::type_t::float_type,
                     shape::type_t::half_type,
                     shape::type_t::bool_type,
                     shape::type_t::int8_type,
                     shape::type_t::uint8_type,
                     shape::type_t::tuple_type})
    {
        unsupported_types.erase(kept);
    }

    // Switches that decide whether an entry is the real pass or a no-op stand-in.
    const bool use_mlir        = mlir_enabled();
    const bool use_nhwc        = enabled(MIGRAPHX_ENABLE_NHWC{});
    const bool fuse_reductions = not enabled(MIGRAPHX_DISABLE_REDUCE_FUSION{});
    const bool run_schedule    = not enabled(MIGRAPHX_DISABLE_SCHEDULE_PASS{});

    // NOTE: the sequence below is order-sensitive; keep entries where they are.
    // clang-format off
    return
    {
        split_single_dyn_dim{},
        dead_code_elimination{},
        normalize_ops{},
        dead_code_elimination{},
        simplify_qdq{},
        enable_pass(not use_mlir, rewrite_quantization{}),
        dead_code_elimination{},
        eliminate_data_type{unsupported_types, shape::type_t::float_type},
        simplify_reshapes{},
        eliminate_identity{},
        eliminate_pad{},
        dead_code_elimination{},
        insert_pad{},
        dead_code_elimination{},
        rewrite_rnn{},
        dead_code_elimination{},
        inline_module{},
        rewrite_pooling{},
        dead_code_elimination{},
        rewrite_gelu{},
        optimize_module{},
        enable_pass(use_nhwc, layout_nhwc{}),
        dead_code_elimination{},
        prefuse_ops{},
        dead_code_elimination{},
        auto_contiguous{},
        fuse_ck_gemm_softmax_gemm{&gpu_ctx},
        dead_code_elimination{},
        optimize_module{},
        fuse_pointwise{},
        dead_code_elimination{},
        enable_pass(fuse_reductions, fuse_reduce{}),
        dead_code_elimination{},
        enable_pass(use_mlir, fuse_mlir{&gpu_ctx}),
        dead_code_elimination{},
        fuse_ck{&gpu_ctx},
        dead_code_elimination{},
        lowering{&gpu_ctx, options.offload_copy},
        eliminate_contiguous{"gpu::contiguous"},
        dead_code_elimination{},
        eliminate_concat{concat_gpu_optimization{}},
        dead_code_elimination{},
        compile_miopen{&gctx},
        dead_code_elimination{},
        pack_int8_args{},
        dead_code_elimination{},
        fuse_ops{&gpu_ctx, options.fast_math},
        dead_code_elimination{},
        replace_allocate{gpu_allocation_model{}, options.offload_copy},
        dead_code_elimination{},
        adjust_allocation{gpu_allocation_model{}},
        dead_code_elimination{},
        compile_ops{&gpu_ctx},
        dead_code_elimination{},
        promote_literals{},
        dead_code_elimination{},
        write_literals{&gpu_ctx},
        schedule{gpu::schedule_model{gpu_ctx.get_current_device().nstreams()}, run_schedule},
        memory_coloring{"hip::allocate"},
        sync_device{},
        preallocate_param{"scratch", gpu_allocation_model{}},
        dead_code_elimination{},
        eliminate_allocation{"hip::allocate"},
        check_context<context>{},
        normalize_ops{},
        dead_code_elimination{},
        eliminate_identity{}
    };
    // clang-format on
}
Paul's avatar
Paul committed
176

177
/// Name of this target; always the string "gpu".
std::string target::name() const
{
    return "gpu";
}
Paul's avatar
Paul committed
178

179
/// Create a gpu `context` from the value of gpu::get_device_id() and return it
/// as a migraphx::context.
migraphx::context target::get_context() const
{
    return context(gpu::get_device_id());
}
180

Shucai Xiao's avatar
Shucai Xiao committed
181
/// Forward `arg` to gpu::to_gpu and return its result.
argument target::copy_to(const argument& arg) const
{
    return gpu::to_gpu(arg);
}
182

Shucai Xiao's avatar
Shucai Xiao committed
183
/// Forward `arg` to gpu::from_gpu and return its result.
argument target::copy_from(const argument& arg) const
{
    return gpu::from_gpu(arg);
}
184

Shucai Xiao's avatar
Shucai Xiao committed
185
/// Forward the shape `s` to gpu::allocate_gpu and return the resulting argument.
argument target::allocate(const shape& s) const
{
    return gpu::allocate_gpu(s);
}
186

187
188
// Hands gpu::target to the MIGRAPHX_REGISTER_TARGET macro.
// NOTE(review): presumably this makes the target discoverable by name ("gpu")
// at load time — confirm against register_target.hpp.
MIGRAPHX_REGISTER_TARGET(target);

Paul's avatar
Paul committed
189
} // namespace gpu
Paul's avatar
Paul committed
190
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
191
} // namespace migraphx