"git@developer.sourcefind.cn:gaoqiong/migraphx.git" did not exist on "5315d9bb2672a5db993e769636737f9a4ed233ce"
target.cpp 7.71 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
#include <migraphx/adjust_allocation.hpp>
Paul's avatar
Paul committed
25
#include <migraphx/auto_contiguous.hpp>
26
#include <migraphx/check_context.hpp>
Paul's avatar
Paul committed
27
#include <migraphx/dead_code_elimination.hpp>
28
#include <migraphx/eliminate_allocation.hpp>
Paul's avatar
Paul committed
29
#include <migraphx/eliminate_concat.hpp>
30
#include <migraphx/eliminate_contiguous.hpp>
31
#include <migraphx/eliminate_data_type.hpp>
Umang Yadav's avatar
Umang Yadav committed
32
#include <migraphx/eliminate_nested_converts.hpp>
33
#include <migraphx/eliminate_identity.hpp>
34
#include <migraphx/eliminate_pad.hpp>
35
#include <migraphx/fuse_pointwise.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
36
#include <migraphx/fuse_reduce.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
37
#include <migraphx/inline_module.hpp>
kahmed10's avatar
kahmed10 committed
38
#include <migraphx/insert_pad.hpp>
39
#include <migraphx/layout_nhwc.hpp>
40
#include <migraphx/memory_coloring.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
41
#include <migraphx/normalize_ops.hpp>
42
#include <migraphx/optimize_module.hpp>
43
#include <migraphx/preallocate_param.hpp>
Charlie Lin's avatar
Charlie Lin committed
44
#include <migraphx/promote_literals.hpp>
45
#include <migraphx/register_target.hpp>
46
#include <migraphx/replace_allocate.hpp>
47
#include <migraphx/rewrite_gelu.hpp>
48
#include <migraphx/rewrite_pooling.hpp>
turneram's avatar
turneram committed
49
#include <migraphx/rewrite_quantization.hpp>
50
#include <migraphx/rewrite_rnn.hpp>
Paul's avatar
Paul committed
51
#include <migraphx/schedule.hpp>
52
#include <migraphx/simplify_dyn_ops.hpp>
turneram's avatar
turneram committed
53
#include <migraphx/simplify_qdq.hpp>
54
#include <migraphx/simplify_reshapes.hpp>
55
#include <migraphx/split_single_dyn_dim.hpp>
56
#include <migraphx/gpu/allocation_model.hpp>
57
#include <migraphx/gpu/compile_miopen.hpp>
58
#include <migraphx/gpu/compile_ops.hpp>
59
60
#include <migraphx/gpu/concat_gpu_opt.hpp>
#include <migraphx/gpu/context.hpp>
61
#include <migraphx/gpu/device_name.hpp>
62
#include <migraphx/gpu/fuse_ck.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
63
#include <migraphx/gpu/fuse_mlir.hpp>
64
#include <migraphx/gpu/fuse_ops.hpp>
65
#include <migraphx/gpu/prefuse_ops.hpp>
66
67
68
69
70
#include <migraphx/gpu/lowering.hpp>
#include <migraphx/gpu/schedule_model.hpp>
#include <migraphx/gpu/sync_device.hpp>
#include <migraphx/gpu/target.hpp>
#include <migraphx/gpu/write_literals.hpp>
Paul's avatar
Paul committed
71

Paul's avatar
Paul committed
72
namespace migraphx {
Paul's avatar
Paul committed
73
inline namespace MIGRAPHX_INLINE_NS {
Paul's avatar
Paul committed
74
namespace gpu {
mei-ye's avatar
mei-ye committed
75

76
// Environment variable consulted in target::get_passes(): its negated enabled()
// state is passed as the second argument when constructing the schedule pass.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_SCHEDULE_PASS)
Paul Fultz II's avatar
Paul Fultz II committed
77
// Environment variable consulted in target::get_passes(): when it is enabled,
// the fuse_reduce pass is swapped for the no-op pass via enable_pass().
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_REDUCE_FUSION)
78
// Environment variable consulted in target::get_passes(): the layout_nhwc pass
// is only included (via enable_pass()) when this variable is enabled.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_NHWC)
turneram's avatar
turneram committed
79
#ifndef _WIN32
80
// Environment variable consulted in target::get_passes(): the fuse_ck pass is
// only included (via enable_pass()) when this variable is enabled. Both this
// declaration and that use sit behind `#ifndef _WIN32`.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_CK)
81
#endif
82

83
84
85
86
87
88
89
90
91
92
93
94
// Placeholder pass that does nothing. enable_pass() returns it in place of a
// pass that has been switched off, so the pass list keeps a valid entry.
struct id_pass
{
    // Name reported for this pass.
    std::string name() const { return "id"; }
    // Intentionally empty: the module is left untouched.
    // This member was previously misspelled `apple`, which meant the struct
    // exposed no apply() at all; the corrected name keeps the same no-op
    // behaviour while matching the spelling used by pass implementations.
    void apply(const module&) const {}
};

// Conditionally keeps a pass.
//   enabled - when true, `p` is returned unchanged.
//   p       - the pass to keep.
// When `enabled` is false the pass is replaced by an id_pass.
pass enable_pass(bool enabled, pass p)
{
    // Disabled: hand back the placeholder instead of the requested pass.
    if(not enabled)
        return id_pass{};
    return p;
}
Paul's avatar
Paul committed
95

96
// Builds the ordered list of passes for this target.
//   gctx    - type-erased context; it is cast to this namespace's `context`
//             and its exhaustive-tune flag is set from `options`.
//   options - compile options; exhaustive_tune, fast_math and offload_copy
//             are forwarded to the individual passes below.
// Returns the passes in the order they appear in the initializer list. Some
// entries are wrapped in enable_pass(), which substitutes a no-op pass when
// the associated option / environment variable / mlir_enabled() check is off.
std::vector<pass> target::get_passes(migraphx::context& gctx, const compile_options& options) const
{
    auto& gpu_ctx = any_cast<context>(gctx);
    gpu_ctx.set_exhaustive_tune_flag(options.exhaustive_tune);

    // Start from every shape type and remove the ones listed here; whatever
    // remains is handed to the first eliminate_data_type pass together with
    // float_type.
    const auto& all_types = shape::types();
    std::set<shape::type_t> unsupported_types(all_types.begin(), all_types.end());
    for(auto kept_type : {shape::type_t::float_type,
                          shape::type_t::fp8e4m3fnuz_type,
                          shape::type_t::half_type,
                          shape::type_t::bool_type,
                          shape::type_t::int8_type,
                          shape::type_t::uint8_type,
                          shape::type_t::int32_type,
                          shape::type_t::tuple_type})
    {
        unsupported_types.erase(kept_type);
    }

    // Operator names given to the fp8 eliminate_data_type pass; populated
    // only when gpu::rocblas_fp8_available() reports false.
    std::set<std::string> unsupported_fp8_ops;
    if(not gpu::rocblas_fp8_available())
        unsupported_fp8_ops = {"dot", "quant_dot"};

    // The order of the entries below is significant; do not reorder.
    // clang-format off
    return
    {
        split_single_dyn_dim{},
        dead_code_elimination{},
        simplify_dyn_ops{},
        dead_code_elimination{},
        normalize_ops{},
        dead_code_elimination{},
        simplify_qdq{},
        enable_pass(not mlir_enabled(), rewrite_quantization{}),
        dead_code_elimination{},
        eliminate_data_type{unsupported_types, shape::type_t::float_type},
        dead_code_elimination{},
        eliminate_nested_converts{},
        simplify_reshapes{},
        eliminate_identity{},
        eliminate_pad{},
        dead_code_elimination{},
        insert_pad{},
        dead_code_elimination{},
        rewrite_rnn{},
        dead_code_elimination{},
        inline_module{},
        rewrite_pooling{},
        dead_code_elimination{},
        enable_pass(options.fast_math, rewrite_gelu{}),
        optimize_module{},
        enable_pass(enabled(MIGRAPHX_ENABLE_NHWC{}), layout_nhwc{}),
        dead_code_elimination{},
        prefuse_ops{},
        dead_code_elimination{},
        auto_contiguous{},
        eliminate_data_type{{migraphx::shape::fp8e4m3fnuz_type}, shape::float_type, unsupported_fp8_ops},
        dead_code_elimination{},
        optimize_module{},
        fuse_pointwise{},
        dead_code_elimination{},
        enable_pass(not enabled(MIGRAPHX_DISABLE_REDUCE_FUSION{}), fuse_reduce{}),
        dead_code_elimination{},
#ifndef _WIN32
        enable_pass(enabled(MIGRAPHX_ENABLE_CK{}), fuse_ck{}),
#endif
        dead_code_elimination{},
        enable_pass(mlir_enabled(), fuse_mlir{&gpu_ctx}),
        dead_code_elimination{},
        lowering{&gpu_ctx, options.offload_copy},
        eliminate_contiguous{"gpu::contiguous"},
        dead_code_elimination{},
        eliminate_concat{concat_gpu_optimization{}},
        dead_code_elimination{},
        // Note: this pass receives the type-erased context, not gpu_ctx.
        compile_miopen{&gctx},
        // NOTE(review): two consecutive dead_code_elimination entries follow;
        // the second looks redundant but is kept to preserve the pass list.
        dead_code_elimination{},
        dead_code_elimination{},
        fuse_ops{&gpu_ctx, options.fast_math},
        dead_code_elimination{},
        replace_allocate{gpu_allocation_model{}, options.offload_copy},
        dead_code_elimination{},
        adjust_allocation{gpu_allocation_model{}},
        dead_code_elimination{},
        compile_ops{&gpu_ctx, options.exhaustive_tune},
        dead_code_elimination{},
        promote_literals{},
        dead_code_elimination{},
        write_literals{&gpu_ctx},
        schedule{gpu::schedule_model{gpu_ctx.get_current_device().nstreams()}, not enabled(MIGRAPHX_DISABLE_SCHEDULE_PASS{})},
        memory_coloring{"hip::allocate"},
        sync_device{},
        preallocate_param{"scratch", gpu_allocation_model{}},
        dead_code_elimination{},
        eliminate_allocation{"hip::allocate"},
        check_context<context>{},
        normalize_ops{},
        dead_code_elimination{},
        eliminate_identity{}
    };
    // clang-format on
}
Paul's avatar
Paul committed
193

194
// Returns the name of this target: the literal string "gpu".
std::string target::name() const
{
    return "gpu";
}
Paul's avatar
Paul committed
195

196
// Creates a `context` from the id reported by gpu::get_device_id() and
// returns it as a migraphx::context.
migraphx::context target::get_context() const
{
    const auto device_id = gpu::get_device_id();
    return context(device_id);
}
197

Shucai Xiao's avatar
Shucai Xiao committed
198
// Forwards `arg` to gpu::to_gpu() and returns its result.
argument target::copy_to(const argument& arg) const
{
    return gpu::to_gpu(arg);
}
199

Shucai Xiao's avatar
Shucai Xiao committed
200
// Forwards `arg` to gpu::from_gpu() and returns its result.
argument target::copy_from(const argument& arg) const
{
    return gpu::from_gpu(arg);
}
201

Shucai Xiao's avatar
Shucai Xiao committed
202
// Returns the argument produced by gpu::allocate_gpu() for shape `s`.
argument target::allocate(const shape& s) const
{
    return gpu::allocate_gpu(s);
}
203

204
205
// Registers the gpu `target` type through the MIGRAPHX_REGISTER_TARGET macro
// (presumably provided by <migraphx/register_target.hpp> -- TODO confirm).
MIGRAPHX_REGISTER_TARGET(target);

Paul's avatar
Paul committed
206
} // namespace gpu
Paul's avatar
Paul committed
207
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
208
} // namespace migraphx