"git@developer.sourcefind.cn:gaoqiong/migraphx.git" did not exist on "1b56b01b6ff678c8e38c3b3d3408f83a46db5086"
target.cpp 7.52 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
24
#include <migraphx/adjust_allocation.hpp>
Paul's avatar
Paul committed
25
#include <migraphx/auto_contiguous.hpp>
26
#include <migraphx/check_context.hpp>
Paul's avatar
Paul committed
27
#include <migraphx/dead_code_elimination.hpp>
28
#include <migraphx/eliminate_allocation.hpp>
Paul's avatar
Paul committed
29
#include <migraphx/eliminate_concat.hpp>
30
#include <migraphx/eliminate_contiguous.hpp>
31
#include <migraphx/eliminate_data_type.hpp>
32
#include <migraphx/eliminate_identity.hpp>
33
#include <migraphx/eliminate_pad.hpp>
34
#include <migraphx/fuse_pointwise.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
35
#include <migraphx/fuse_reduce.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
36
#include <migraphx/inline_module.hpp>
kahmed10's avatar
kahmed10 committed
37
#include <migraphx/insert_pad.hpp>
38
#include <migraphx/layout_nhwc.hpp>
39
#include <migraphx/memory_coloring.hpp>
Shucai Xiao's avatar
Shucai Xiao committed
40
#include <migraphx/normalize_ops.hpp>
41
#include <migraphx/optimize_module.hpp>
42
#include <migraphx/preallocate_param.hpp>
Charlie Lin's avatar
Charlie Lin committed
43
#include <migraphx/promote_literals.hpp>
44
#include <migraphx/register_target.hpp>
45
#include <migraphx/replace_allocate.hpp>
46
#include <migraphx/rewrite_gelu.hpp>
47
#include <migraphx/rewrite_pooling.hpp>
turneram's avatar
turneram committed
48
#include <migraphx/rewrite_quantization.hpp>
49
#include <migraphx/rewrite_rnn.hpp>
Paul's avatar
Paul committed
50
#include <migraphx/schedule.hpp>
51
#include <migraphx/simplify_dyn_ops.hpp>
turneram's avatar
turneram committed
52
#include <migraphx/simplify_qdq.hpp>
53
#include <migraphx/simplify_reshapes.hpp>
54
#include <migraphx/split_single_dyn_dim.hpp>
Umang Yadav's avatar
Umang Yadav committed
55
#include <migraphx/eliminate_fp8.hpp>
56
#include <migraphx/gpu/allocation_model.hpp>
57
#include <migraphx/gpu/compile_miopen.hpp>
58
#include <migraphx/gpu/compile_ops.hpp>
59
60
#include <migraphx/gpu/concat_gpu_opt.hpp>
#include <migraphx/gpu/context.hpp>
61
#include <migraphx/gpu/device_name.hpp>
62
#include <migraphx/gpu/fuse_ck.hpp>
Paul Fultz II's avatar
Paul Fultz II committed
63
#include <migraphx/gpu/fuse_mlir.hpp>
64
#include <migraphx/gpu/fuse_ops.hpp>
65
#include <migraphx/gpu/prefuse_ops.hpp>
66
67
68
69
70
#include <migraphx/gpu/lowering.hpp>
#include <migraphx/gpu/schedule_model.hpp>
#include <migraphx/gpu/sync_device.hpp>
#include <migraphx/gpu/target.hpp>
#include <migraphx/gpu/write_literals.hpp>
Paul's avatar
Paul committed
71

Paul's avatar
Paul committed
72
namespace migraphx {
Paul's avatar
Paul committed
73
inline namespace MIGRAPHX_INLINE_NS {
Paul's avatar
Paul committed
74
namespace gpu {
mei-ye's avatar
mei-ye committed
75

76
// Read in target::get_passes: `not enabled(MIGRAPHX_DISABLE_SCHEDULE_PASS{})` is
// passed as the second argument of the schedule{} pass.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_SCHEDULE_PASS)
Paul Fultz II's avatar
Paul Fultz II committed
77
// Read in target::get_passes: when enabled, fuse_reduce{} is replaced by the no-op
// id_pass via enable_pass().
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_DISABLE_REDUCE_FUSION)
78
// Read in target::get_passes: layout_nhwc{} is only kept in the pipeline when this
// variable is enabled; otherwise enable_pass() substitutes id_pass.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_NHWC)
turneram's avatar
turneram committed
79
#ifndef _WIN32
80
// Read in target::get_passes (non-Windows builds only): fuse_ck{} is only kept in
// the pipeline when this variable is enabled.
MIGRAPHX_DECLARE_ENV_VAR(MIGRAPHX_ENABLE_CK)
81
#endif
82

83
84
85
86
87
88
89
90
91
92
93
94
/// Placeholder pass that leaves the module untouched.
///
/// enable_pass() returns this in place of a real pass when that pass is switched off,
/// so the pass list built by target::get_passes keeps the same shape either way.
struct id_pass
{
    /// Name reported for this pass.
    std::string name() const { return "id"; }

    /// Intentionally empty: the module is not modified.
    ///
    /// The member was previously spelled `apple`, so the struct exposed no member
    /// named `apply` at all.
    /// NOTE(review): the pass interface is declared outside this file; `apply` is
    /// assumed to be the hook it looks for -- confirm against migraphx/pass.hpp.
    void apply(const module&) const {}
};

/// Select between a real pass and the no-op placeholder.
///
/// @param enabled When true the supplied pass is returned unchanged.
/// @param p       The pass to use when `enabled` is true.
/// @return `p` if `enabled`, otherwise an `id_pass`.
pass enable_pass(bool enabled, pass p)
{
    // Disabled: hand back the placeholder so the caller's list keeps its slot.
    if(not enabled)
        return id_pass{};
    return p;
}
Paul's avatar
Paul committed
95

96
/// Build the ordered list of passes used to compile a program for the GPU target.
///
/// @param gctx    Type-erased context. It is cast to the GPU `context`, and its
///                exhaustive-tune flag is set from `options` before the list is built.
/// @param options Compile options; `exhaustive_tune`, `fast_math` and `offload_copy`
///                are read here.
/// @return The passes, in exactly the order written below.
std::vector<pass> target::get_passes(migraphx::context& gctx, const compile_options& options) const
{
    auto& gpu_ctx = any_cast<context>(gctx);
    gpu_ctx.set_exhaustive_tune_flag(options.exhaustive_tune);

    // Start from every type reported by shape::types() and drop the ones that are
    // retained; the remainder is given to eliminate_data_type{} below together with
    // float_type.
    const auto& all_types = shape::types();
    std::set<shape::type_t> types_to_eliminate(all_types.begin(), all_types.end());
    for(auto retained : {shape::type_t::float_type,
                         shape::type_t::fp8e4m3fnuz_type,
                         shape::type_t::half_type,
                         shape::type_t::bool_type,
                         shape::type_t::int8_type,
                         shape::type_t::uint8_type,
                         shape::type_t::int32_type,
                         shape::type_t::tuple_type})
    {
        types_to_eliminate.erase(retained);
    }

    // "dot" is added to the set given to eliminate_fp8{} only when
    // gpu::rocblas_fp8_available() reports false.
    std::set<std::string> fp8_ops_to_eliminate;
    if(not gpu::rocblas_fp8_available())
        fp8_ops_to_eliminate.emplace("dot");

    // The order of the entries below is significant; do not reorder.
    // clang-format off
    return
    {
        split_single_dyn_dim{},
        dead_code_elimination{},
        simplify_dyn_ops{},
        dead_code_elimination{},
        normalize_ops{},
        dead_code_elimination{},
        simplify_qdq{},
        // rewrite_quantization runs only when MLIR is not enabled.
        enable_pass(not mlir_enabled(), rewrite_quantization{}),
        dead_code_elimination{},
        eliminate_data_type{types_to_eliminate, shape::type_t::float_type},
        simplify_reshapes{},
        eliminate_identity{},
        eliminate_pad{},
        dead_code_elimination{},
        insert_pad{},
        dead_code_elimination{},
        rewrite_rnn{},
        dead_code_elimination{},
        inline_module{},
        rewrite_pooling{},
        dead_code_elimination{},
        // rewrite_gelu is tied to the fast_math compile option.
        enable_pass(options.fast_math, rewrite_gelu{}),
        optimize_module{},
        enable_pass(enabled(MIGRAPHX_ENABLE_NHWC{}), layout_nhwc{}),
        dead_code_elimination{},
        prefuse_ops{},
        dead_code_elimination{},
        auto_contiguous{},
        eliminate_fp8{fp8_ops_to_eliminate},
        dead_code_elimination{},
        optimize_module{},
        fuse_pointwise{},
        dead_code_elimination{},
        enable_pass(not enabled(MIGRAPHX_DISABLE_REDUCE_FUSION{}), fuse_reduce{}),
        dead_code_elimination{},
#ifndef _WIN32
        // The CK fusion entry is compiled out on Windows builds.
        enable_pass(enabled(MIGRAPHX_ENABLE_CK{}), fuse_ck{}),
#endif
        dead_code_elimination{},
        enable_pass(mlir_enabled(), fuse_mlir{&gpu_ctx}),
        dead_code_elimination{},
        lowering{&gpu_ctx, options.offload_copy},
        eliminate_contiguous{"gpu::contiguous"},
        dead_code_elimination{},
        eliminate_concat{concat_gpu_optimization{}},
        dead_code_elimination{},
        // Note: this entry is given the type-erased context, not the cast one.
        compile_miopen{&gctx},
        dead_code_elimination{},
        dead_code_elimination{},
        fuse_ops{&gpu_ctx, options.fast_math},
        dead_code_elimination{},
        replace_allocate{gpu_allocation_model{}, options.offload_copy},
        dead_code_elimination{},
        adjust_allocation{gpu_allocation_model{}},
        dead_code_elimination{},
        compile_ops{&gpu_ctx, options.exhaustive_tune},
        dead_code_elimination{},
        promote_literals{},
        dead_code_elimination{},
        write_literals{&gpu_ctx},
        schedule{gpu::schedule_model{gpu_ctx.get_current_device().nstreams()}, not enabled(MIGRAPHX_DISABLE_SCHEDULE_PASS{})},
        memory_coloring{"hip::allocate"},
        sync_device{},
        preallocate_param{"scratch", gpu_allocation_model{}},
        dead_code_elimination{},
        eliminate_allocation{"hip::allocate"},
        check_context<context>{},
        normalize_ops{},
        dead_code_elimination{},
        eliminate_identity{}
    };
    // clang-format on
}
Paul's avatar
Paul committed
190

191
/// Name of this target; always the string "gpu".
std::string target::name() const
{
    return "gpu";
}
Paul's avatar
Paul committed
192

193
/// Create a GPU context for the device id reported by gpu::get_device_id() and
/// return it as a type-erased migraphx::context.
migraphx::context target::get_context() const
{
    const auto device_id = gpu::get_device_id();
    return context(device_id);
}
194

Shucai Xiao's avatar
Shucai Xiao committed
195
/// Forward `arg` to gpu::to_gpu and return its result.
/// NOTE(review): presumably this yields a device-side copy of `arg`; confirm against
/// the declaration of gpu::to_gpu.
argument target::copy_to(const argument& arg) const
{
    return gpu::to_gpu(arg);
}
196

Shucai Xiao's avatar
Shucai Xiao committed
197
/// Forward `arg` to gpu::from_gpu and return its result.
/// NOTE(review): presumably this yields a host-side copy of `arg`; confirm against
/// the declaration of gpu::from_gpu.
argument target::copy_from(const argument& arg) const
{
    return gpu::from_gpu(arg);
}
198

Shucai Xiao's avatar
Shucai Xiao committed
199
/// Obtain an argument for shape `s` by delegating to gpu::allocate_gpu.
argument target::allocate(const shape& s) const
{
    return gpu::allocate_gpu(s);
}
200

201
202
// Registers gpu::target through the macro from <migraphx/register_target.hpp>.
// NOTE(review): presumably this is what makes the target discoverable under the
// name returned by target::name() ("gpu") -- confirm against the macro definition.
MIGRAPHX_REGISTER_TARGET(target);

Paul's avatar
Paul committed
203
} // namespace gpu
Paul's avatar
Paul committed
204
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
205
} // namespace migraphx