convolution.cpp 8.08 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
Paul's avatar
Paul committed
24
#include <migraphx/gpu/convolution.hpp>
Paul's avatar
Paul committed
25
26
#include <migraphx/gpu/context.hpp>
#include <migraphx/generate.hpp>
wsttiger's avatar
wsttiger committed
27

Paul's avatar
Paul committed
28
namespace migraphx {
Paul's avatar
Paul committed
29
inline namespace MIGRAPHX_INLINE_NS {
wsttiger's avatar
wsttiger committed
30
31
32
33
34
namespace gpu {

// Validates the operator's inputs and computes the resulting output shape.
//
// Exactly four input shapes are required and all must pass the `standard()`
// check. Only the first two are handed to the wrapped convolution operator
// (`op`) for shape computation, after verifying they have at most 5
// dimensions.
shape miopen_convolution::compute_shape(const std::vector<shape>& inputs) const
{
    check_shapes{inputs, *this}.has(4).standard();

    // Slice off the leading pair of shapes; the remaining two inputs take no
    // part in the shape computation below.
    const auto first = inputs.begin();
    std::vector<shape> conv_operands(first, first + 2);
    check_shapes{conv_operands, *this}.max_ndims(5);

    return op.normalize_compute_shape(conv_operands);
}
kahmed10's avatar
kahmed10 committed
39

kahmed10's avatar
kahmed10 committed
40
// Returns a shape suitable for building a tensor descriptor.
//
// A rank-3 shape gets a unit dimension inserted at index 2 (so {a, b, c}
// becomes {a, b, 1, c}) and is rebuilt from the element type and the new
// lengths. Any other rank is returned as an unmodified copy of `input`.
inline shape reshape_if_1d(const shape& input)
{
    const auto& lens = input.lens();
    if(lens.size() != 3)
        return input;

    std::vector<size_t> expanded(lens.begin(), lens.end());
    expanded.insert(expanded.begin() + 2, 1);
    return shape{input.type(), expanded};
}

wsttiger's avatar
wsttiger committed
54
55
56
// Executes the forward convolution through MIOpen's immediate-mode API.
//
// Argument layout, as used below:
//   args[0] - input tensor (x)
//   args[1] - weights tensor (w)
//   args[2] - workspace buffer (its byte size is passed to MIOpen)
//   args[3] - output tensor (y), which is also the returned argument
//
// Throws if no solution has been selected yet (`solution_id == 0`) or if
// MIOpen reports a failure.
argument miopen_convolution::compute(context& ctx,
                                     const shape& output_shape,
                                     const std::vector<argument>& args) const
{
    const argument& input     = args[0];
    const argument& weights   = args[1];
    const argument& workspace = args[2];
    const argument& output    = args[3];

    // Rank-3 shapes are expanded by reshape_if_1d before the descriptors
    // are created.
    auto x_desc = make_tensor(reshape_if_1d(input.get_shape()));
    auto w_desc = make_tensor(reshape_if_1d(weights.get_shape()));
    auto y_desc = make_tensor(reshape_if_1d(output_shape));

    if(solution_id == 0)
    {
        MIGRAPHX_THROW("MIOpen Convolution: invalid solution ID");
    }

    // Note the MIOpen parameter order: weights come before the input.
    const auto run_status =
        miopenConvolutionForwardImmediate(ctx.get_stream().get_miopen(),
                                          w_desc.get(),
                                          weights.implicit(),
                                          x_desc.get(),
                                          input.implicit(),
                                          cd.get(),
                                          y_desc.get(),
                                          output.implicit(),
                                          workspace.implicit(),
                                          workspace.get_shape().bytes(),
                                          solution_id);

    if(run_status != miopenStatusSuccess)
    {
        MIGRAPHX_THROW("MIOpen Convolution: running convolution failed");
    }

    return output;
}

82
// Searches for a forward-convolution algorithm and an immediate-mode solution
// for the given input/output shapes.
//
// Steps:
//   1. Query the workspace size MIOpen needs for this configuration.
//   2. Run miopenFindConvolutionForwardAlgorithm on device buffers built from
//      generate_argument()/allocate_gpu() and record the chosen algorithm in
//      `algo`.
//   3. Query the available immediate-mode solutions and store the first one's
//      id in `solution_id`.
//
// inputs[0] is the input (x) shape and inputs[1] the weights (w) shape.
//
// Returns an int8 shape whose single dimension is the workspace memory
// reported by the find step (`perf.memory`).
//
// Throws if any MIOpen call fails, if the find step returns no algorithm, or
// if no solution is available.
shape miopen_convolution::find(context& ctx, const shape& output_shape, std::vector<shape> inputs)
{
    auto x_desc = make_tensor(reshape_if_1d(inputs[0]));
    auto w_desc = make_tensor(reshape_if_1d(inputs[1]));
    auto y_desc = make_tensor(reshape_if_1d(output_shape));

    std::size_t workspace_size = 0;
    auto status = miopenConvolutionForwardGetWorkSpaceSize(ctx.get_stream().get_miopen(),
                                                           w_desc.get(),
                                                           x_desc.get(),
                                                           cd.get(),
                                                           y_desc.get(),
                                                           &workspace_size);
    // Previously this status was ignored, so a failed query silently produced
    // a zero-sized workspace for the search below.
    if(status != miopenStatusSuccess)
        MIGRAPHX_THROW("MIOpen Convolution: get workspace size failed");

    const shape workspace_shape{shape::int8_type, {workspace_size}};

    auto x         = to_gpu(generate_argument(inputs[0]));
    auto w         = to_gpu(generate_argument(inputs[1]));
    auto y         = allocate_gpu(output_shape);
    auto workspace = allocate_gpu(workspace_shape);

    // Value-initialise so nothing indeterminate is read if MIOpen reports
    // fewer results than requested.
    int algo_count = 0;
    miopenConvAlgoPerf_t perf{};
    status = miopenFindConvolutionForwardAlgorithm(ctx.get_stream().get_miopen(),
                                                   x_desc.get(),
                                                   x.implicit(),
                                                   w_desc.get(),
                                                   w.implicit(),
                                                   cd.get(),
                                                   y_desc.get(),
                                                   y.implicit(),
                                                   1,
                                                   &algo_count,
                                                   &perf,
                                                   workspace.implicit(),
                                                   workspace_size,
                                                   false);
    if(status != miopenStatusSuccess)
        MIGRAPHX_THROW("MIOpen Convolution: find convolution failed");
    if(algo_count < 1)
        MIGRAPHX_THROW("MIOpen Convolution: find convolution returned no algorithm");
    algo = perf.fwd_algo;

    std::size_t solution_count = 0;
    status = miopenConvolutionForwardGetSolutionCount(ctx.get_stream().get_miopen(),
                                                      w_desc.get(),
                                                      x_desc.get(),
                                                      cd.get(),
                                                      y_desc.get(),
                                                      &solution_count);
    if(status != miopenStatusSuccess)
        MIGRAPHX_THROW("MIOpen Convolution: get solution count failed");
    // An empty vector would make solutions.front() undefined behaviour.
    if(solution_count == 0)
        MIGRAPHX_THROW("MIOpen Convolution: no solutions found");

    std::vector<miopenConvSolution_t> solutions(solution_count);

    // solution_count is both the capacity passed in and the out-parameter that
    // receives the number of solutions actually written.
    status = miopenConvolutionForwardGetSolution(ctx.get_stream().get_miopen(),
                                                 w_desc.get(),
                                                 x_desc.get(),
                                                 cd.get(),
                                                 y_desc.get(),
                                                 solutions.size(),
                                                 &solution_count,
                                                 solutions.data());
    if(status != miopenStatusSuccess)
        MIGRAPHX_THROW("MIOpen Convolution: get solution failed");
    if(solution_count == 0)
        MIGRAPHX_THROW("MIOpen Convolution: no solutions found");

    solution_id = solutions.front().solution_id;

    return shape{shape::int8_type, {perf.memory}};
}

Paul's avatar
Paul committed
153
154
155
// Prepares the operator for execution.
//
// Creates the convolution descriptor if it is missing. If no solution has
// been selected yet, runs find() and verifies that the workspace it reports
// fits within inputs.at(2). Finally asks MIOpen to compile the selected
// solution.
//
// Throws if the required workspace exceeds the one provided or if the
// compile step fails.
void miopen_convolution::finalize(context& ctx,
                                  const shape& output_shape,
                                  std::vector<shape> inputs)
{
    if(cd == nullptr)
    {
        cd = make_conv(op);
    }

    if(solution_id == 0)
    {
        // The workspace reported by find() must not exceed the workspace
        // shape that was passed in.
        const auto provided_bytes = inputs.at(2).bytes();
        const auto found_ws       = find(ctx, output_shape, inputs);
        if(found_ws.bytes() > provided_bytes)
        {
            MIGRAPHX_THROW("MIOpen Convolution: workspace has changed during finalization.");
        }
    }

    auto input_desc   = make_tensor(reshape_if_1d(inputs[0]));
    auto weights_desc = make_tensor(reshape_if_1d(inputs[1]));
    auto output_desc  = make_tensor(reshape_if_1d(output_shape));

    const auto compile_status =
        miopenConvolutionForwardCompileSolution(ctx.get_stream().get_miopen(),
                                                weights_desc.get(),
                                                input_desc.get(),
                                                cd.get(),
                                                output_desc.get(),
                                                solution_id);
    if(compile_status != miopenStatusSuccess)
    {
        MIGRAPHX_THROW("MIOpen Convolution: compile solution failed");
    }
}

wsttiger's avatar
wsttiger committed
182
} // namespace gpu
Paul's avatar
Paul committed
183
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
184
} // namespace migraphx