batchnorm.cpp 1.84 KB
Newer Older
Paul's avatar
Paul committed
1
2
3
4
#include <migraphx/gpu/batchnorm.hpp>
#include <migraphx/operators.hpp>
#include <migraphx/manage_ptr.hpp>
#include <migraphx/gpu/miopen.hpp>

#include <stdexcept>
#include <utility>

Paul's avatar
Paul committed
7
namespace migraphx {
Paul's avatar
Paul committed
8
inline namespace MIGRAPHX_INLINE_NS {
9
10
11
12
13
namespace gpu {

/// Computes the output shape of the GPU batch-norm inference operator.
///
/// Exactly six input shapes are required (enforced through check_shapes).
/// Only the first five are forwarded to the wrapped operator's
/// compute_shape; the sixth is not consulted when deriving the result.
///
/// @param inputs Shapes of the operator's arguments.
/// @return Whatever shape the wrapped operator reports for the first five inputs.
shape miopen_batch_norm_inference::compute_shape(const std::vector<shape>& inputs) const
{
    check_shapes{inputs, *this}.has(6);

    // Collect the leading five shapes; .at() keeps the access bounds-checked.
    std::vector<shape> op_inputs;
    op_inputs.reserve(5);
    for(std::size_t i = 0; i < 5; ++i)
    {
        op_inputs.push_back(inputs.at(i));
    }

    return op.compute_shape(op_inputs);
}

wsttiger's avatar
wsttiger committed
17
18
19
/// Runs MIOpen's batch-normalization forward-inference routine on the MIOpen
/// handle obtained from the context's stream.
///
/// Argument usage, as visible from the call below:
///   - args[0]      input tensor (its shape builds the input descriptor)
///   - args[1..4]   passed, in order, as the four buffers that follow the
///                  batch-norm descriptor in the MIOpen call (scale, bias,
///                  estimated mean, estimated variance per the MIOpen API);
///                  the descriptor itself is built from args[3]'s shape
///   - args[5]      output buffer; handed to MIOpen as `y` and returned
///
/// @param ctx          GPU context supplying the MIOpen handle.
/// @param output_shape Shape used to build the output tensor descriptor.
/// @param args         The six arguments described above.
/// @return args[5], the buffer MIOpen was asked to write the result into.
/// @throws std::runtime_error if MIOpen reports anything other than
///         miopenStatusSuccess.
argument miopen_batch_norm_inference::compute(context& ctx,
                                              const shape& output_shape,
                                              const std::vector<argument>& args) const
{
    auto x_desc  = make_tensor(args[0].get_shape());
    auto y_desc  = make_tensor(output_shape);
    auto bn_desc = make_tensor(args[3].get_shape());

    // Blend factors handed to MIOpen by address. They are deliberately left
    // non-const because the MIOpen entry point takes them as mutable pointers.
    float alpha = 1.0f;
    float beta  = 0.0f;

    auto status = miopenBatchNormalizationForwardInference(ctx.get_stream().get_miopen(),
                                                           static_cast<miopenBatchNormMode_t>(op.bn_mode),
                                                           &alpha,
                                                           &beta,
                                                           x_desc.get(),
                                                           args[0].implicit(),
                                                           y_desc.get(),
                                                           args[5].implicit(),
                                                           bn_desc.get(),
                                                           args[1].implicit(),
                                                           args[2].implicit(),
                                                           args[3].implicit(),
                                                           args[4].implicit(),
                                                           op.epsilon);

    // Previously the status was dropped, so a failed call silently returned an
    // output buffer with undefined contents. Surface the failure instead.
    if(status != miopenStatusSuccess)
    {
        throw std::runtime_error("miopen_batch_norm_inference: "
                                 "miopenBatchNormalizationForwardInference failed");
    }

    return args[5];
}

} // namespace gpu
Paul's avatar
Paul committed
47
} // namespace MIGRAPHX_INLINE_NS
Paul's avatar
Paul committed
48
} // namespace migraphx