/*
 * The MIT License (MIT)
 *
 * Copyright (c) 2015-2023 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */
#include <migraphx/onnx/op_parser.hpp>
#include <migraphx/onnx/checks.hpp>
#include <migraphx/ranges.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/make_op.hpp>
#include <random>

namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
namespace onnx {

// Parser for the ONNX "Multinomial" operator.
//
// From the first input it builds a chain of instructions (reduce_max -> sub -> exp ->
// prefix_scan_sum along axis 1), adds a "rand_uniform" instruction to supply random numbers,
// and returns a "multinomial" instruction that consumes both.
struct parse_multinomial : op_parser<parse_multinomial>
{
    // Names of the ONNX operators handled by this parser.
    std::vector<op_desc> operators() const { return {{"Multinomial"}}; }

    // Builds the instruction sequence for one Multinomial node.
    //
    // info: node information; the attributes "dtype", "sample_size" and "seed" are read from it
    //       and all new instructions/literals are added through it.
    // args: node inputs; args[0] is the only one used.
    //
    // Returns the final "multinomial" instruction.
    // Throws (via MIGRAPHX_THROW) when no input is supplied, when "sample_size" is missing,
    // or when "sample_size" is negative.
    instruction_ref parse(const op_desc& /*opd*/,
                          const onnx_parser& /*parser*/,
                          const onnx_parser::node_info& info,
                          std::vector<instruction_ref> args) const
    {
        // args[0] is used unconditionally below, so reject an empty input list up front
        // instead of indexing out of bounds.
        if(args.empty())
            MIGRAPHX_THROW("PARSE_MULTINOMIAL: input not given");

        // Output element type; falls back to 6 (int32 in the ONNX TensorProto data-type enum)
        // when the attribute is absent.
        int dtype = 6;
        if(contains(info.attributes, "dtype"))
            dtype = info.attributes.at("dtype").i();
        shape::type_t output_type = get_type(dtype);

        if(not contains(info.attributes, "sample_size"))
            MIGRAPHX_THROW("PARSE_MULTINOMIAL: sample_size not given");
        const auto sample_size_attr = info.attributes.at("sample_size").i();
        // A negative value would wrap around to a huge unsigned count when converted.
        if(sample_size_attr < 0)
            MIGRAPHX_THROW("PARSE_MULTINOMIAL: sample_size must not be negative");
        const size_t sample_size = sample_size_attr;

        // Subtract the per-batch maximum log-probability, making the per-batch max 0
        auto maxes =
            info.add_instruction(migraphx::make_op("reduce_max", {{"axes", {1}}}), args[0]);
        auto cdf = info.add_common_op("sub", args[0], maxes);
        // Take the element-wise exponent to get probabilities in the range (0, 1]
        cdf = info.add_instruction(migraphx::make_op("exp"), cdf);
        // Compute the cumulative density function
        cdf = info.add_instruction(
            migraphx::make_op("prefix_scan_sum", {{"axis", 1}, {"exclusive", false}}), cdf);

        // When no seed attribute is present the op is told to pick its own seed.
        // NOTE(review): the ONNX spec declares "seed" as a float attribute, but it is read
        // here through .i() -- confirm which field the rand_uniform op is meant to receive.
        const bool has_seed = contains(info.attributes, "seed");
        uint32_t seed(0);
        if(has_seed)
            seed = info.attributes.at("seed").i();
        const auto rand_op =
            migraphx::make_op("rand_uniform", {{"seed", seed}, {"use_auto_seed", not has_seed}});

        instruction_ref randoms;
        shape s0 = args[0]->get_shape();
        // TODO: Use literal if batch size is fixed
        if(s0.dynamic())
        {
            // Dynamic batch_size will be taken from args[0].  Other contents of input are
            // ignored here.  sample_size is not forwarded to the op on this path.
            randoms = info.add_instruction(rand_op, args[0]);
        }
        else
        {
            // Static shape: the batch size is the leading dimension of the input, and a
            // placeholder literal is handed to rand_uniform.  It may be quite large.
            // NOTE(review): confirm this literal constructor produces batch_size * sample_size
            // elements rather than a single element holding that value.
            const size_t batch_size = s0.lens().front();
            auto rand_dummy         = info.add_literal(
                migraphx::literal{migraphx::shape::float_type, {batch_size * sample_size}});

            randoms = info.add_instruction(rand_op, rand_dummy);
        }

        return info.add_instruction(
            migraphx::make_op("multinomial", {{"dtype", output_type}}), cdf, randoms);
    }
};

} // namespace onnx
} // namespace MIGRAPHX_INLINE_NS
} // namespace migraphx