Commit edc23800 authored by Shucai Xiao

change the data type for lens and strides from size_t to int in the shape class

parent c7419a9c
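The diff below touches many operators and headers, but the net effect on callers is that `shape` lens and strides become `std::vector<int>`. A minimal caller-side sketch of the re-typed interface, based on the `shape` declarations changed in this commit; the `<migraphx/shape.hpp>` include path and the sample numbers are assumptions for illustration, not part of the commit:

```cpp
#include <migraphx/shape.hpp>
#include <iostream>
#include <vector>

int main()
{
    // Packed 2x3x4 float shape; lens() and strides() now return std::vector<int>.
    migraphx::shape s{migraphx::shape::float_type, std::vector<int>{2, 3, 4}};

    const std::vector<int>& lens    = s.lens();     // {2, 3, 4}
    const std::vector<int>& strides = s.strides();  // {12, 4, 1} for a packed shape

    int n = s.elements();                           // 24
    int i = s.index({1, 2, 3});                     // 1*12 + 2*4 + 3*1 = 23

    std::cout << lens.size() << " " << strides.size() << " " << n << " " << i << "\n";
}
```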
......@@ -22,9 +22,9 @@ namespace op {
struct pooling
{
std::string mode = "average";
std::vector<std::size_t> padding = {0, 0};
std::vector<std::size_t> stride = {1, 1};
std::vector<std::size_t> lengths = {1, 1};
std::vector<int> padding = {0, 0};
std::vector<int> stride = {1, 1};
std::vector<int> lengths = {1, 1};
bool ceil_mode = false;
template <class Self, class F>
......@@ -65,7 +65,7 @@ struct pooling
MIGRAPHX_THROW("POOLING: input and attribute size mismatch!");
}
std::vector<std::size_t> output_lens(input_lens.begin(), input_lens.begin() + 2);
std::vector<int> output_lens(input_lens.begin(), input_lens.begin() + 2);
for(size_t i = 0; i < kdims; i++)
{
......@@ -75,10 +75,10 @@ struct pooling
padding_factor = padding[i] + padding[i + kdims];
dim_size = input_lens[i + 2] + padding_factor - lengths[i];
assert(dim_size >= 0);
std::size_t len = (ceil_mode) ? ceil_divide<std::ptrdiff_t>(dim_size, stride[i])
int len = (ceil_mode) ? ceil_divide<std::ptrdiff_t>(dim_size, stride[i])
: floor_divide<std::ptrdiff_t>(dim_size, stride[i]);
output_lens.push_back(std::size_t(std::max<std::ptrdiff_t>(1, len + 1)));
output_lens.push_back(int(std::max<std::ptrdiff_t>(1, len + 1)));
}
return inputs[0].with_lens(output_lens);
}
......
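As a worked illustration of the pooling output-length arithmetic in the hunk above, now carried out with `int`: a standalone sketch with local stand-ins for `ceil_divide`/`floor_divide` (the stand-in definitions and the sample numbers are assumptions, not the library's own helpers):

```cpp
#include <algorithm>
#include <cstdio>

// Local stand-ins for the divide helpers, assuming positive operands.
static int floor_divide(int a, int b) { return a / b; }
static int ceil_divide(int a, int b) { return (a + b - 1) / b; }

int main()
{
    // Hypothetical 1-D pooling window: length-7 input, kernel 3, stride 2, pad 1 each side.
    int input_len = 7, pad_l = 1, pad_r = 1, kernel = 3, stride = 2;
    bool ceil_mode = false;

    int dim_size = input_len + pad_l + pad_r - kernel;        // 7 + 2 - 3 = 6
    int len      = ceil_mode ? ceil_divide(dim_size, stride)
                             : floor_divide(dim_size, stride); // 6 / 2 = 3
    int out_len  = std::max(1, len + 1);                       // output length 4
    std::printf("output length: %d\n", out_len);
}
```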
......@@ -19,9 +19,9 @@ namespace op {
struct quant_convolution
{
std::vector<std::size_t> padding = {0, 0};
std::vector<std::size_t> stride = {1, 1};
std::vector<std::size_t> dilation = {1, 1};
std::vector<int> padding = {0, 0};
std::vector<int> stride = {1, 1};
std::vector<int> dilation = {1, 1};
padding_mode_t padding_mode = default_;
int group = 1;
......@@ -60,7 +60,7 @@ struct quant_convolution
const shape& input = inputs.at(0);
const shape& weights = inputs.at(1);
auto t = input.type();
size_t kdims = input.lens().size() - 2;
int kdims = input.lens().size() - 2;
if(kdims != this->kdims())
{
MIGRAPHX_THROW("quant_convolution: input k-dims does not match attribute size");
......@@ -73,14 +73,14 @@ struct quant_convolution
}
t = shape::int32_type;
std::vector<size_t> output_lens{input.lens()[0], weights.lens()[0]};
std::vector<int> output_lens{input.lens()[0], weights.lens()[0]};
auto padding_size = padding.size();
for(size_t i = 0; i < kdims; i++)
for(int i = 0; i < kdims; i++)
{
auto padding_factor = 2 * padding[i];
if(padding_size == 2 * kdims)
padding_factor = padding[i] + padding[i + kdims];
output_lens.push_back(std::size_t(std::max<std::ptrdiff_t>(
output_lens.push_back(int(std::max<std::ptrdiff_t>(
1,
(input.lens()[i + 2] - (1 + dilation[i] * (weights.lens()[i + 2] - 1)) +
padding_factor) /
......@@ -91,7 +91,7 @@ struct quant_convolution
return inputs[0].with_lens(t, output_lens);
}
size_t kdims() const
int kdims() const
{
check_attribute_size();
return stride.size();
......
......@@ -69,7 +69,7 @@ struct reduce_op : op_name<Derived>
return {{"normalize_axes", normalize}};
}
std::vector<int64_t> tune_axes(std::size_t n_dim) const
std::vector<int64_t> tune_axes(int n_dim) const
{
auto tuned_axes = axes;
if(tuned_axes.empty())
......@@ -110,7 +110,7 @@ struct reduce_op : op_name<Derived>
void reduce(tensor_view<T>& input,
shape& batch_shape,
std::vector<int64_t>& tuned_axes,
std::vector<std::size_t>& out_idx,
std::vector<int>& out_idx,
tensor_view<T>& output) const
{
using accumulator = accumulator_type<T>;
......@@ -132,7 +132,7 @@ struct reduce_op : op_name<Derived>
argument result{output_shape};
auto arg_lens = args.front().get_shape().lens();
auto tuned_axes = tune_axes(arg_lens.size());
std::vector<std::size_t> batch_lens(output_shape.lens().size(), 1);
std::vector<int> batch_lens(output_shape.lens().size(), 1);
tune_dims(tuned_axes, arg_lens, batch_lens);
shape batch_shape{output_shape.type(), batch_lens};
visit_all(result, args[0])([&](auto output, auto input) {
......
......@@ -20,7 +20,7 @@ namespace op {
struct rnn
{
std::size_t hidden_size = 1;
int hidden_size = 1;
std::vector<operation> actv_funcs{tanh{}, tanh{}};
rnn_direction direction = rnn_direction::forward;
float clip = 0.0f;
......@@ -44,7 +44,7 @@ struct rnn
MIGRAPHX_THROW("RNN: hidden size mismatch in attribute and input");
}
std::size_t num_directions = 1;
int num_directions = 1;
if(direction == rnn_direction::bidirectional)
{
num_directions = 2;
......@@ -55,7 +55,7 @@ struct rnn
MIGRAPHX_THROW("RNN: num_direction mismatch in attribute and input");
}
std::vector<std::size_t> out_dims(in_dims);
std::vector<int> out_dims(in_dims);
out_dims.insert(out_dims.begin() + 1, num_directions);
out_dims.back() = hidden_size;
......
......@@ -65,7 +65,7 @@ struct roialign
MIGRAPHX_THROW("ROIALIGN: rois and batch indices inputs should have the same number!");
}
std::vector<std::size_t> out_lens = x_lens;
std::vector<int> out_lens = x_lens;
out_lens[0] = roi_lens[0];
out_lens[2] = output_height;
out_lens[3] = output_width;
......@@ -76,27 +76,27 @@ struct roialign
struct pos_weight
{
// neighbor indices for the bilinear interpolation
std::array<std::size_t, 4> pos = {0, 0, 0, 0};
std::array<int, 4> pos = {0, 0, 0, 0};
// neighbor weights for the bilinear interpolation
std::array<float, 4> w = {0.0f, 0.0f, 0.0f, 0.0f};
};
auto calc_pos_weight(const std::array<std::size_t, 2>& dims,
auto calc_pos_weight(const std::array<int, 2>& dims,
const shape& comp_s,
const std::array<float, 2>& roi_start,
const std::array<float, 2>& bin_size,
const std::array<std::size_t, 2>& bin_grid_size) const
const std::array<int, 2>& bin_grid_size) const
{
std::vector<pos_weight> results(bin_grid_size[0] * bin_grid_size[1] * output_height *
output_width);
shape_for_each(comp_s, [&](auto idx) {
std::array<std::size_t, 2> p = {idx[0], idx[1]};
std::array<std::size_t, 2> i = {idx[2], idx[3]};
std::array<int, 2> p = {idx[0], idx[1]};
std::array<int, 2> i = {idx[2], idx[3]};
auto index = comp_s.index(idx);
std::array<float, 2> xy{};
std::array<int64_t, 2> low{};
std::array<int64_t, 2> high{};
std::array<int, 2> low{};
std::array<int, 2> high{};
for(auto ii : range(p.size()))
{
xy[ii] = roi_start[ii] + p[ii] * bin_size[ii] +
......@@ -140,7 +140,7 @@ struct roialign
double operator()(double x, double y) { return std::max(x, y); }
double final(double x, std::size_t) { return (x); }
double final(double x, int) { return (x); }
};
struct avg_pool
......@@ -149,12 +149,12 @@ struct roialign
double operator()(double x, double y) { return x + y; }
double final(double x, std::size_t y) { return (y == 0) ? 0.0 : (x / y); }
double final(double x, int y) { return (y == 0) ? 0.0 : (x / y); }
};
template <class T, class Op>
std::tuple<double, int64_t> calc_pooling(const T& data,
const std::array<std::size_t, 2>& bin_grid_size,
const std::array<int, 2>& bin_grid_size,
const std::vector<pos_weight>& pos_weights,
int64_t index,
Op op) const
......@@ -182,13 +182,13 @@ struct roialign
argument result{output_shape};
const auto& out_lens = output_shape.lens();
int64_t n_rois = out_lens[0];
std::size_t channels = out_lens[1];
int channels = out_lens[1];
// output dims of height and width, in all 2-dim arrays, the first dim
// is for height and second dim is for width
std::array<std::size_t, 2> out_dims = {out_lens[2], out_lens[3]};
std::array<int, 2> out_dims = {out_lens[2], out_lens[3]};
const auto& x_lens = args.at(0).get_shape().lens();
// input dims of height and width
std::array<std::size_t, 2> in_dims = {x_lens[2], x_lens[3]};
std::array<int, 2> in_dims = {x_lens[2], x_lens[3]};
auto roi_s = args.at(1).get_shape();
visit_all(result, args.at(0), args.at(1))([&](auto output, auto x, auto roi) {
......@@ -207,7 +207,7 @@ struct roialign
// Force malformed ROIs to be 1x1
std::array<float, 2> roi_size{};
std::array<float, 2> bin_size{};
std::array<std::size_t, 2> bin_grid_size{};
std::array<int, 2> bin_grid_size{};
for(auto ii : range(roi_size.size()))
{
......@@ -222,13 +222,13 @@ struct roialign
// we want to precalculate indices and weights shared by all channels,
// this is the key point of optimization
std::vector<std::size_t> comp_lens = {
std::vector<int> comp_lens = {
out_dims[0], out_dims[1], bin_grid_size[0], bin_grid_size[1]};
shape comp_s{shape::float_type, comp_lens};
auto pre_calc =
this->calc_pos_weight(in_dims, comp_s, roi_starts, bin_size, bin_grid_size);
std::vector<std::size_t> comp_lens1 = {channels, out_dims[0], out_dims[1]};
std::vector<int> comp_lens1 = {channels, out_dims[0], out_dims[1]};
shape comp_s1{migraphx::shape::float_type, comp_lens1};
std::vector<int64_t> vec_index(channels, 0);
shape_for_each(comp_s1, [&](auto idx) {
......
......@@ -46,22 +46,22 @@ struct slice
std::string name() const { return "slice"; }
auto fix_index(const std::vector<std::size_t>& lens, std::size_t axis, int64_t index) const
auto fix_index(const std::vector<int>& lens, int axis, int64_t index) const
{
int64_t r = std::min(index, static_cast<int64_t>(lens[axis]));
if(r < 0)
r += lens[axis];
return std::size_t(r);
return int(r);
}
auto compute_offset(const shape& s) const
{
const std::vector<std::size_t>& lens = s.lens();
const std::vector<std::size_t>& strides = s.strides();
const std::vector<int>& lens = s.lens();
const std::vector<int>& strides = s.strides();
auto offset = 0;
if(!axes.empty())
{
for(std::size_t i = 0; i < axes.size(); i++)
for(int i = 0; i < axes.size(); i++)
{
auto axis = axes[i];
offset += fix_index(lens, axis, starts[i]) * strides[axis];
......@@ -69,7 +69,7 @@ struct slice
}
else
{
for(std::size_t axis = 0; axis < lens.size(); axis++)
for(int axis = 0; axis < lens.size(); axis++)
{
offset += fix_index(lens, axis, starts[axis]) * strides[axis];
}
......@@ -95,8 +95,8 @@ struct slice
MIGRAPHX_THROW("SLICE: inconsistent sizes");
}
std::vector<std::size_t> new_lens = old_lens;
for(std::size_t i = 0; i < axes.size(); i++)
std::vector<int> new_lens = old_lens;
for(int i = 0; i < axes.size(); i++)
{
auto axis = axes[i];
new_lens[axis] =
......
......@@ -28,23 +28,23 @@ struct joinable_thread : std::thread
};
template <class F>
auto thread_invoke(std::size_t i, std::size_t tid, F f) -> decltype(f(i, tid))
auto thread_invoke(int i, int tid, F f) -> decltype(f(i, tid))
{
f(i, tid);
}
template <class F>
auto thread_invoke(std::size_t i, std::size_t, F f) -> decltype(f(i))
auto thread_invoke(int i, int, F f) -> decltype(f(i))
{
f(i);
}
template <class F>
void par_for_impl(std::size_t n, std::size_t threadsize, F f)
void par_for_impl(int n, int threadsize, F f)
{
if(threadsize <= 1)
{
for(std::size_t i = 0; i < n; i++)
for(int i = 0; i < n; i++)
thread_invoke(i, 0, f);
}
else
......@@ -54,15 +54,15 @@ void par_for_impl(std::size_t n, std::size_t threadsize, F f)
#if(!defined(__GNUC__) || __GNUC__ != 5)
const
#endif
std::size_t grainsize = std::ceil(static_cast<double>(n) / threads.size());
int grainsize = std::ceil(static_cast<double>(n) / threads.size());
std::size_t work = 0;
std::size_t tid = 0;
int work = 0;
int tid = 0;
std::generate(threads.begin(), threads.end(), [=, &work, &tid] {
auto result = joinable_thread([=] {
std::size_t start = work;
std::size_t last = std::min(n, work + grainsize);
for(std::size_t i = start; i < last; i++)
int start = work;
int last = std::min(n, work + grainsize);
for(int i = start; i < last; i++)
{
thread_invoke(i, tid, f);
}
......@@ -76,15 +76,15 @@ void par_for_impl(std::size_t n, std::size_t threadsize, F f)
}
template <class F>
void par_for(std::size_t n, std::size_t min_grain, F f)
void par_for(int n, int min_grain, F f)
{
const auto threadsize = std::min<std::size_t>(std::thread::hardware_concurrency(),
n / std::max<std::size_t>(1, min_grain));
const auto threadsize = std::min<int>(std::thread::hardware_concurrency(),
n / std::max<int>(1, min_grain));
par_for_impl(n, threadsize, f);
}
template <class F>
void par_for(std::size_t n, F f)
void par_for(int n, F f)
{
const int min_grain = 8;
par_for(n, min_grain, f);
......
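A usage sketch for the re-typed `par_for`, assuming it lives in the `migraphx` namespace under a `<migraphx/par_for.hpp>` header path (the path is an assumption). `thread_invoke` dispatches to either an `f(i)` or an `f(i, tid)` callable, so a single-argument lambda is enough here:

```cpp
#include <migraphx/par_for.hpp>
#include <vector>

int main()
{
    std::vector<float> data(1024);

    // f(i) overload: thread_invoke picks the single-argument form; the default
    // min_grain of 8 keeps at least 8 elements of work per thread.
    migraphx::par_for(static_cast<int>(data.size()),
                      [&](int i) { data[i] = 0.5f * static_cast<float>(i); });
}
```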
......@@ -69,7 +69,7 @@ struct rewrite_rnn
instruction_ref last_cell_output,
op::rnn_direction dirct) const;
std::size_t
int
get_seq_len(const module& prog, instruction_ref input, instruction_ref seq_lens) const;
instruction_ref pad_hidden_states(module& prog,
......
......@@ -66,52 +66,52 @@ struct shape
shape();
shape(type_t t);
shape(type_t t, std::vector<std::size_t> l);
shape(type_t t, std::vector<std::size_t> l, std::vector<std::size_t> s);
shape(type_t t, std::vector<int> l);
shape(type_t t, std::vector<int> l, std::vector<int> s);
template <class Range>
shape(type_t t, const Range& l) : shape(t, std::vector<std::size_t>(l.begin(), l.end()))
shape(type_t t, const Range& l) : shape(t, std::vector<int>(l.begin(), l.end()))
{
}
template <class Range1, class Range2>
shape(type_t t, const Range1& l, const Range2& s)
: shape(t,
std::vector<std::size_t>(l.begin(), l.end()),
std::vector<std::size_t>(s.begin(), s.end()))
std::vector<int>(l.begin(), l.end()),
std::vector<int>(s.begin(), s.end()))
{
}
shape(const std::vector<shape>& subs);
static shape
from_permutation(type_t t, const std::vector<std::size_t>& l, const std::vector<int64_t>& perm);
from_permutation(type_t t, const std::vector<int>& l, const std::vector<int64_t>& perm);
type_t type() const;
const std::vector<std::size_t>& lens() const;
const std::vector<std::size_t>& strides() const;
std::size_t elements() const;
std::size_t bytes() const;
std::size_t type_size() const;
const std::vector<int>& lens() const;
const std::vector<int>& strides() const;
int elements() const;
int bytes() const;
int type_size() const;
/// Map multiple indices to space index
std::size_t index(std::initializer_list<std::size_t> l) const;
int index(std::initializer_list<int> l) const;
/// Map multiple indices to space index
std::size_t index(const std::vector<std::size_t>& l) const;
int index(const std::vector<int>& l) const;
/// Map multiple indices from a range of iterator to a space index
template <class Iterator>
std::size_t index(Iterator start, Iterator last) const
int index(Iterator start, Iterator last) const
{
assert(std::distance(start, last) <= this->lens().size());
assert(this->lens().size() == this->strides().size());
return std::inner_product(start, last, this->strides().begin(), std::size_t{0}); // NOLINT
return std::inner_product(start, last, this->strides().begin(), int{0}); // NOLINT
}
/// Map element index to space index
std::size_t index(std::size_t i) const;
int index(int i) const;
std::vector<std::size_t> multi(std::size_t i) const;
void multi_copy(std::size_t i, std::size_t* start, const std::size_t* end) const;
std::vector<int> multi(int i) const;
void multi_copy(int i, int* start, const int* end) const;
/// Returns true if the shape is packed with no padding
bool packed() const;
......@@ -128,8 +128,8 @@ struct shape
shape normalize_standard() const;
shape with_lens(type_t t, const std::vector<std::size_t>& l) const;
shape with_lens(const std::vector<std::size_t>& l) const;
shape with_lens(type_t t, const std::vector<int>& l) const;
shape with_lens(const std::vector<int>& l) const;
friend bool operator==(const shape& x, const shape& y);
friend bool operator!=(const shape& x, const shape& y);
......@@ -164,16 +164,16 @@ struct shape
type operator()() const { return {}; }
std::size_t size(std::size_t n = 1) const { return sizeof(type) * n; }
int size(int n = 1) const { return sizeof(type) * n; }
template <class U>
type* from(U* buffer, std::size_t n = 0) const
type* from(U* buffer, int n = 0) const
{
return reinterpret_cast<type*>(buffer) + n;
}
template <class U>
const type* from(const U* buffer, std::size_t n = 0) const
const type* from(const U* buffer, int n = 0) const
{
return reinterpret_cast<const type*>(buffer) + n;
}
......@@ -227,7 +227,7 @@ struct shape
private:
std::shared_ptr<const shape_impl> impl;
std::size_t element_space() const;
int element_space() const;
};
void migraphx_to_value(value& v, const shape& s);
......
......@@ -12,16 +12,16 @@ template <class F>
void shape_for_each(const migraphx::shape& s, F f)
{
// Ensure calls to f use const ref to vector
auto call = [&f](const std::vector<std::size_t>& i) { f(i); };
std::vector<std::size_t> indices(s.lens().size());
auto call = [&f](const std::vector<int>& i) { f(i); };
std::vector<int> indices(s.lens().size());
shape ss{s.type(), s.lens()};
for(std::size_t i = 0; i < ss.elements(); i++)
for(int i = 0; i < ss.elements(); i++)
{
std::transform(ss.strides().begin(),
ss.strides().end(),
ss.lens().begin(),
indices.begin(),
[&](std::size_t stride, std::size_t len) {
[&](int stride, int len) {
assert(len > 0 and stride > 0);
return (i / stride) % len;
});
......
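A usage sketch for `shape_for_each` after the change, assuming the `migraphx` namespace and header layout (the include paths are assumptions); the callback now receives each multi-index as a `const std::vector<int>&`:

```cpp
#include <migraphx/shape.hpp>
#include <migraphx/shape_for_each.hpp>
#include <iostream>
#include <vector>

int main()
{
    migraphx::shape s{migraphx::shape::float_type, std::vector<int>{2, 3}};

    // Visits every multi-index of s in element order: (0,0), (0,1), ... (1,2).
    migraphx::shape_for_each(s, [&](const std::vector<int>& idx) {
        std::cout << "(" << idx[0] << ", " << idx[1] << ")\n";
    });
}
```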
......@@ -25,7 +25,7 @@ template <class T>
struct tensor_view_iterator_read
{
T* view;
auto& operator()(std::size_t n) const
auto& operator()(int n) const
{
assert(view != nullptr);
return (*view)[n];
......@@ -36,9 +36,9 @@ template <class T>
struct tensor_view
{
using value_type = T;
using iterator = basic_iota_iterator<tensor_view_iterator_read<tensor_view<T>>, std::size_t>;
using iterator = basic_iota_iterator<tensor_view_iterator_read<tensor_view<T>>, int>;
using const_iterator =
basic_iota_iterator<tensor_view_iterator_read<const tensor_view<T>>, std::size_t>;
basic_iota_iterator<tensor_view_iterator_read<const tensor_view<T>>, int>;
tensor_view() : m_data(nullptr) {}
tensor_view(shape s, T* d) : m_data(d), m_shape(std::move(s)) {}
......@@ -46,7 +46,7 @@ struct tensor_view
bool empty() const { return m_data == nullptr || m_shape.lens().empty(); }
std::size_t size() const { return m_shape.elements(); }
int size() const { return m_shape.elements(); }
T* data() { return this->m_data; }
......@@ -55,17 +55,17 @@ struct tensor_view
template <class... Ts, MIGRAPHX_REQUIRES(std::is_integral<Ts>{}...)>
const T& operator()(Ts... xs) const
{
assert(std::vector<std::size_t>{static_cast<std::size_t>(xs)...} < m_shape.lens());
assert(m_shape.index({static_cast<std::size_t>(xs)...}) < m_shape.bytes() / sizeof(T));
return m_data[m_shape.index({static_cast<std::size_t>(xs)...})];
assert(std::vector<int>{static_cast<int>(xs)...} < m_shape.lens());
assert(m_shape.index({static_cast<int>(xs)...}) < m_shape.bytes() / sizeof(T));
return m_data[m_shape.index({static_cast<int>(xs)...})];
}
template <class... Ts, MIGRAPHX_REQUIRES(std::is_integral<Ts>{}...)>
T& operator()(Ts... xs)
{
assert(std::vector<std::size_t>{static_cast<std::size_t>(xs)...} < m_shape.lens());
assert(m_shape.index({static_cast<std::size_t>(xs)...}) < m_shape.bytes() / sizeof(T));
return m_data[m_shape.index({static_cast<std::size_t>(xs)...})];
assert(std::vector<int>{static_cast<int>(xs)...} < m_shape.lens());
assert(m_shape.index({static_cast<int>(xs)...}) < m_shape.bytes() / sizeof(T));
return m_data[m_shape.index({static_cast<int>(xs)...})];
}
template <class Iterator, MIGRAPHX_REQUIRES(not std::is_integral<Iterator>{})>
......@@ -84,13 +84,13 @@ struct tensor_view
return m_data[m_shape.index(start, last)];
}
T& operator[](std::size_t i)
T& operator[](int i)
{
assert(!this->empty() && i < this->size());
return m_data[m_shape.index(i)];
}
const T& operator[](std::size_t i) const
const T& operator[](int i) const
{
assert(!this->empty() && i < this->size());
return m_data[m_shape.index(i)];
......@@ -141,7 +141,7 @@ struct tensor_view
if(!x.empty())
{
os << as_number(x.front());
for(std::size_t i = 1; i < x.m_shape.elements(); i++)
for(int i = 1; i < x.m_shape.elements(); i++)
{
os << ", " << as_number(x.m_data[x.m_shape.index(i)]);
}
......@@ -159,7 +159,7 @@ bool operator==(const tensor_view<T>& x, const tensor_view<U>& y)
{
if(x.get_shape() == y.get_shape())
{
for(std::size_t i = 0; i < x.get_shape().elements(); i++)
for(int i = 0; i < x.get_shape().elements(); i++)
{
if(!float_equal(x[i], y[i]))
return false;
......
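And a small sketch of indexing through `tensor_view` with the int-based shape, using the `tensor_view(shape, T*)` constructor shown above; the include paths and sample data are illustrative assumptions:

```cpp
#include <migraphx/shape.hpp>
#include <migraphx/tensor_view.hpp>
#include <iostream>
#include <vector>

int main()
{
    std::vector<float> data = {0, 1, 2, 3, 4, 5};
    migraphx::shape s{migraphx::shape::float_type, std::vector<int>{2, 3}};
    migraphx::tensor_view<float> tv{s, data.data()};

    std::cout << tv(1, 2) << "\n";  // multi-index (1, 2) -> data[1*3 + 2] = 5
    std::cout << tv[3] << "\n";     // linear element index 3 -> 3
}
```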
......@@ -15,7 +15,7 @@ static void update_op(const instruction_ref& input, const instruction_ref& ins,
{
auto op = ins->get_operator();
auto val = op.to_value();
auto op_padding = val.at("padding").to_vector<size_t>();
auto op_padding = val.at("padding").to_vector<int>();
auto kdims = input->get_shape().lens().size() - 2;
if(std::equal(op_padding.begin(),
......@@ -25,9 +25,9 @@ static void update_op(const instruction_ref& input, const instruction_ref& ins,
return;
std::vector<int64_t> padding(input->get_shape().lens().size() * 2, 0);
std::vector<size_t> pads_l(op_padding.begin(), op_padding.begin() + kdims);
std::vector<size_t> pads_r(op_padding.begin() + kdims, op_padding.end());
op_padding = std::vector<size_t>(kdims * 2, 0);
std::vector<int> pads_l(op_padding.begin(), op_padding.begin() + kdims);
std::vector<int> pads_r(op_padding.begin() + kdims, op_padding.end());
op_padding = std::vector<int>(kdims * 2, 0);
op.from_value({{"padding", op_padding}});
std::copy(pads_l.begin(), pads_l.end(), padding.begin() + 2);
......@@ -56,9 +56,9 @@ static void update_pooling(const instruction_ref& input, const instruction_ref&
return;
std::vector<int64_t> padding(input->get_shape().lens().size() * 2, 0);
std::vector<size_t> pads_l(op.padding.begin(), op.padding.begin() + kdims);
std::vector<size_t> pads_r(op.padding.begin() + kdims, op.padding.end());
op.padding = std::vector<size_t>(kdims * 2, 0);
std::vector<int> pads_l(op.padding.begin(), op.padding.begin() + kdims);
std::vector<int> pads_r(op.padding.begin() + kdims, op.padding.end());
op.padding = std::vector<int>(kdims * 2, 0);
std::copy(pads_l.begin(), pads_l.end(), padding.begin() + 2);
std::copy(pads_r.begin(), pads_r.end(), padding.begin() + kdims + 2 + 2);
......
......@@ -17,7 +17,7 @@ inline namespace MIGRAPHX_INLINE_NS {
auto tune_attribute(const std::vector<int64_t>& vec,
const std::vector<int64_t>& axes,
const value& val,
const std::vector<std::size_t>& lens)
const std::vector<int>& lens)
{
std::vector<int64_t> result(vec);
int64_t n_rank = lens.size();
......@@ -127,7 +127,7 @@ auto tune_pad_attribute(const value& val)
return result;
}
bool normalize_attributes(operation& op, const std::vector<std::size_t>& lens)
bool normalize_attributes(operation& op, const std::vector<int>& lens)
{
bool tuned = false;
auto attrs = op.attributes();
......
......@@ -25,7 +25,7 @@ struct onnx_parser
struct node_info
{
attribute_map attributes{};
std::size_t num_outputs = 1;
int num_outputs = 1;
std::string name = "";
module* mod = nullptr;
instruction_ref make_contiguous(instruction_ref ins) const;
......@@ -60,8 +60,8 @@ struct onnx_parser
node_map nodes;
std::unordered_map<std::string, instruction_ref> instructions;
program prog = program();
std::size_t default_dim_value = 1;
std::unordered_map<std::string, std::vector<std::size_t>> map_input_dims;
int default_dim_value = 1;
std::unordered_map<std::string, std::vector<int>> map_input_dims;
bool skip_unknown_operators = false;
int64_t max_loop_iterations = 10;
int64_t opset_version = 13;
......@@ -76,11 +76,11 @@ struct onnx_parser
static int64_t get_opset_version(const onnx::ModelProto& model);
void parse_from(std::istream& is, std::string name = "");
void parse_from(const void* data, std::size_t size);
void parse_from(const void* data, int size);
void parse_graph(module* mod, const onnx::GraphProto& graph);
literal parse_value(const onnx::AttributeProto& attr) const;
literal parse_tensor(const onnx::TensorProto& t) const;
shape parse_type(const onnx::TypeProto& t, const std::vector<std::size_t>& input_dims) const;
shape parse_type(const onnx::TypeProto& t, const std::vector<int>& input_dims) const;
};
shape::type_t get_type(int dtype);
......
......@@ -12,9 +12,9 @@ bool is_asym_padding(const std::vector<int64_t>& padding);
void cal_auto_padding_size(onnx_parser::node_info info,
value& v,
const std::vector<std::size_t>& k_lens,
const std::vector<std::size_t>& dilation,
const std::vector<std::size_t>& in_lens,
const std::vector<int>& k_lens,
const std::vector<int>& dilation,
const std::vector<int>& in_lens,
std::vector<int64_t>& paddings);
void check_padding_mode(const onnx_parser::node_info& info, const std::string& op_name);
......
......@@ -54,7 +54,7 @@ program parse_onnx_buffer(const std::string& buffer, const onnx_options& options
return parse_onnx_from(options, buffer.data(), buffer.size());
}
program parse_onnx_buffer(const void* data, std::size_t size, const onnx_options& options)
program parse_onnx_buffer(const void* data, int size, const onnx_options& options)
{
return parse_onnx_from(options, data, size);
}
......
......@@ -28,11 +28,11 @@ static onnx_parser::attribute_map get_attributes(const onnx::NodeProto& node)
}
static literal
create_literal(shape::type_t shape_type, const std::vector<size_t>& dims, const char* data)
create_literal(shape::type_t shape_type, const std::vector<int>& dims, const char* data)
{
// empty input
auto elem_num =
std::accumulate(dims.begin(), dims.end(), std::size_t(1), std::multiplies<std::size_t>());
std::accumulate(dims.begin(), dims.end(), int(1), std::multiplies<int>());
if(elem_num == 0)
{
return {};
......@@ -45,11 +45,11 @@ create_literal(shape::type_t shape_type, const std::vector<size_t>& dims, const
}
template <class T, MIGRAPHX_REQUIRES(not std::is_pointer<T>{})>
static literal create_literal(shape::type_t shape_type, const std::vector<size_t>& dims, T data)
static literal create_literal(shape::type_t shape_type, const std::vector<int>& dims, T data)
{
// empty input
auto elem_num =
std::accumulate(dims.begin(), dims.end(), std::size_t(1), std::multiplies<std::size_t>());
std::accumulate(dims.begin(), dims.end(), int(1), std::multiplies<int>());
if(elem_num == 0)
{
return {};
......@@ -64,7 +64,7 @@ static literal create_literal(shape::type_t shape_type, const std::vector<size_t
template <class T>
static literal from_repeated(shape::type_t t, const T& r)
{
std::size_t size = r.size();
int size = r.size();
return literal{{t, {size}}, r.begin(), r.end()};
}
......@@ -187,7 +187,7 @@ void onnx_parser::parse_from(std::istream& is, std::string name)
}
}
void onnx_parser::parse_from(const void* data, std::size_t size)
void onnx_parser::parse_from(const void* data, int size)
{
auto* mm = prog.get_main_module();
onnx::ModelProto model;
......@@ -247,7 +247,7 @@ void onnx_parser::parse_graph(module* mod, const onnx::GraphProto& graph)
"\" existing in parent graph!");
}
std::vector<std::size_t> dims;
std::vector<int> dims;
if(map_input_dims.count(name) > 0)
{
dims = map_input_dims.at(name);
......@@ -278,7 +278,7 @@ void onnx_parser::parse_graph(module* mod, const onnx::GraphProto& graph)
}
std::vector<instruction_ref> result;
std::size_t output_num = static_cast<std::size_t>(node.output().size());
int output_num = static_cast<int>(node.output().size());
if(ops.count(node.op_type()) == 0)
{
if(skip_unknown_operators)
......@@ -293,7 +293,7 @@ void onnx_parser::parse_graph(module* mod, const onnx::GraphProto& graph)
*this, {get_attributes(node), output_num, node_name, mod}, args);
}
output_num = std::min<std::size_t>(output_num, result.size());
output_num = std::min<int>(output_num, result.size());
std::transform(node.output().begin(),
node.output().begin() + output_num,
result.begin(),
......@@ -351,7 +351,7 @@ literal onnx_parser::parse_value(const onnx::AttributeProto& attr) const
literal onnx_parser::parse_tensor(const onnx::TensorProto& t) const
{
std::vector<std::size_t> dims(t.dims().begin(), t.dims().end());
std::vector<int> dims(t.dims().begin(), t.dims().end());
if(not t.external_data().empty())
{
const std::string& data_file = t.external_data().at(0).value();
......@@ -401,7 +401,7 @@ literal onnx_parser::parse_tensor(const onnx::TensorProto& t) const
MIGRAPHX_THROW("PARSE_TENSOR: Invalid tensor type");
}
shape onnx_parser::parse_type(const onnx::TypeProto& t,
const std::vector<std::size_t>& input_dims) const
const std::vector<int>& input_dims) const
{
shape::type_t shape_type = get_type(t.tensor_type().elem_type());
if(!input_dims.empty())
......@@ -409,12 +409,12 @@ shape onnx_parser::parse_type(const onnx::TypeProto& t,
return {shape_type, input_dims};
}
std::vector<std::size_t> dims;
std::vector<int> dims;
auto&& tensor_dims = t.tensor_type().shape().dim();
std::transform(tensor_dims.begin(),
tensor_dims.end(),
std::back_inserter(dims),
[&](auto&& d) -> std::size_t {
[&](auto&& d) -> int {
if(d.has_dim_value())
{
if(static_cast<int>(d.dim_value()) <= 0)
......
......@@ -10,12 +10,12 @@ namespace onnx {
void cal_auto_padding_size(onnx_parser::node_info info,
value& v,
const std::vector<std::size_t>& k_lens,
const std::vector<std::size_t>& dilation,
const std::vector<std::size_t>& in_lens,
const std::vector<int>& k_lens,
const std::vector<int>& dilation,
const std::vector<int>& in_lens,
std::vector<int64_t>& paddings)
{
size_t kdims = in_lens.size() - 2;
int kdims = in_lens.size() - 2;
assert(k_lens.size() == kdims and dilation.size() == kdims);
if(!contains(info.attributes, "auto_pad"))
......@@ -29,7 +29,7 @@ void cal_auto_padding_size(onnx_parser::node_info info,
bool is_same_upper = (auto_pad.find("SAME_UPPER") != std::string::npos);
paddings.resize(2 * kdims);
for(size_t i = 0; i < paddings.size() / 2; i++)
for(int i = 0; i < paddings.size() / 2; i++)
{
calculate_padding(i,
paddings,
......@@ -45,9 +45,9 @@ void cal_auto_padding_size(onnx_parser::node_info info,
bool is_asym_padding(const std::vector<int64_t>& padding)
{
assert(padding.size() % 2 == 0);
size_t pad_ndims = padding.size() / 2;
int pad_ndims = padding.size() / 2;
for(size_t i = 0; i < pad_ndims; i++)
for(int i = 0; i < pad_ndims; i++)
{
if(padding[i] != padding[i + pad_ndims])
{
......@@ -106,9 +106,9 @@ void tune_padding_size(const value& v,
}
// asymmetric padding, make it symmetric
std::size_t n_dims = padding.size() / 2;
int n_dims = padding.size() / 2;
s_start.resize(n_dims);
for(std::size_t i = 0; i < n_dims; ++i)
for(int i = 0; i < n_dims; ++i)
{
tune_padding_to_symmetric(
padding[i], padding[i + n_dims], v.at("stride")[i].to<int64_t>(), s_start[i]);
......@@ -122,7 +122,7 @@ void check_asym_padding(const onnx_parser::node_info& info,
int count_include_pad,
float pad_val)
{
size_t pad_ndims = padding.size() / 2;
int pad_ndims = padding.size() / 2;
auto left_pad_it = padding.begin();
auto right_pad_it = left_pad_it + pad_ndims;
......@@ -134,18 +134,18 @@ void check_asym_padding(const onnx_parser::node_info& info,
// add right pads
asym_pads.insert(asym_pads.begin() + pad_ndims + 4, right_pad_it, padding.end());
ins = info.add_instruction(make_op("pad", {{"pads", asym_pads}, {"value", pad_val}}), ins);
std::vector<size_t> new_padding(padding.size());
std::vector<int> new_padding(padding.size());
// subtract asym padding originally found from parsing the operator
std::transform(padding.begin(),
left_pad_it,
asym_pads.begin() + 2,
new_padding.begin(),
std::minus<size_t>());
std::minus<int>());
std::transform(right_pad_it,
padding.end(),
asym_pads.begin() + pad_ndims + 4,
new_padding.begin() + pad_ndims,
std::minus<size_t>());
std::minus<int>());
v["padding"] = new_padding;
}
}
......
......@@ -60,11 +60,11 @@ struct parse_convolution : op_parser<parse_convolution>
if(contains(info.attributes, "auto_pad"))
{
auto weight_lens = weights->get_shape().lens();
std::vector<std::size_t> k_lens(weight_lens.begin() + 2, weight_lens.end());
std::vector<int> k_lens(weight_lens.begin() + 2, weight_lens.end());
cal_auto_padding_size(info,
values,
k_lens,
values["dilation"].to_vector<std::size_t>(),
values["dilation"].to_vector<int>(),
in_lens,
padding);
auto auto_pad = info.attributes["auto_pad"].s();
......@@ -73,7 +73,7 @@ struct parse_convolution : op_parser<parse_convolution>
values["padding_mode"] = to_value(op::padding_mode_t::same);
}
}
values["padding"] = std::vector<size_t>(padding.begin(), padding.end());
values["padding"] = std::vector<int>(padding.begin(), padding.end());
if(contains(info.attributes, "group"))
{
......
......@@ -21,7 +21,7 @@ struct parse_expand : op_parser<parse_expand>
auto in_lens = args[0]->get_shape().lens();
migraphx::argument arg_s = args[1]->eval();
check_arg_empty(arg_s, "Expand: dynamic shape is not supported");
std::vector<std::size_t> dims;
std::vector<int> dims;
arg_s.visit([&](auto input) { dims.assign(input.begin(), input.end()); });
auto out_lens = compute_broadcasted_lens(in_lens, dims);
return info.add_instruction(make_op("multibroadcast", {{"out_lens", out_lens}}), args[0]);
......