#include #include #include #include #include #include #include #include #include #include #include namespace migraphx { inline namespace MIGRAPHX_INLINE_NS { template std::vector find_lasts(const module& m, Predicate pred) { std::vector result; fix([&](auto self, auto ins) { if(pred(ins)) { result.push_back(ins); return; } for(auto input : ins->inputs()) self(input); })(std::prev(m.end())); return result; } std::unordered_set preserve_output_layout(module& m) { std::unordered_set result; std::vector outputs = find_lasts(m, [](auto ins) { return ins->name() == "convolution" and ins->get_shape().lens().size() == 4; }); for(auto output : outputs) { auto permutation = find_permutation(output->get_shape()); auto layout = m.insert_instruction( std::next(output), make_op("layout", {{"permutation", permutation}}), output); result.insert(m.replace_instruction(output, layout)); } return result; } void transform_convolutions(module& m) { for(auto ins : iterator_for(m)) { if(ins->name() != "convolution") continue; if(ins->get_shape().lens().size() != 4) continue; auto v = ins->get_operator().to_value(); if(v.at("group").to() > 1) continue; auto args = ins->inputs(); std::transform(args.begin(), args.end(), args.begin(), [&](const auto& i) { return m.insert_instruction(ins, make_op("layout", {{"permutation", {0, 2, 3, 1}}}), i); }); auto conv = m.insert_instruction(ins, ins->get_operator(), args); auto c = m.insert_instruction(ins, make_op("contiguous"), conv); m.replace_instruction(ins, c); } } void remove_layout(module& m, const std::unordered_set& output_layouts) { for(auto ins : iterator_for(m)) { if(ins->name() != "layout") continue; if(ins->get_shape() != ins->inputs().front()->get_shape()) continue; if(contains(output_layouts, ins)) continue; m.replace_instruction(ins, ins->inputs().front()); } } void layout_nhwc::apply(module_pass_manager& mpm) const { std::unordered_set output_layouts = preserve_output_layout(mpm.get_module()); transform_convolutions(mpm.get_module()); mpm.run_pass(dead_code_elimination{}); mpm.run_pass(eliminate_contiguous{"contiguous"}); mpm.run_pass(dead_code_elimination{}); remove_layout(mpm.get_module(), output_layouts); mpm.run_pass(dead_code_elimination{}); } } // namespace MIGRAPHX_INLINE_NS } // namespace migraphx