Commit aa0b6230 authored by Paul
Browse files

Enable bn rewrite and check for literals

parent 5ff89419
......@@ -10,54 +10,57 @@ void fwd_conv_batchnorm_rewrite::apply(program& p) const
{
for(auto ins : iterator_for(p))
{
if(ins->op.name() == "batch_norm_inference")
{
auto ins_prev = ins->arguments[0];
if(ins_prev->op.name() == "convolution")
{
// Get scale, bias, mean, variance from instruction_ref
auto gamma = ins->arguments[1]->lit;
auto bias = ins->arguments[2]->lit;
auto mean = ins->arguments[3]->lit;
auto variance = ins->arguments[4]->lit;
// Get epsilon
auto bn_op = any_cast<batch_norm_inference>(ins->op);
auto epsilon = bn_op.epsilon;
// Get convolution weights
auto weights = ins_prev->arguments[1]->lit;
// Get convolution op
auto conv_op = ins_prev->op;
auto out_channels = weights.get_shape().lens()[0];
auto in_channels = weights.get_shape().lens()[1];
auto height = weights.get_shape().lens()[2];
auto width = weights.get_shape().lens()[3];
argument new_weights{weights.get_shape()};
argument new_bias{bias.get_shape()};
visit_all(weights, gamma, bias, mean, variance, new_weights, new_bias)(
[&](auto weights2,
auto gamma2,
auto bias2,
auto mean2,
auto variance2,
auto new_weights2,
auto new_bias2) {
dfor(out_channels, in_channels, height, width)(
[&](std::size_t k, std::size_t c, std::size_t h, std::size_t w) {
new_weights2(k, c, h, w) = gamma2(k) /
std::sqrt(variance2(k) + epsilon) *
weights2(k, c, h, w);
new_bias2(k, c, h, w) =
bias2(k) - (mean2(k) / std::sqrt(variance2(k) + epsilon));
});
if(ins->op.name() != "batch_norm_inference")
continue;
if(not std::all_of(ins->arguments.begin()+1, ins->arguments.end(), [](auto arg) { return arg->op.name() == "@literal"; }))
continue;
auto conv_ins = ins->arguments[0];
if(conv_ins->op.name() != "convolution")
continue;
if(conv_ins->arguments[1]->op.name() != "@literal")
continue;
// Get scale, bias, mean, variance from instruction_ref
const auto& gamma = ins->arguments[1]->get_literal();
const auto& bias = ins->arguments[2]->get_literal();
const auto& mean = ins->arguments[3]->get_literal();
const auto& variance = ins->arguments[4]->get_literal();
// Get epsilon
auto bn_op = any_cast<batch_norm_inference>(ins->op);
auto epsilon = bn_op.epsilon;
// Get convolution weights
const auto& weights = conv_ins->arguments[1]->get_literal();
// Get convolution op
auto conv_op = conv_ins->op;
auto out_channels = weights.get_shape().lens()[0];
auto in_channels = weights.get_shape().lens()[1];
auto height = weights.get_shape().lens()[2];
auto width = weights.get_shape().lens()[3];
argument new_weights{weights.get_shape()};
argument new_bias{bias.get_shape()};
visit_all(weights, gamma, bias, mean, variance, new_weights, new_bias)(
[&](auto weights2,
auto gamma2,
auto bias2,
auto mean2,
auto variance2,
auto new_weights2,
auto new_bias2) {
dfor(out_channels, in_channels, height, width)(
[&](std::size_t k, std::size_t c, std::size_t h, std::size_t w) {
new_weights2(k, c, h, w) = gamma2(k) /
std::sqrt(variance2(k) + epsilon) *
weights2(k, c, h, w);
new_bias2(k, c, h, w) =
bias2(k) - (mean2(k) / std::sqrt(variance2(k) + epsilon));
});
// Replace convolution instruction with updated weights
auto l_weights = p.add_literal({weights.get_shape(), new_weights.data()});
auto l_bias = p.add_literal({bias.get_shape(), new_bias.data()});
auto c =
p.replace_instruction(ins_prev, conv_op, {ins_prev->arguments[0], l_weights});
p.replace_instruction(ins, add{}, {c, l_bias});
}
}
});
// Replace convolution instruction with updated weights
auto l_weights = p.add_literal({weights.get_shape(), new_weights.data()});
auto l_bias = p.add_literal({bias.get_shape(), new_bias.data()});
auto c =
p.replace_instruction(conv_ins, conv_op, {conv_ins->arguments[0], l_weights});
p.replace_instruction(ins, add{}, {c, l_bias});
}
}
} // namespace migraph
......@@ -115,6 +115,11 @@ struct instruction
}
// Shape of the value this instruction produces.
shape get_shape() const { return result; }
// Access the literal payload of a "@literal" instruction.
// Calling this on any other instruction kind is a programming error,
// enforced via assert in debug builds.
const literal& get_literal() const
{
    assert(this->op.name() == "@literal");
    return this->lit;
}
// Symmetric equality overload: forwards to the (instruction, instruction_ref)
// comparison so a ref may appear on either side of ==.
friend bool operator==(instruction_ref ref, const instruction& i) { return i == ref; }
......
......@@ -10,6 +10,7 @@
#include <migraph/dead_code_elimination.hpp>
#include <migraph/simplify_reshapes.hpp>
#include <migraph/eliminate_contiguous.hpp>
#include <migraph/fwd_conv_batchnorm_rewrite.hpp>
namespace migraph {
namespace gpu {
......@@ -24,6 +25,8 @@ std::vector<pass> target::get_passes(migraph::context& gctx) const
auto_contiguous{},
simplify_reshapes{},
dead_code_elimination{},
fwd_conv_batchnorm_rewrite{},
dead_code_elimination{},
lowering{ctx},
fuse_ops{},
dead_code_elimination{},
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment