Enable conv+add fusion, same as conv+sum (#15268)
author: Gu, Jinghui <jinghui.gu@intel.com>
Mon, 7 Jan 2019 22:10:27 +0000 (14:10 -0800)
committer: Facebook Github Bot <facebook-github-bot@users.noreply.github.com>
Mon, 7 Jan 2019 22:42:45 +0000 (14:42 -0800)
Summary:
Enable conv+add fusion, same as conv+sum

Caution: IDEEP supports only element-wise Add, with no scalar
broadcasting. Fusing an Add that broadcasts would therefore be illegal.
Pull Request resolved: https://github.com/pytorch/pytorch/pull/15268

Differential Revision: D13577375

Pulled By: yinghai

fbshipit-source-id: 92c9c4b667c5ca5f7a262a5bffaa8aa68eeff3bd

caffe2/opt/optimize_ideep.cc
caffe2/python/ideep/convfusion_op_test.py

index 14360f8..e4a9feb 100644 (file)
@@ -53,6 +53,15 @@ caffe2::OperatorDef* getMutableOpDef(repr::NeuralNetOperator& nnOp) {
   return dyn_cast<Caffe2Annotation>(annotation)->getMutableOperatorDef();
 }
 
+bool isOpType(const repr::NNGraph::NodeRef& nodeRef, string typeName) {
+  if (!repr::nn::is<repr::NeuralNetOperator>(nodeRef)) {
+    return false;
+  }
+  auto op = repr::nn::get<repr::NeuralNetOperator>(nodeRef);
+  auto opDef = getOpDef(*op);
+  return opDef.type() == typeName;
+}
+
 bool isOnIdeepDevice(const repr::NeuralNetOperator& nnOp) {
   // We only want to fuse for IDEEP convs
   const auto& op = getOpDef(nnOp);
@@ -245,11 +254,13 @@ void fuseConvSumForIdeep(repr::NNModule* nn, caffe2::Workspace* ws) {
       continue;
     }
 
-    if (!repr::nn::is<repr::Sum>(sumNode)) {
+    // CAUTION: On IDEEP device, only element-wise Add operator is
+    // supported yet. It totally works as element-wise sum without scalar broadcast.
+    if (!repr::nn::is<repr::Sum>(sumNode) && !isOpType(sumNode, "Add")) {
       continue;
     }
 
-    auto sum = repr::nn::get<repr::Sum>(sumNode);
+    auto sum = repr::nn::get<repr::NeuralNetOperator>(sumNode);
     if (!isOnIdeepDevice(*sum)) {
       LOG(WARNING) << "Not a IDEEP operator";
       continue;
index 6445655..de66a4d 100644 (file)
@@ -125,10 +125,11 @@ class ConvFusionTest(hu.HypothesisTestCase):
            batch_size=st.integers(1, 3),
            use_bias=st.booleans(),
            group=st.integers(1, 1),
+           sum_add=st.sampled_from(["Sum", "Add"]),
            **mu.gcs)
     def test_convolution_sum_fusion(self, stride, pad, kernel, size,
                              input_channels, output_channels,
-                             batch_size, use_bias, group, gc, dc):
+                             batch_size, use_bias, group, sum_add, gc, dc):
         conv_S0 = core.CreateOperator(
             "Conv",
             ["SX0", "Sw0", "Sb0"] if use_bias else ["SX0", "Sw0"],
@@ -150,7 +151,7 @@ class ConvFusionTest(hu.HypothesisTestCase):
             device_option=dc[0]
         )
         sum = core.CreateOperator(
-            "Sum",
+            sum_add,
             ["S0", "Y0"],
             ["S0"],
             device_option=dc[0]
@@ -264,10 +265,11 @@ class ConvFusionTest(hu.HypothesisTestCase):
            batch_size=st.integers(1, 3),
            use_bias=st.booleans(),
            group=st.integers(1, 1),
+           sum_add=st.sampled_from(["Sum", "Add"]),
            **mu.gcs)
     def test_convolution_sum_relu_fusion(self, stride, pad, kernel, size,
                              input_channels, output_channels,
-                             batch_size, use_bias, group, gc, dc):
+                             batch_size, use_bias, group, sum_add, gc, dc):
         conv_S0 = core.CreateOperator(
             "Conv",
             ["SX0", "Sw0", "Sb0"] if use_bias else ["SX0", "Sw0"],
@@ -289,7 +291,7 @@ class ConvFusionTest(hu.HypothesisTestCase):
             device_option=dc[0]
         )
         sum = core.CreateOperator(
-            "Sum",
+            sum_add,
             ["S0", "Y0"],
             ["S0"],
             device_option=dc[0]