From 5ef2e827030f7c9434416a1c7afccebcc28503c5 Mon Sep 17 00:00:00 2001
From: SungJin Choi/Motion Control Lab(SR)/Principal Engineer/Samsung Electronics
Date: Wed, 11 Jul 2018 10:34:32 +0900
Subject: [PATCH] Add explicit padding to conv (#1936)

* Add explicit padding to conv

This commit adds support for explicit padding to the Conv2D operation.

Signed-off-by: SungJin Choi

* Revise namespace as Explicit

This commit renames the namespace to Explicit for consistency.

Signed-off-by: SungJin Choi
---
 runtimes/pure_arm_compute/src/compilation.cc        | 152 +++++++++++++++++++++
 .../pure_arm_compute/src/internal/op/Conv2D.cc      |  44 ++++++
 runtimes/pure_arm_compute/src/internal/op/Conv2D.h  |  48 +++++++
 .../pure_arm_compute/src/internal/op/NodeVisitor.h  |   1 +
 runtimes/pure_arm_compute/src/model.cc              |  14 +-
 5 files changed, 255 insertions(+), 4 deletions(-)
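Note: with this change, ANEURALNETWORKS_CONV_2D accepts the ten-input
explicit-padding form from the NN API specification in addition to the
seven-input implicit form. For reference, a minimal sketch of how a caller
emits the explicit form (operand indices such as ifm, ker, and pad_left are
hypothetical; ANeuralNetworksModel_addOperation is the real entry point):

  // Ten inputs: IFM, kernel, bias, the four explicit padding scalars,
  // the two strides, and the fused activation code.
  uint32_t inputs[10] = {ifm, ker, bias,
                         pad_left, pad_right, pad_top, pad_bottom,
                         stride_w, stride_h,
                         act};
  uint32_t outputs[1] = {ofm};
  ANeuralNetworksModel_addOperation(model, ANEURALNETWORKS_CONV_2D,
                                    10, inputs, 1, outputs);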
diff --git a/runtimes/pure_arm_compute/src/compilation.cc b/runtimes/pure_arm_compute/src/compilation.cc
index 73d3dfc..631747c 100644
--- a/runtimes/pure_arm_compute/src/compilation.cc
+++ b/runtimes/pure_arm_compute/src/compilation.cc
@@ -327,6 +327,7 @@ public:
   void visit(const ::internal::tflite::op::Mul::Node &node) override;
   void visit(const ::internal::tflite::op::Div::Node &node) override;
   void visit(const ::internal::tflite::op::Conv2D::implicit::Node &node) override;
+  void visit(const ::internal::tflite::op::Conv2D::Explicit::Node &node) override;
   void visit(const ::internal::tflite::op::DepthwiseConv2D::implicit::Node &node) override;
   void visit(const ::internal::tflite::op::Dequantize::Node &node) override;
   void visit(const ::internal::tflite::op::MaxPool2D::implicit::Node &node) override;
@@ -817,6 +818,157 @@ void Planner::visit(const ::internal::tflite::op::Conv2D::implicit::Node &node)
   _builder.addStage(stage);
 }
 
+void Planner::visit(const ::internal::tflite::op::Conv2D::Explicit::Node &node)
+{
+  const ::internal::tflite::operand::Index ofm_index{node.param().ofm_index};
+
+  const ::internal::tflite::operand::Index ifm_index{node.param().ifm_index};
+  const ::internal::tflite::operand::Index ker_index{node.param().ker_index};
+  const ::internal::tflite::operand::Index bias_index{node.param().bias_index};
+
+  const ::internal::tflite::operand::Index vstride_index{node.param().vstride_index};
+  const ::internal::tflite::operand::Index hstride_index{node.param().hstride_index};
+
+  const ::internal::tflite::operand::Index padding_left_index{node.param().padding_left_index};
+  const ::internal::tflite::operand::Index padding_right_index{node.param().padding_right_index};
+  const ::internal::tflite::operand::Index padding_top_index{node.param().padding_top_index};
+  const ::internal::tflite::operand::Index padding_bottom_index{node.param().padding_bottom_index};
+
+  const ::internal::tflite::operand::Index activation_index{node.param().activation_index};
+
+  const auto ofm_shape = _ctx.at(ofm_index).shape().asFeature();
+  const auto ifm_shape = _ctx.at(ifm_index).shape().asFeature();
+  const auto ker_shape = _ctx.at(ker_index).shape().asKernel();
+  const auto bias_size = _ctx.at(bias_index).shape().asVector();
+
+  const int32_t padding_left = _ctx.at(padding_left_index).asScalar<int32_t>();
+  const int32_t padding_right = _ctx.at(padding_right_index).asScalar<int32_t>();
+  const int32_t padding_top = _ctx.at(padding_top_index).asScalar<int32_t>();
+  const int32_t padding_bottom = _ctx.at(padding_bottom_index).asScalar<int32_t>();
+
+  Stride stride;
+
+  stride.vertical = _ctx.at(vstride_index).asScalar<int32_t>();
+  stride.horizontal = _ctx.at(hstride_index).asScalar<int32_t>();
+
+  // TODO Should move to the place where the operand is handled, if it is possible.
+  // Set Shape Constraints and TensorInfo
+  _builder.addShapeConstr(ofm_index,
+                          asTensorInfo(ofm_shape, _ctx.at(ofm_index).type(),
+                                       _ctx.at(ofm_index).scale(), _ctx.at(ofm_index).zeroPoint()));
+  _builder.addShapeConstr(ifm_index,
+                          asTensorInfo(ifm_shape, _ctx.at(ifm_index).type(),
+                                       _ctx.at(ifm_index).scale(), _ctx.at(ifm_index).zeroPoint()));
+  _builder.addShapeConstr(ker_index,
+                          asTensorInfo(ker_shape, _ctx.at(ker_index).type(),
+                                       _ctx.at(ker_index).scale(), _ctx.at(ker_index).zeroPoint()));
+  _builder.addShapeConstr(bias_index, asTensorInfo(bias_size, _ctx.at(bias_index).type(),
+                                                   _ctx.at(bias_index).scale(),
+                                                   _ctx.at(bias_index).zeroPoint()));
+
+  // Set initializer for kernel
+  {
+    auto ker_base = _ctx.at(ker_index).data().base();
+    auto ker_size = _ctx.at(ker_index).data().size();
+    auto ker_type = _ctx.at(ker_index).type();
+
+    switch (ker_type)
+    {
+      case ANEURALNETWORKS_TENSOR_FLOAT32:
+      {
+        auto initializer = std::bind(initKernelTensor<float>, _1, ker_shape, ker_base, ker_size);
+        _builder.addInitializer(ker_index, initializer);
+        break;
+      }
+      case ANEURALNETWORKS_TENSOR_QUANT8_ASYMM:
+      {
+        auto initializer = std::bind(initKernelTensor<uint8_t>, _1, ker_shape, ker_base, ker_size);
+        _builder.addInitializer(ker_index, initializer);
+        break;
+      }
+      default:
+      {
+        throw std::runtime_error("Not supported");
+      }
+    }
+  }
+
+  // Set initializer for bias
+  {
+    auto bias_base = _ctx.at(bias_index).data().base();
+    auto bias_type = _ctx.at(bias_index).type();
+
+    switch (bias_type)
+    {
+      case ANEURALNETWORKS_TENSOR_FLOAT32:
+      {
+        auto initializer = std::bind(initVectorTensor<float>, _1, bias_base, bias_size);
+        _builder.addInitializer(bias_index, initializer);
+        break;
+      }
+      case ANEURALNETWORKS_TENSOR_INT32:
+      {
+        auto initializer = std::bind(initVectorTensor<int32_t>, _1, bias_base, bias_size);
+        _builder.addInitializer(bias_index, initializer);
+        break;
+      }
+      default:
+      {
+        throw std::runtime_error("Not supported");
+      }
+    }
+  }
+
+  // Construct operation parameters
+  struct Param
+  {
+    int ofm_index;
+    int ifm_index;
+    int ker_index;
+    int bias_index;
+
+    Padding padding;
+    Stride stride;
+
+    FuseCode activation;
+  };
+
+  Param param;
+
+  param.ofm_index = ofm_index.asInt();
+  param.ifm_index = ifm_index.asInt();
+  param.ker_index = ker_index.asInt();
+  param.bias_index = bias_index.asInt();
+
+  param.stride = stride;
+
+  param.padding.left = padding_left;
+  param.padding.right = padding_right;
+  param.padding.top = padding_top;
+  param.padding.bottom = padding_bottom;
+
+  param.activation = static_cast<FuseCode>(_ctx.at(activation_index).asScalar<int32_t>());
+
+  auto stage = [param](const IAllocationContext &ctx, IExecutionBuilder &builder) {
+    auto ofm_alloc = ctx.at(::internal::tflite::operand::Index{param.ofm_index});
+    auto ifm_alloc = ctx.at(::internal::tflite::operand::Index{param.ifm_index});
+    auto ker_alloc = ctx.at(::internal::tflite::operand::Index{param.ker_index});
+    auto bias_alloc = ctx.at(::internal::tflite::operand::Index{param.bias_index});
+
+    const auto conv_info = asPadStrideInfo(param.padding, param.stride);
+
+    std::unique_ptr<::arm_compute::CLConvolutionLayer> fn{new ::arm_compute::CLConvolutionLayer};
+
+    fn->configure(ifm_alloc, ker_alloc, bias_alloc, ofm_alloc, conv_info);
+
+    builder.append("Conv2D", std::move(fn));
+
+    ActivationBuilder{builder}.append(param.activation, ofm_alloc);
+  };
+
+  _builder.addStage(stage);
+}
+
 void Planner::visit(const ::internal::tflite::op::DepthwiseConv2D::implicit::Node &node)
 {
   const ::internal::tflite::operand::Index ofm_index{node.param().ofm_index};
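The stage above folds the four padding scalars and the two strides into a
single arm_compute descriptor via asPadStrideInfo. That helper is outside
this diff; a minimal sketch of what it is assumed to look like, given the
Padding and Stride structs used in the Param above:

  // Assumed shape of the conversion helper (not part of this patch):
  // arm_compute packs strides and per-side paddings into one PadStrideInfo.
  ::arm_compute::PadStrideInfo asPadStrideInfo(const Padding &padding, const Stride &stride)
  {
    return ::arm_compute::PadStrideInfo{stride.horizontal, stride.vertical,
                                        padding.left, padding.right,
                                        padding.top, padding.bottom,
                                        ::arm_compute::DimensionRoundingType::FLOOR};
  }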
diff --git a/runtimes/pure_arm_compute/src/internal/op/Conv2D.cc b/runtimes/pure_arm_compute/src/internal/op/Conv2D.cc
index b0add3c..27b6822 100644
--- a/runtimes/pure_arm_compute/src/internal/op/Conv2D.cc
+++ b/runtimes/pure_arm_compute/src/internal/op/Conv2D.cc
@@ -11,6 +11,13 @@ namespace op
 {
 namespace Conv2D
 {
+namespace Explicit
+{
+
+void Node::accept(NodeVisitor &&v) const { v.visit(*this); }
+
+} // namespace Explicit
+
 namespace implicit
 {
 
@@ -30,6 +37,43 @@ namespace op
 {
 namespace Conv2D
 {
+namespace Explicit
+{
+
+Param::Param(uint32_t inputCount, const uint32_t *inputs, uint32_t outputCount,
+             const uint32_t *outputs)
+{
+  assert(inputCount == 10 && outputCount == 1);
+
+  ofm_index = outputs[0];
+
+  // Each input should be interpreted as follows:
+  //
+  // 0 -> IFM Tensor Index
+  // 1 -> Kernel Tensor Index
+  // 2 -> Bias Tensor Index
+  // 3 -> Padding_left Index
+  // 4 -> Padding_right Index
+  // 5 -> Padding_top Index
+  // 6 -> Padding_bottom Index
+  // 7 -> Stride (width) Index
+  // 8 -> Stride (height) Index
+  // 9 -> Activation Index
+  ifm_index = inputs[0];
+  ker_index = inputs[1];
+  bias_index = inputs[2];
+  padding_left_index = inputs[3];
+  padding_right_index = inputs[4];
+  padding_top_index = inputs[5];
+  padding_bottom_index = inputs[6];
+  hstride_index = inputs[7];
+  vstride_index = inputs[8];
+  activation_index = inputs[9];
+}
+
+} // namespace Explicit
+
 namespace implicit
 {
diff --git a/runtimes/pure_arm_compute/src/internal/op/Conv2D.h b/runtimes/pure_arm_compute/src/internal/op/Conv2D.h
index 5764472..07cfa9c 100644
--- a/runtimes/pure_arm_compute/src/internal/op/Conv2D.h
+++ b/runtimes/pure_arm_compute/src/internal/op/Conv2D.h
@@ -13,6 +13,54 @@ namespace op
 {
 namespace Conv2D
 {
+namespace Explicit
+{
+
+struct Param
+{
+  int32_t ofm_index;
+
+  int32_t ifm_index;
+  int32_t ker_index;
+  int32_t bias_index;
+
+  int32_t hstride_index;
+  int32_t vstride_index;
+
+  int32_t padding_left_index;
+  int32_t padding_right_index;
+  int32_t padding_top_index;
+  int32_t padding_bottom_index;
+
+  int32_t activation_index;
+
+  Param() = default;
+  Param(uint32_t inputCount, const uint32_t *inputs, uint32_t outputCount, const uint32_t *outputs);
+};
+
+class Node final : public op::Node
+{
+public:
+  Node(const Param &param) : _param(param)
+  {
+    // DO NOTHING
+  }
+
+public:
+  virtual ~Node() = default;
+
+public:
+  const Param &param(void) const { return _param; }
+
+public:
+  void accept(NodeVisitor &&) const override;
+
+private:
+  const Param _param;
+};
+
+} // namespace Explicit
+
 namespace implicit
 {
diff --git a/runtimes/pure_arm_compute/src/internal/op/NodeVisitor.h b/runtimes/pure_arm_compute/src/internal/op/NodeVisitor.h
index 38a4750..f9a4660 100644
--- a/runtimes/pure_arm_compute/src/internal/op/NodeVisitor.h
+++ b/runtimes/pure_arm_compute/src/internal/op/NodeVisitor.h
@@ -41,6 +41,7 @@ struct NodeVisitor
   virtual void visit(const Mul::Node &) = 0;
   virtual void visit(const Div::Node &) = 0;
   virtual void visit(const Conv2D::implicit::Node &) = 0;
+  virtual void visit(const Conv2D::Explicit::Node &) = 0;
   virtual void visit(const DepthwiseConv2D::implicit::Node &) = 0;
   virtual void visit(const Dequantize::Node &) = 0;
   virtual void visit(const MaxPool2D::implicit::Node &) = 0;
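The pure virtual added to NodeVisitor is what routes the new node back into
Planner::visit through double dispatch; the model.cc hunk below then
constructs the node whenever an explicitly padded convolution is added. A
toy, self-contained illustration of the mechanism (all names hypothetical,
not the runtime's own classes):

  #include <iostream>

  struct ImplicitConvNode;
  struct ExplicitConvNode;

  struct Visitor
  {
    virtual ~Visitor() = default;
    virtual void visit(const ImplicitConvNode &) = 0;
    virtual void visit(const ExplicitConvNode &) = 0;
  };

  struct Node
  {
    virtual ~Node() = default;
    // Each concrete node calls back with its own static type, so the
    // planner never inspects a type tag.
    virtual void accept(Visitor &&) const = 0;
  };

  struct ImplicitConvNode : Node
  {
    void accept(Visitor &&v) const override { v.visit(*this); }
  };

  struct ExplicitConvNode : Node
  {
    void accept(Visitor &&v) const override { v.visit(*this); }
  };

  struct PrintPlanner : Visitor
  {
    void visit(const ImplicitConvNode &) override { std::cout << "implicit conv\n"; }
    void visit(const ExplicitConvNode &) override { std::cout << "explicit conv\n"; }
  };

  int main()
  {
    ExplicitConvNode node;
    node.accept(PrintPlanner{}); // prints "explicit conv"
  }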
diff --git a/runtimes/pure_arm_compute/src/model.cc b/runtimes/pure_arm_compute/src/model.cc
index 8d4052c..d12bd1e 100644
--- a/runtimes/pure_arm_compute/src/model.cc
+++ b/runtimes/pure_arm_compute/src/model.cc
@@ -137,10 +137,10 @@ int ANeuralNetworksModel_addOperation(ANeuralNetworksModel *model,
     }
     case ANEURALNETWORKS_CONV_2D:
     {
-      // inputCount is either 7 or 9 acccording to NN API specification.
+      // inputCount is either 7 or 10 according to NN API specification.
       // - Padding is implicit when inputCount is 7
-      // - Padding is explicit when inputCount is 9
-      assert(inputCount == 7 || inputCount == 9);
+      // - Padding is explicit when inputCount is 10
+      assert(inputCount == 7 || inputCount == 10);
       assert(outputCount == 1);
 
       if (inputCount == 7)
@@ -155,7 +155,13 @@ int ANeuralNetworksModel_addOperation(ANeuralNetworksModel *model,
       }
       else
       {
-        throw std::runtime_error{"Explicit padding in Conv2D is not supported, yet"};
+        using internal::tflite::op::Conv2D::Explicit::Param;
+        using internal::tflite::op::Conv2D::Explicit::Node;
+
+        // Add 'operations'
+        auto &operations = model->deref().operations();
+
+        operations.emplace_back<Node>(Param{inputCount, inputs, outputCount, outputs});
       }
 
       break;
-- 
2.7.4