[neurun] Eliminate OperandIndex in Reduce*::Param (#9008)
author Sergei Barannikov/AI Tools Lab /SRR/Engineer/Samsung Electronics <s.barannikov@samsung.com>
Mon, 25 Nov 2019 08:26:09 +0000 (11:26 +0300)
committer Hanjoung Lee/On-Device Lab(SR)/Engineer/Samsung Electronics <hanjoung.lee@samsung.com>
Mon, 25 Nov 2019 08:26:09 +0000 (17:26 +0900)
Replace `Param::axis_index` of type `OperandIndex` with `Param::axes` of type `std::vector<int>`. The reduction axes are now decoded from the constant `axes` operand at load time, so the kernel generators and `OperationValidator` read `node.param().axes` directly instead of resolving the operand through `_ctx`.

Signed-off-by: Sergei Barannikov <s.barannikov@samsung.com>
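
Below is a minimal, self-contained C++ sketch of the resulting pattern. `ReduceSumParam` and `ConstOperand` are hypothetical stand-ins for the real neurun types (`model::operation::ReduceSum::Param` and the constant operand held by the graph's operand set); the sketch only illustrates how a frontend loader folds the constant `axes` operand into the parameter struct and how a kernel generator then consumes `param().axes` directly.

```cpp
// Hedged sketch, not the real neurun API: the types below are simplified
// stand-ins that mirror the shape of the change in this commit.
#include <cstdint>
#include <iostream>
#include <stdexcept>
#include <vector>

// Stand-in for model::operation::ReduceSum::Param after this change.
struct ReduceSumParam
{
  std::vector<int> axes; // previously: OperandIndex axis_index;
};

// Stand-in for a constant operand as stored in the model's operand set.
struct ConstOperand
{
  std::vector<std::int32_t> data;
  bool constant;

  bool isConstant() const { return constant; }
  template <typename T> std::vector<T> asVector() const
  {
    return std::vector<T>(data.cbegin(), data.cend());
  }
};

int main()
{
  // Frontend/loader side: 'axes' must be a constant operand so it can be
  // decoded once and stored in the parameter struct.
  ConstOperand axes_operand{{1, 2}, true};
  if (!axes_operand.isConstant())
    throw std::runtime_error("ReduceSum: non-constant 'axes' is not supported.");

  ReduceSumParam param;
  param.axes = axes_operand.asVector<int>();

  // Kernel-generator side: read the axes straight from the param instead of
  // resolving _ctx.at(node.param().axis_index).asVector<int>().
  for (int axis : param.axes)
    std::cout << "reduce over axis " << axis << '\n';
  return 0;
}
```

The same pattern appears for `Mean`, `ReduceMax` and `ReduceMin` in the diffs below: the loaders and the NN API operation factory decode the axes once, and the backends and `OperationValidator` no longer touch the operand context for them.
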
runtime/neurun/backend/acl_cl/KernelGenerator.cc
runtime/neurun/backend/acl_neon/KernelGenerator.cc
runtime/neurun/core/include/model/operation/Mean.h
runtime/neurun/core/include/model/operation/ReduceMax.h
runtime/neurun/core/include/model/operation/ReduceMin.h
runtime/neurun/core/include/model/operation/ReduceSum.h
runtime/neurun/core/src/compiler/OperationValidator.cc
runtime/neurun/frontend/base_loader/base_loader.h
runtime/neurun/frontend/nnapi/wrapper/OperationFactory.cc

diff --git a/runtime/neurun/backend/acl_cl/KernelGenerator.cc b/runtime/neurun/backend/acl_cl/KernelGenerator.cc
index d0bdacd..6f91551 100644
--- a/runtime/neurun/backend/acl_cl/KernelGenerator.cc
+++ b/runtime/neurun/backend/acl_cl/KernelGenerator.cc
@@ -524,7 +524,7 @@ void KernelGenerator::visit(const model::operation::ReduceSum &node)
 {
   const auto output_index{node.getOutputs().at(0)};
   const auto input_index{node.getInputs().at(model::operation::ReduceSum::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto output_alloc = _tensor_builder->at(output_index).get();
   auto input_alloc = _tensor_builder->at(input_index).get();
@@ -1044,7 +1044,7 @@ void KernelGenerator::visit(const model::operation::ReduceMax &node)
 {
   const auto output_index{node.getOutputs().at(0)};
   const auto input_index{node.getInputs().at(model::operation::ReduceMax::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto ofm_alloc = _tensor_builder->at(output_index).get();
   auto ifm_alloc = _tensor_builder->at(input_index).get();
@@ -1798,7 +1798,7 @@ void KernelGenerator::visit(const model::operation::Mean &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::Mean::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
   const auto keep_dims{node.param().keep_dims};
 
   auto ofm_alloc = _tensor_builder->at(ofm_index).get();
@@ -1882,7 +1882,7 @@ void KernelGenerator::visit(const model::operation::ReduceMin &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::ReduceMin::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto ofm_alloc = _tensor_builder->at(ofm_index).get();
   auto ifm_alloc = _tensor_builder->at(ifm_index).get();
diff --git a/runtime/neurun/backend/acl_neon/KernelGenerator.cc b/runtime/neurun/backend/acl_neon/KernelGenerator.cc
index 89251d8..27f487e 100644
--- a/runtime/neurun/backend/acl_neon/KernelGenerator.cc
+++ b/runtime/neurun/backend/acl_neon/KernelGenerator.cc
@@ -433,7 +433,7 @@ void KernelGenerator::visit(const model::operation::Mean &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::Mean::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
   const auto keep_dims{node.param().keep_dims};
 
   auto ofm_alloc = _tensor_builder->at(ofm_index).get();
@@ -1249,7 +1249,7 @@ void KernelGenerator::visit(const model::operation::ReduceMax &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::ReduceMax::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto ofm_alloc = _tensor_builder->at(ofm_index).get();
   auto ifm_alloc = _tensor_builder->at(ifm_index).get();
@@ -1287,7 +1287,7 @@ void KernelGenerator::visit(const model::operation::ReduceMin &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::ReduceMin::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto ofm_alloc = _tensor_builder->at(ofm_index).get();
   auto ifm_alloc = _tensor_builder->at(ifm_index).get();
@@ -1325,7 +1325,7 @@ void KernelGenerator::visit(const model::operation::ReduceSum &node)
 {
   const auto output_index{node.getOutputs().at(0)};
   const auto input_index{node.getInputs().at(model::operation::ReduceSum::Input::INPUT)};
-  const auto &axes{_ctx.at(node.param().axis_index).asVector<int>()};
+  const auto &axes{node.param().axes};
 
   auto output_alloc = _tensor_builder->at(output_index).get();
   auto input_alloc = _tensor_builder->at(input_index).get();
diff --git a/runtime/neurun/core/include/model/operation/Mean.h b/runtime/neurun/core/include/model/operation/Mean.h
index 68ce20d..6841481 100644
--- a/runtime/neurun/core/include/model/operation/Mean.h
+++ b/runtime/neurun/core/include/model/operation/Mean.h
@@ -36,7 +36,7 @@ public:
 
   struct Param
   {
-    OperandIndex axis_index;
+    std::vector<int> axes;
     bool keep_dims;
   };
 
diff --git a/runtime/neurun/core/include/model/operation/ReduceMax.h b/runtime/neurun/core/include/model/operation/ReduceMax.h
index 054a9d9..18bd906 100644
--- a/runtime/neurun/core/include/model/operation/ReduceMax.h
+++ b/runtime/neurun/core/include/model/operation/ReduceMax.h
@@ -38,7 +38,7 @@ public:
 
   struct Param
   {
-    OperandIndex axis_index;
+    std::vector<int> axes;
   };
 
 public:
diff --git a/runtime/neurun/core/include/model/operation/ReduceMin.h b/runtime/neurun/core/include/model/operation/ReduceMin.h
index f8ef615..6541a2b 100644
--- a/runtime/neurun/core/include/model/operation/ReduceMin.h
+++ b/runtime/neurun/core/include/model/operation/ReduceMin.h
@@ -38,7 +38,7 @@ public:
 
   struct Param
   {
-    OperandIndex axis_index;
+    std::vector<int> axes;
   };
 
 public:
diff --git a/runtime/neurun/core/include/model/operation/ReduceSum.h b/runtime/neurun/core/include/model/operation/ReduceSum.h
index 94b1bc1..8ed87c2 100644
--- a/runtime/neurun/core/include/model/operation/ReduceSum.h
+++ b/runtime/neurun/core/include/model/operation/ReduceSum.h
@@ -36,7 +36,7 @@ public:
 
   struct Param
   {
-    OperandIndex axis_index;
+    std::vector<int> axes;
   };
 
 public:
diff --git a/runtime/neurun/core/src/compiler/OperationValidator.cc b/runtime/neurun/core/src/compiler/OperationValidator.cc
index d7c9d02..92b2f9a 100644
--- a/runtime/neurun/core/src/compiler/OperationValidator.cc
+++ b/runtime/neurun/core/src/compiler/OperationValidator.cc
@@ -140,24 +140,20 @@ void OperationValidator::visit(const model::operation::ReduceSum &node)
 
   const auto output_index{node.getOutputs().at(0)};
   const auto input_index{node.getInputs().at(model::operation::ReduceSum::Input::INPUT)};
-  const auto axis_index{node.param().axis_index};
+  const auto &axes = node.param().axes;
 
   UNUSED_RELEASE(output_index);
   UNUSED_RELEASE(input_index);
-  UNUSED_RELEASE(axis_index);
+  UNUSED_RELEASE(axes);
 
   const auto input_shape = _ctx.at(input_index).shape();
   const auto output_shape = _ctx.at(output_index).shape();
-  const auto axis_shape = _ctx.at(axis_index).shape();
 
   UNUSED_RELEASE(output_shape);
   UNUSED_RELEASE(input_shape);
-  UNUSED_RELEASE(axis_shape);
 
   assert(input_shape.rank() <= 4);
   assert(output_shape.rank() <= input_shape.rank());
-  assert(_ctx.at(axis_index).isConstant());
-  assert(axis_shape.rank() == 0 || axis_shape.rank() == 1);
 
  // NOTE For 4-dimensional tensors, if the ranks of the input and output differ, this runtime
  // only supports reducing height and width, or reducing depth.
@@ -214,20 +210,17 @@ void OperationValidator::visit(const model::operation::ReduceMax &node)
 {
   const auto output_index{node.getOutputs().at(0)};
   const auto input_index{node.getInputs().at(model::operation::ReduceMax::Input::INPUT)};
-  const auto axis_index{node.param().axis_index};
+  const auto &axes = node.param().axes;
 
   auto output_shape = _ctx.at(output_index).shape();
   auto input_shape = _ctx.at(input_index).shape();
-  auto axis_shape = _ctx.at(axis_index).shape();
 
   UNUSED_RELEASE(output_shape);
   UNUSED_RELEASE(input_shape);
-  UNUSED_RELEASE(axis_shape);
+  UNUSED_RELEASE(axes);
 
   assert(input_shape.rank() <= 4);
   assert(output_shape.rank() <= input_shape.rank());
-  assert(_ctx.at(axis_index).isConstant());
-  assert(axis_shape.rank() == 0 || axis_shape.rank() == 1);
 
  // NOTE For 4-dimensional tensors, if the ranks of the input and output differ, this runtime
  // only supports reducing height and width, or reducing depth.
@@ -642,20 +635,17 @@ void OperationValidator::visit(const model::operation::ReduceMin &node)
 {
   const auto ofm_index{node.getOutputs().at(0)};
   const auto ifm_index{node.getInputs().at(model::operation::ReduceMin::Input::INPUT)};
-  const auto axis_index{node.param().axis_index};
+  const auto &axes = node.param().axes;
 
   auto ifm_shape = _ctx.at(ifm_index).shape();
   auto ofm_shape = _ctx.at(ofm_index).shape();
-  auto axis_shape = _ctx.at(axis_index).shape();
 
   UNUSED_RELEASE(ifm_shape);
   UNUSED_RELEASE(ofm_shape);
-  UNUSED_RELEASE(axis_shape);
+  UNUSED_RELEASE(axes);
 
   assert(ifm_shape.rank() <= 4);
   assert(ofm_shape.rank() <= ifm_shape.rank());
-  assert(_ctx.at(axis_index).isConstant());
-  assert(axis_shape.rank() == 0 || axis_shape.rank() == 1);
 
  // NOTE For 4-dimensional tensors, if the ranks of the input and output differ, this runtime
  // only supports reducing height and width, or reducing depth.
diff --git a/runtime/neurun/frontend/base_loader/base_loader.h b/runtime/neurun/frontend/base_loader/base_loader.h
index c28f464..269b3d8 100644
--- a/runtime/neurun/frontend/base_loader/base_loader.h
+++ b/runtime/neurun/frontend/base_loader/base_loader.h
@@ -679,16 +679,18 @@ void BaseLoader<LoaderDomain, SpecificLoader>::loadMean(const Operator *op)
   model::OperandIndexSequence inputs;
   model::OperandIndexSequence outputs;
 
-  const auto input_index = (*op->inputs())[0];
-  inputs.append(model::OperandIndex(input_index));
-  const auto output_index = (*op->outputs())[0];
-  outputs.append(model::OperandIndex(output_index));
+  loadOperationIO(op, inputs, outputs);
+  auto input = inputs.at(0);
+  auto axes = inputs.at(1);
+
+  if (!_graph.operands().at(axes).isConstant())
+    throw std::runtime_error("Mean: non-constant 'axes' is not supported.");
 
   model::operation::Mean::Param param;
-  param.axis_index = model::OperandIndex((*op->inputs())[1]);
+  param.axes = _graph.operands().at(axes).template asVector<int>();
   param.keep_dims = op->builtin_options_as_ReducerOptions()->keep_dims();
 
-  std::unique_ptr<model::Operation> new_op(new model::operation::Mean(inputs, outputs, param));
+  std::unique_ptr<model::Operation> new_op(new model::operation::Mean({input}, outputs, param));
   _graph.addOperation(std::move(new_op));
 }
 
@@ -698,15 +700,19 @@ void BaseLoader<LoaderDomain, SpecificLoader>::loadReduceMax(const Operator *op)
   model::OperandIndexSequence inputs;
   model::OperandIndexSequence outputs;
 
-  const auto input_index = (*op->inputs())[0];
-  inputs.append(model::OperandIndex(input_index));
-  const auto output_index = (*op->outputs())[0];
-  outputs.append(model::OperandIndex(output_index));
+  loadOperationIO(op, inputs, outputs);
+  auto input = inputs.at(0);
+  auto axes = inputs.at(1);
+
+  // FIXME Handle ReducerOptions.
+  if (!_graph.operands().at(axes).isConstant())
+    throw std::runtime_error("ReduceMax: non-constant 'axes' is not supported.");
 
   model::operation::ReduceMax::Param param;
-  param.axis_index = model::OperandIndex((*op->inputs())[1]);
+  param.axes = _graph.operands().at(axes).template asVector<int>();
 
-  std::unique_ptr<model::Operation> new_op(new model::operation::ReduceMax(inputs, outputs, param));
+  std::unique_ptr<model::Operation> new_op(
+      new model::operation::ReduceMax({input}, outputs, param));
   _graph.addOperation(std::move(new_op));
 }
 
@@ -799,13 +805,22 @@ void BaseLoader<LoaderDomain, SpecificLoader>::loadBatchToSpaceND(const Operator
 template <typename LoaderDomain, typename SpecificLoader>
 void BaseLoader<LoaderDomain, SpecificLoader>::loadReduceSum(const Operator *op)
 {
-  model::OperandIndexSequence inputs{(*op->inputs())[0]};
-  model::OperandIndexSequence outputs{(*op->outputs())[0]};
+  model::OperandIndexSequence inputs;
+  model::OperandIndexSequence outputs;
+
+  loadOperationIO(op, inputs, outputs);
+  auto input = inputs.at(0);
+  auto axes = inputs.at(1);
+
+  // FIXME Handle ReducerOptions.
+  if (!_graph.operands().at(axes).isConstant())
+    throw std::runtime_error("ReduceSum: non-constant 'axes' is not supported.");
 
   model::operation::ReduceSum::Param param;
-  param.axis_index = model::OperandIndex{static_cast<uint32_t>((*op->inputs())[1])};
+  param.axes = _graph.operands().at(axes).template asVector<int>();
 
-  std::unique_ptr<model::Operation> new_op{new model::operation::ReduceSum{inputs, outputs, param}};
+  std::unique_ptr<model::Operation> new_op{
+      new model::operation::ReduceSum{{input}, outputs, param}};
   _graph.addOperation(std::move(new_op));
 }
 
diff --git a/runtime/neurun/frontend/nnapi/wrapper/OperationFactory.cc b/runtime/neurun/frontend/nnapi/wrapper/OperationFactory.cc
index 214a56a..b88629e 100644
--- a/runtime/neurun/frontend/nnapi/wrapper/OperationFactory.cc
+++ b/runtime/neurun/frontend/nnapi/wrapper/OperationFactory.cc
@@ -519,7 +519,7 @@ OperationFactory::OperationFactory()
   };
 
   _map[ANEURALNETWORKS_REDUCE_SUM_EX] = [](const OperationFactory::Param &init_param,
-                                           neurun::model::Operands &) {
+                                           neurun::model::Operands &operands) {
     assert(init_param.input_count == 2);
     assert(init_param.output_count == 1);
 
@@ -530,10 +530,11 @@ OperationFactory::OperationFactory()
 
     OperandIndexSequence inputs{init_param.inputs[0]};
     OperandIndexSequence outputs{init_param.outputs[0]};
+    std::vector<std::int32_t> axes =
+        operands.at(OperandIndex{init_param.inputs[1]}).asVector<std::int32_t>();
 
     operation::ReduceSum::Param param;
-
-    param.axis_index = OperandIndex{init_param.inputs[1]};
+    param.axes.assign(axes.cbegin(), axes.cend());
 
     return new operation::ReduceSum{inputs, outputs, param};
   };
@@ -789,7 +790,7 @@ OperationFactory::OperationFactory()
   };
 
   _map[ANEURALNETWORKS_REDUCE_MAX_EX] = [](const OperationFactory::Param &init_param,
-                                           neurun::model::Operands &) {
+                                           neurun::model::Operands &operands) {
     assert(init_param.input_count == 2 && init_param.output_count == 1);
 
     OperandIndexSequence outputs{init_param.outputs[0]};
@@ -799,9 +800,11 @@ OperationFactory::OperationFactory()
     //  0 -> Input Tensor Index
     //  1 -> Axis Tensor Index
     OperandIndexSequence inputs{init_param.inputs[0]};
+    std::vector<std::int32_t> axes =
+        operands.at(OperandIndex{init_param.inputs[1]}).asVector<std::int32_t>();
 
     operation::ReduceMax::Param param;
-    param.axis_index = OperandIndex{init_param.inputs[1]};
+    param.axes.assign(axes.cbegin(), axes.cend());
 
     return new operation::ReduceMax{inputs, outputs, param};
   };
@@ -1446,9 +1449,11 @@ OperationFactory::OperationFactory()
     //  1 -> axis Tensor Index
     //  2 -> keep_dims Index
     OperandIndexSequence inputs{init_param.inputs[0]};
+    std::vector<std::int32_t> axes =
+        operands.at(OperandIndex{init_param.inputs[1]}).asVector<std::int32_t>();
 
     operation::Mean::Param param;
-    param.axis_index = OperandIndex{init_param.inputs[1]};
+    param.axes.assign(axes.cbegin(), axes.cend());
     param.keep_dims = operands.at(OperandIndex{init_param.inputs[2]}).asScalar<int32_t>() != 0;
 
     return new operation::Mean{inputs, outputs, param};
@@ -1510,7 +1515,7 @@ OperationFactory::OperationFactory()
   };
 
   _map[ANEURALNETWORKS_REDUCE_MIN_EX] = [](const OperationFactory::Param &init_param,
-                                           neurun::model::Operands &) {
+                                           neurun::model::Operands &operands) {
     assert(init_param.input_count == 2 && init_param.output_count == 1);
 
     OperandIndexSequence outputs{init_param.outputs[0]};
@@ -1520,9 +1525,11 @@ OperationFactory::OperationFactory()
     //  0 -> Input Tensor Index
     //  1 -> Axis Tensor Index
     OperandIndexSequence inputs{init_param.inputs[0]};
+    std::vector<std::int32_t> axes =
+        operands.at(OperandIndex{init_param.inputs[1]}).asVector<std::int32_t>();
 
     operation::ReduceMin::Param param;
-    param.axis_index = OperandIndex{init_param.inputs[1]};
+    param.axes.assign(axes.cbegin(), axes.cend());
 
     return new operation::ReduceMin{inputs, outputs, param};
   };