Reimplement class InferenceEngineVision using InferenceEngineCommon 04/214204/4 submit/tizen/20190924.061550
author Tae-Young Chung <ty83.chung@samsung.com>
Wed, 18 Sep 2019 08:30:35 +0000 (17:30 +0900)
committer Tae-Young Chung <ty83.chung@samsung.com>
Mon, 23 Sep 2019 06:09:43 +0000 (15:09 +0900)
This commit removes IInferenceEngineVision and reimplements InferenceEngineVision,
as the commit title says.
In detail,
InferenceEngineCommon provides the general inference operations, such as
setting parameters and loading a model.
Thus, InferenceEngineVision can be implemented on top of InferenceEngineCommon
instead of IInferenceEngineVision.
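
For illustration, a minimal sketch of the new composition (names follow
include/inference_engine_vision_impl.h in this commit; error handling omitted):

    // InferenceEngineVision now owns an InferenceEngineCommon instead of
    // inheriting from IInferenceEngineVision.
    class InferenceEngineVision {
    public:
        InferenceEngineVision(std::string backend)
            : mCommonEngine(new InferenceEngineCommon(backend)) {}
        ~InferenceEngineVision() { delete mCommonEngine; }
        int Load();   // delegates to mCommonEngine->Load(), then maps the input buffer
    private:
        InferenceEngineCommon *mCommonEngine;
    };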

Change-Id: I7a43bc6ff97e5713c1ac7ae705ff52100f5e4977
Signed-off-by: Tae-Young Chung <ty83.chung@samsung.com>
common/inference_engine_common_impl.cpp
include/inference_engine_common.h
include/inference_engine_common_impl.h
include/inference_engine_type.h
include/inference_engine_vision.h [deleted file]
include/inference_engine_vision_impl.h
packaging/inference-engine-interface.spec
vision/inference_engine_vision_impl.cpp

index c04c9fcce473bc004e4bbfe6ead04768df8c108c..d1aa2ce99e22efa72dad320d14ab5e1dd8e6fbcd 100644 (file)
@@ -37,33 +37,34 @@ extern "C" {
 namespace InferenceEngineInterface {
 namespace Common {
 
-InferenceEngineCommon::InferenceEngineCommon(std::string backend)
+InferenceEngineCommon::InferenceEngineCommon(std::string backend) :
+    handle(nullptr),
+    engine(nullptr)
 {
     LOGE("ENTER");
     mBackendLibName = "libinference-engine-" + backend + ".so";
+    LOGE("lib: %s", mBackendLibName.c_str());
     LOGE("LEAVE");
 }
 
 InferenceEngineCommon::~InferenceEngineCommon()
 {
     LOGW("ENTER");
-    if (handle){
-        destroy_t *engineDestroy = (destroy_t*)dlsym(handle, "EngineCommonDestroy");
-        engineDestroy(engine);
-        dlclose(handle);
-        engine = nullptr;
-        handle = nullptr;
-    }
+    if (handle)
+        Deinit();
 
     LOGW("LEAVE");
 }
 
 int InferenceEngineCommon::Init(std::string configFile,
-            std::string weightFile, std::string userFile)
+            std::string weightFile)
 {
     LOGW("ENTER");
     char *error = NULL;
-    handle = dlopen(mBackendLibName.c_str(), RTLD_LAZY);
+    LOGI("lib: %s", mBackendLibName.c_str());
+    handle = dlopen(mBackendLibName.c_str(), RTLD_NOW/*RTLD_LAZY*/);
+    LOGI("HANDLE : [%p]", handle);
+
     if (!handle) {
         LOGE("Fail to dlopen %s", mBackendLibName.c_str());
         LOGE("Error: %s\n", dlerror());
@@ -77,7 +78,7 @@ int InferenceEngineCommon::Init(std::string configFile,
         return INFERENCE_ENGINE_ERROR_INTERNAL;
     }
     
-    engine = EngineInit(configFile, weightFile, userFile);
+    engine = EngineInit(configFile, weightFile);
     if (engine == NULL) {
         LOGE("Fail to EngineInit");
         dlclose(handle);
@@ -90,7 +91,17 @@ int InferenceEngineCommon::Init(std::string configFile,
 
 void InferenceEngineCommon::Deinit()
 {
-    ;
+    LOGW("ENTER");
+
+    if (handle) {
+        destroy_t *engineDestroy = (destroy_t*)dlsym(handle, "EngineCommonDestroy");
+        engineDestroy(engine);
+        dlclose(handle);
+        engine = nullptr;
+        handle = nullptr;
+    }
+
+    LOGW("LEAVE");
 }
 
 int InferenceEngineCommon::SetInputTensorParam()
@@ -122,7 +133,7 @@ int InferenceEngineCommon::SetTargetDevice(inference_target_type_e type)
     return ret;
 }
 
-int InferenceEngineCommon::Load(inference_input_type_e type)
+int InferenceEngineCommon::Load()
 {
     int ret = engine->Load();
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
@@ -132,11 +143,29 @@ int InferenceEngineCommon::Load(inference_input_type_e type)
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
         LOGE("Fail to load CreateInputLayerPassage");
 
+    return ret;
+}
 
-    ret = engine->PrepareInputLayerPassage(type);
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to load PrepareInputLayerPassage");
+int InferenceEngineCommon::GetInputLayerAttrType()
+{
+    return engine->GetInputLayerAttrType();
+}
 
+void * InferenceEngineCommon::GetInputDataPtr()
+{
+    return engine->GetInputDataPtr();
+}
+
+int InferenceEngineCommon::SetInputDataBuffer(tensor_t data)
+{
+    return engine->SetInputDataBuffer(data);
+}
+
+int InferenceEngineCommon::Run()
+{
+    int ret = engine->Run();
+    if (ret != INFERENCE_ENGINE_ERROR_NONE)
+        LOGE("Fail to run InferenceEngineCommon");
 
     return ret;
 }
@@ -145,7 +174,7 @@ int InferenceEngineCommon::Run(std::vector<float> tensor)
 {
     int ret = engine->Run(tensor);
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to run InferenceEngineVision");
+        LOGE("Fail to run InferenceEngineCommon");
 
     return ret;
 }
@@ -160,13 +189,14 @@ int InferenceEngineCommon::SetInputTensorParamNode(std::string node)
     return ret;
 }
 
-int InferenceEngineCommon::GetInferenceResult(std::vector<std::vector<int>>& dimInfo, std::vector<float*>& results)
+int InferenceEngineCommon::GetInferenceResult(tensor_t& results)
 {
     LOGE("ENTER");
-    int ret = engine->GetInferenceResult(dimInfo, results);
+    int ret = engine->GetInferenceResult(results);
 
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
         LOGE("Fail to GetInferenceResult");
+
     LOGE("LEAVE");
     return ret;
 }
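
The Init()/Deinit() pair above follows the usual dlopen()/dlsym() plug-in
pattern. As a simplified sketch (the symbol names come from this interface;
the backend name and file paths are placeholders, error handling omitted):

    void *handle = dlopen("libinference-engine-tflite.so", RTLD_NOW);
    init_t *EngineInit = (init_t *)dlsym(handle, "EngineCommonInit");
    IInferenceEngineCommon *engine = EngineInit("model.cfg", "model.weights");
    // ... use the engine ...
    destroy_t *EngineDestroy = (destroy_t *)dlsym(handle, "EngineCommonDestroy");
    EngineDestroy(engine);
    dlclose(handle);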
index f7fc23e0226464aa6bd13b00fd6cd28833d78f3b..78ba3c8abb2904bf92305703f401118019b02fac 100644 (file)
@@ -30,32 +30,96 @@ public:
 
     virtual ~IInferenceEngineCommon() {};
 
-    // InputTensor
+    /**
+     * @brief Set parameters for an input tensor.
+     *
+     * @since_tizen 5.5
+     */
     virtual int SetInputTensorParam() = 0;
 
+    /**
+     * @brief Set an input node name.
+     *
+     * @since_tizen 5.5
+     */
     virtual int SetInputTensorParamNode(std::string node) = 0;
 
-    // OutputTensor
+    /**
+     * @brief Set parameters for output tensors.
+     *
+     * @since_tizen 5.5
+     */
     virtual int SetOutputTensorParam() = 0;
 
+    /**
+     * @brief Set output nodes' names.
+     *
+     * @since_tizen 5.5
+     */
     virtual int SetOutputTensorParamNodes(std::vector<std::string> nodes) = 0;
 
+    /**
+     * @brief Set target device.
+     * @details See #inference_target_type_e
+     *
+     * @since_tizen 5.5
+     */
     virtual int SetTargetDevice(inference_target_type_e type) = 0;
 
-    // Load and Run
+    /**
+     * @brief Load model data.
+     *
+     * @since_tizen 5.5
+     */
     virtual int Load() = 0;
 
+    /**
+     * @brief Create memory for an input layer passage.
+     *
+     * @since_tizen 5.5
+     */
     virtual int CreateInputLayerPassage() = 0;
 
-    virtual int PrepareInputLayerPassage(inference_input_type_e type) = 0;
+    /**
+     * @brief Get an input layer's type such as float32, float16, and so on.
+     *
+     * @since_tizen 5.5
+     */
+    virtual int GetInputLayerAttrType() = 0;
+
+    /**
+     * @brief Get an input data pointer.
+     *
+     * @since_tizen 5.5
+     */
+    virtual void* GetInputDataPtr() = 0;
+
+    /**
+     * @brief Set an input data buffer.
+     *
+     * @since_tizen 5.5
+     */
+    virtual int SetInputDataBuffer(tensor_t data) = 0;
+
+    /**
+     * @brief Run an inference.
+     *
+     * @since_tizen 5.5
+     */
+    virtual int Run() = 0;
 
     virtual int Run(std::vector<float> tensor) = 0;
 
-    virtual int GetInferenceResult(std::vector<std::vector<int>>& dimInfo, std::vector<float*>& results) = 0;
+    /**
+     * @brief Get inference results.
+     *
+     * @since_tizen 5.5
+     */
+    virtual int GetInferenceResult(tensor_t& results) = 0;
 };
 
 typedef void destroy_t(IInferenceEngineCommon*);
-typedef IInferenceEngineCommon* init_t(std::string configFile, std::string weightFile, std::string userFile);
+typedef IInferenceEngineCommon* init_t(std::string configFile, std::string weightFile);
 } /* Common */
 } /* InferenceEngineInterface */
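
A backend library is expected to implement IInferenceEngineCommon and export
the two factory symbols matching init_t and destroy_t above; roughly (a hedged
sketch, MyBackend is a hypothetical backend class):

    class MyBackend : public IInferenceEngineCommon {
        // ... override the pure virtual methods above ...
    };

    extern "C" {
    IInferenceEngineCommon* EngineCommonInit(std::string configFile, std::string weightFile)
    {
        return new MyBackend(configFile, weightFile);  // hypothetical constructor
    }

    void EngineCommonDestroy(IInferenceEngineCommon *engine)
    {
        delete engine;
    }
    }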
 
index ab78c912bea62d13dabc09b471325e71d2b9250d..6402f5ebf8ef74a1dc3cdd5df6049ace8e3abf13 100644 (file)
@@ -33,33 +33,106 @@ public:
 
     ~InferenceEngineCommon();
 
-    int Init(std::string configFile,
-            std::string weightFile, std::string UserFile);
-
+    /**
+     * @brief Initialization.
+     * @details Load the backend engine by dlopen() and initialize the engine by
+     *          calling EngineCommonInit which is found by dlsym().
+     * @since_tizen 5.5
+     */
+    int Init(std::string configFile, std::string weightFile);
+
+    /**
+     * @brief De-initialization.
+     * @details Destroy the engine by calling EngineCommonDestroy, which is found by dlsym().
+     *          Close the engine by dlclose().
+     * @since_tizen 5.5
+     */
     void Deinit();
 
-    // InputTensor
+    /**
+     * @brief Set parameters for an input tensor.
+     * @details Wrapper of class IInferenceEngineCommon
+     *
+     * @since_tizen 5.5
+     */
     int SetInputTensorParam();
 
+    /**
+     * @brief Set an input node name.
+     *
+     * @since_tizen 5.5
+     */
     int SetInputTensorParamNode(std::string node);
 
-    // OutputTensor
+    /**
+     * @brief Set parameters for output tensors.
+     *
+     * @since_tizen 5.5
+     */
     int SetOutputTensorParam();
 
+    /**
+     * @brief Set output nodes' names.
+     *
+     * @since_tizen 5.5
+     */
     int SetOutputTensorParamNodes(std::vector<std::string> nodes);
 
+    /**
+     * @brief Set target device.
+     * @details See #inference_target_type_e
+     *
+     * @since_tizen 5.5
+     */
     int SetTargetDevice(inference_target_type_e type);
 
-    // Load and Run
-    int Load(inference_input_type_e type);
+    /**
+     * @brief Load model data.
+     *
+     * @since_tizen 5.5
+     */
+    int Load();
+
+    /**
+     * @brief Get an input layer's type such as float32, float16, and so on.
+     *
+     * @since_tizen 5.5
+     */
+    int GetInputLayerAttrType();
+
+    /**
+     * @brief Get an input data pointer.
+     *
+     * @since_tizen 5.5
+     */
+    void* GetInputDataPtr();
+
+    /**
+     * @brief Set an input data buffer.
+     *
+     * @since_tizen 5.5
+     */
+    int SetInputDataBuffer(tensor_t data);
+
+    /**
+     * @brief Run an inference.
+     *
+     * @since_tizen 5.5
+     */
+    int Run();
 
     int Run(std::vector<float> tensor);
 
-    int GetInferenceResult(std::vector<std::vector<int>>& dimInfo, std::vector<float*>& results);
+    /**
+     * @brief Get inference results.
+     *
+     * @since_tizen 5.5
+     */
+    int GetInferenceResult(tensor_t& results);
 
 private:
     std::string mBackendLibName;
-    std::vector<std::string> mUserListName;
+
 protected:
     void *handle;
     IInferenceEngineCommon *engine;
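
As a hedged usage sketch of this class (the backend name, file paths, and the
INFERENCE_TARGET_CPU value are placeholders/assumptions):

    InferenceEngineCommon engine("tflite");       // loads libinference-engine-tflite.so
    engine.Init("model.cfg", "model.weights");    // dlopen() + EngineCommonInit
    engine.SetInputTensorParamNode("input");
    engine.SetOutputTensorParamNodes({"output"});
    engine.SetTargetDevice(INFERENCE_TARGET_CPU);
    engine.Load();
    engine.Run();
    tensor_t results;
    engine.GetInferenceResult(results);
    engine.Deinit();                              // EngineCommonDestroy + dlclose()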
index 5860582fe4a3fa8b37945e3ff454b1534399f775..425ba52d2cecb20ceb9496b16da07b49c34db8c2 100644 (file)
@@ -17,8 +17,6 @@
 #ifndef __INFERENCE_ENGINE_TYPE_H__
 #define __INFERENCE_ENGINE_TYPE_H__
 
-#include <opencv2/core.hpp>
-
 #ifdef __cplusplus
 extern "C" {
 #endif /* __cplusplus */
@@ -43,44 +41,27 @@ typedef enum {
        INFERENCE_TARGET_MAX
 } inference_target_type_e;
 
-typedef enum {
-       INFERENCE_INPUT_GENERAL = 0,
-       INFERENCE_INPUT_IMAGE,
-       INFERENCE_INPUT_MAX
-} inference_input_type_e;
-
-typedef struct _ImageClassficationResults {
-    int number_of_classes;
-    std::vector<int> indices;
-    std::vector<std::string> names;
-    std::vector<float> confidences;
-} ImageClassificationResults; /**< structure ImageClassificationResults */
-
-typedef struct _ObjectDetectionResults {
-    int number_of_objects;
-    std::vector<int> indices;
-    std::vector<std::string> names;
-    std::vector<float> confidences;
-    std::vector<cv::Rect> locations;
-} ObjectDetectionResults;  /**< structure ObjectDetectionResults */
-
-typedef struct _FaceDetectionResults {
-    int number_of_faces;
-    std::vector<float> confidences;
-    std::vector<cv::Rect> locations;
-} FaceDetectionResults;  /**< structure ObjectDetectionResults */
-
-typedef struct _FacialLandMarkDetectionResults {
-    int number_of_landmarks;
-    std::vector<cv::Point> locations;
-} FacialLandMarkDetectionResults;  /**< structure ObjectDetectionResults */
-
-typedef struct _InferenceResults{
-    int dimInfoSize;
+/**
+ * @brief Tensor defined by its dimensions and the corresponding data
+ * @details @a dimInfo is the dimension information
+ *          of a tensor, which is a multi-dimensional matrix. @a data holds the
+ *          data pointers corresponding to @a dimInfo. For example, for an input
+ *          image tensor with resolution 224 x 224 and 3 channels:
+ *          @code
+ *          // assume that the image data address is known
+ *          float *pImageData = ...;
+ *          std::vector<int> dim{ 1, 3, 224, 224 };
+ *          tensor_t inputTensor;
+ *          inputTensor.dimInfo.push_back(dim);
+ *          inputTensor.data.push_back((void*)pImageData);
+ *
+ *          // Do something with inputTensor
+ *          @endcode
+ * @since_tizen 5.5
+ */
+typedef struct _tensor_t {
     std::vector<std::vector<int>> dimInfo;
-    std::vector<float*> data;
-} InferenceResults; /**< structure InferenceResults */
-
+    std::vector<void*> data;
+} tensor_t;
 
 #ifdef __cplusplus
 }
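
Conversely, a hedged sketch of consuming a tensor_t returned by
GetInferenceResult() (the output layout is backend-defined; the float data and
the dimension indexing here are assumptions):

    tensor_t results;
    engine.GetInferenceResult(results);
    // One dimInfo/data pair per output layer.
    for (size_t i = 0; i < results.data.size(); ++i) {
        float *out = reinterpret_cast<float*>(results.data[i]);
        int count = results.dimInfo[i][1];  // e.g. number of classes
        for (int j = 0; j < count; ++j)
            LOGI("output[%zu][%d] = %f", i, j, out[j]);
    }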
diff --git a/include/inference_engine_vision.h b/include/inference_engine_vision.h
deleted file mode 100644 (file)
index 26f4f89..0000000
+++ /dev/null
@@ -1,71 +0,0 @@
-/**
- * Copyright (c) 2019 Samsung Electronics Co., Ltd All Rights Reserved
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-#ifndef __INFERENCE_ENGINE_VISION_H__
-#define __INFERENCE_ENGINE_VISION_H__
-
-#include <vector>
-#include <string>
-
-#include "inference_engine_type.h"
-#include "inference_engine_common.h"
-#include <opencv2/core.hpp>
-
-namespace InferenceEngineInterface {
-namespace Vision {
-
-class IInferenceEngineVision : public virtual Common::IInferenceEngineCommon {
-public:
-    using Common::IInferenceEngineCommon::GetInferenceResult;
-    virtual ~IInferenceEngineVision() {};
-
-    // InputTensor
-
-    virtual int SetInputTensorParamInput(int width, int height, int dim, int ch) = 0;
-
-    virtual int SetInputTensorParamNorm(double deviation, double mean) = 0;
-
-    // OutputTensor
-
-    virtual int SetOutputTensorParamThresHold(double threshold) = 0;
-
-    virtual int SetOutputTensorParamNumbers(int number)  = 0;
-
-    virtual int SetOutputTensorParamType(int type) = 0;
-
-    // Load and Run
-    virtual int Run(cv::Mat tensor) = 0;
-
-    virtual int GetInferenceResult(ImageClassificationResults& results) = 0;
-
-    virtual int GetInferenceResult(ObjectDetectionResults& results) = 0;
-
-    virtual int GetInferenceResult(FaceDetectionResults& results) = 0;
-
-    virtual int GetInferenceResult(FacialLandMarkDetectionResults& results) = 0;
-
-    virtual int GetNumberOfOutputs() = 0;
-    
-    virtual void SetUserListName(std::string userlist) = 0;
-};
-
-typedef void destroy_t(IInferenceEngineVision*);
-typedef IInferenceEngineVision* init_t(std::string configFile, std::string weightFile, std::string userFile);
-} /* Vision */
-} /* InferenceEngineInterface */
-
-#endif /* __INFERENCE_ENGINE_VISION_H__ */
index 89a1c131116fa7b186d67881a7808bc6b0494ef9..6d181b586873586281d485829b94f0079c45a3c3 100644 (file)
 #include <vector>
 #include <string>
 #include "inference_engine_common_impl.h"
-#include "inference_engine_vision.h"
+#include "inference_engine_common.h"
 #include "inference_engine_type.h"
 #include <opencv2/core.hpp>
+#include <opencv2/imgproc.hpp>
 
 
+using namespace InferenceEngineInterface::Common;
+
+typedef struct _ImageClassificationResults {
+    int number_of_classes;
+    std::vector<int> indices;
+    std::vector<std::string> names;
+    std::vector<float> confidences;
+} ImageClassificationResults; /**< structure ImageClassificationResults */
+
+typedef struct _ObjectDetectionResults {
+    int number_of_objects;
+    std::vector<int> indices;
+    std::vector<std::string> names;
+    std::vector<float> confidences;
+    std::vector<cv::Rect> locations;
+} ObjectDetectionResults;  /**< structure ObjectDetectionResults */
+
+typedef struct _FaceDetectionResults {
+    int number_of_faces;
+    std::vector<float> confidences;
+    std::vector<cv::Rect> locations;
+} FaceDetectionResults;  /**< structure FaceDetectionResults */
+
+typedef struct _FacialLandMarkDetectionResults {
+    int number_of_landmarks;
+    std::vector<cv::Point> locations;
+} FacialLandMarkDetectionResults;  /**< structure FacialLandMarkDetectionResults */
+
 namespace InferenceEngineInterface {
 namespace Vision {
 
-class InferenceEngineVision : public Common::InferenceEngineCommon {
+class InferenceEngineVision {
 public:
-    using Common::InferenceEngineCommon::GetInferenceResult;
+
     InferenceEngineVision(std::string backend);
 
     ~InferenceEngineVision();
 
+    /**
+     * @brief Initialization.
+     * @since_tizen 5.5
+     */
     int Init(std::string configFile,
             std::string weightFile, std::string UserFile);
 
+    /**
+     * @brief De-initialization.
+     * @since_tizen 5.5
+     */
     void Deinit();
 
-    // Input Tensor parameters
+    /**
+     * @brief Set an input node name.
+     *
+     * @since_tizen 5.5
+     */
+    int SetInputTensorParamNode(std::string node);
+
+    /**
+     * @brief Set an input image's information.
+     *
+     * @since_tizen 5.5
+     */
     int SetInputTensorParamInput(int width, int height, int dim, int ch);
 
+    /**
+     * @brief Set mean and deviation values.
+     *
+     * @since_tizen 5.5
+     */
     int SetInputTensorParamNorm(double deviation, double mean);
 
-    // Output Tensor parameters
+    /**
+     * @brief Set output nodes' names.
+     *
+     * @since_tizen 5.5
+     */
+    int SetOutputTensorParamNodes(std::vector<std::string> nodes);
+
+    /**
+     * @brief Set threshold value.
+     *
+     * @since_tizen 5.5
+     */
     int SetOutputTensorParamThresHold(double threshold);
 
+    /**
+     * @brief Set the number of outputs.
+     *
+     * @since_tizen 5.5
+     */
     int SetOutputTensorParamNumbers(int number);
 
-    int SetOutputTensorParamType(int type);
-
+    /**
+     * @brief Set target device.
+     * @details See #inference_target_type_e
+     *
+     * @since_tizen 5.5
+     */
+    int SetTargetDevice(inference_target_type_e type);
+
+    /**
+     * @brief Load model data.
+     *
+     * @since_tizen 5.5
+     */
+    int Load();
+
+    /**
+     * @brief Run an inference with a tensor.
+     *
+     * @since_tizen 5.5
+     */
     int Run(cv::Mat tensor);
 
+    /**
+     * @brief Get inference results of image classification.
+     *
+     * @since_tizen 5.5
+     */
     int GetInferenceResult(ImageClassificationResults& results);
 
+    /**
+     * @brief Get inference results of object detection.
+     *
+     * @since_tizen 5.5
+     */
     int GetInferenceResult(ObjectDetectionResults& results);
 
+    /**
+     * @brief Get inference results of face detection.
+     *
+     * @since_tizen 5.5
+     */
     int GetInferenceResult(FaceDetectionResults& results);
 
+    /**
+     * @brief Get inference results of facial landmark detection.
+     *
+     * @since_tizen 5.5
+     */
     int GetInferenceResult(FacialLandMarkDetectionResults& results);
 
-    int GetNumberOfOutputs();
+    /**
+     * @brief Set a user file.
+     * @details Image classification and object detection need a user file
+     *          containing the labels of the classes and objects.
+     * @since_tizen 5.5
+     */
+    int SetUserFile(std::string filename);
 
+protected:
+    /**
+     * @brief Set an input from a cv::Mat.
+     * @details Pre-process the given image and copy it into the input buffer.
+     *
+     * @since_tizen 5.5
+     */
+    int SetInput(cv::Mat cvImg);
+
+    /**
+     * @brief Set user list name.
+     *
+     * @since_tizen 5.5
+     */
     void SetUserListName(std::string userlist);
 
 private:
     std::string mBackendLibName;
     std::vector<std::string> mUserListName;
-protected:
-    void *handle;
-    IInferenceEngineVision *engine;
+
+    int mCh;
+    int mDim;
+    cv::Size mInputSize;
+
+    double mDeviation;
+    double mMean;
+    double mThreshold;
+    int mOutputNumbers;
+    cv::Size mSourceSize;
+
+    cv::Mat mInputBuffer;
+    int mMatType;
+
+    InferenceEngineCommon *mCommonEngine; /**< InferenceEngineCommon is used to
+                                               perform the common inference operations */
 };
 
 } /* Vision */
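
As a hedged end-to-end usage sketch (file paths and parameter values are
placeholders; INFERENCE_TARGET_CPU is assumed from inference_target_type_e):

    InferenceEngineVision vision("tflite");
    vision.Init("model.cfg", "model.weights", "labels.txt"); // labels feed SetUserFile()
    vision.SetInputTensorParamInput(224, 224, 4, 3);         // width, height, dim, channels
    vision.SetInputTensorParamNorm(127.5, 127.5);            // deviation, mean
    vision.SetInputTensorParamNode("input");
    vision.SetOutputTensorParamNodes({"output"});
    vision.SetOutputTensorParamThresHold(0.5);
    vision.SetOutputTensorParamNumbers(5);
    vision.SetTargetDevice(INFERENCE_TARGET_CPU);
    vision.Load();
    vision.Run(cv::imread("image.jpg"));
    ImageClassificationResults results;
    vision.GetInferenceResult(results);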
index 801b0e6e41ef106ee6dc954d2244a07d39ed13f4..cb275763b9f157201e9b29f4f211141326e0703f 100644 (file)
@@ -1,7 +1,7 @@
 Name:        inference-engine-interface
 Summary:     Interface of inference engines
 Version:     0.0.1
-Release:     5
+Release:     6
 Group:       Multimedia/Framework
 License:     Apache-2.0
 Source0:     %{name}-%{version}.tar.gz
index ae6a2fdcf0cb1c077de8fa035132faede60f1d96..0bf5a37d1c9d624fb761f537033e91dfffe8d21c 100644 (file)
@@ -23,6 +23,10 @@
 #include <unistd.h>
 #include <time.h>
 #include <dlfcn.h>
+#include <fstream>
+#include <algorithm>
+#include <functional>
+#include <queue>
 
 extern "C" {
 
@@ -35,28 +36,48 @@ extern "C" {
 #define LOG_TAG "INFERENCE_ENGINE_VISION"
 }
 
+typedef enum  {
+  InputAttrNoType = 0,
+  InputAttrFloat32 = 1,
+  InputAttrInt32 = 2,
+  InputAttrUInt8 = 3,
+  InputAttrInt64 = 4,
+  InputAttrString = 5,
+  InputAttrBool = 6,
+} InputAttrType;
+
 namespace InferenceEngineInterface {
 namespace Vision {
-InferenceEngineVision::InferenceEngineVision(std::string backend) : Common::InferenceEngineCommon(backend)
+
+InferenceEngineVision::InferenceEngineVision(std::string backend) :
+    mCh(0),
+    mDim(0),
+    mInputSize(cv::Size()),
+    mDeviation(0.0),
+    mMean(0.0),
+    mThreshold(0.0),
+    mOutputNumbers(0),
+    mSourceSize(cv::Size()),
+    mInputBuffer(cv::Mat()),
+    mMatType(0),
+    mCommonEngine(nullptr)
 {
     LOGE("ENTER");
-    mBackendLibName = "libinference-engine-" + backend + ".so";
+
+    mCommonEngine = new InferenceEngineCommon(backend);
+
     LOGE("LEAVE");
 }
 
 InferenceEngineVision::~InferenceEngineVision()
 {
     LOGW("ENTER");
-    if (handle) {
-        destroy_t *engineDestroy = (destroy_t*)dlsym(handle, "EngineVisionDestroy");
-        engineDestroy(engine);
-        dlclose(handle);
-        engine = nullptr;
-        handle = nullptr;
 
-        Common::InferenceEngineCommon::handle = nullptr;
-        Common::InferenceEngineCommon::engine = nullptr;
+    if (mCommonEngine != nullptr) {
+        delete mCommonEngine;
+        mCommonEngine = nullptr;
     }
+
     LOGW("LEAVE");
 }
 
@@ -64,146 +85,427 @@ int InferenceEngineVision::Init(std::string configFile,
             std::string weightFile, std::string userFile)
 {
     LOGW("ENTER");
-    char *error = NULL;
-    handle = dlopen(mBackendLibName.c_str(), RTLD_LAZY);
-    LOGI("HANDLE : [%p]", handle);
 
-    if (!handle) {
-        LOGE("Fail to dlopen %s", mBackendLibName.c_str());
-        LOGE("Error: %s\n", dlerror());
-        return  INFERENCE_ENGINE_ERROR_NOT_SUPPORTED;
+    int ret = mCommonEngine->Init(configFile, weightFile);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("Fail to init");
+        return ret;
     }
 
-    init_t* EngineInit = (init_t *)dlsym(handle, "EngineVisionInit");
-    if ((error = dlerror()) != NULL) {
-        LOGE("Error: %s\n", error);
-        dlclose(handle);
-        return INFERENCE_ENGINE_ERROR_INTERNAL;
+    size_t userFileLength = userFile.length();
+    if (userFileLength > 0 && access(userFile.c_str(), F_OK)) {
+        LOGE("userFilePath in [%s] ", userFile.c_str());
+        return INFERENCE_ENGINE_ERROR_INVALID_PATH;
     }
 
-    engine = EngineInit(configFile, weightFile, userFile);
-    LOGI("dlopen %s", mBackendLibName.c_str());
+    ret = (userFileLength > 0) ? SetUserFile(userFile) : INFERENCE_ENGINE_ERROR_NONE;
+    if (ret != INFERENCE_ENGINE_ERROR_NONE)
+        LOGW("Fail to read categoryList");
+
+    LOGW("LEAVE");
+    return INFERENCE_ENGINE_ERROR_NONE;
+}
 
-    if (engine == NULL) {
-        LOGE("Fail to EngineInit");
-        dlclose(handle);
-        return INFERENCE_ENGINE_ERROR_INTERNAL;
+int InferenceEngineVision::SetUserFile(std::string filename)
+{
+    std::ifstream fp(filename.c_str());
+    if (!fp.is_open()) {
+        return INFERENCE_ENGINE_ERROR_INVALID_PATH;
     }
 
-    Common::InferenceEngineCommon::handle = handle;
-    Common::InferenceEngineCommon::engine = engine;
+    std::string userListName;
+    while (std::getline(fp, userListName)) {
+        if (userListName.length())
+            SetUserListName(userListName);
+    }
+
+    fp.close();
 
-    LOGW("LEAVE");
     return INFERENCE_ENGINE_ERROR_NONE;
 }
 
+void InferenceEngineVision::SetUserListName(std::string userlist)
+{
+    mUserListName.push_back(userlist);
+}
+
 void InferenceEngineVision::Deinit()
 {
-    ;
+    mCommonEngine->Deinit();
 }
 
 int InferenceEngineVision::SetInputTensorParamInput(int width, int height, int dim, int ch)
 {
-    int ret = engine->SetInputTensorParamInput(width, height, dim, ch);
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to SetInputTensorParamInput");
+    mCh = ch;
+    mDim = dim;
+    mInputSize = cv::Size(width, height);
 
-    return ret;
+    LOGI("InputSize is %d x %d\n", mInputSize.width, mInputSize.height);
+
+    return INFERENCE_ENGINE_ERROR_NONE;
 }
 
 int InferenceEngineVision::SetInputTensorParamNorm(double deviation, double mean)
 {
-    int ret = engine->SetInputTensorParamNorm(deviation, mean);
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to SetInputTensorParamNorm");
+    mDeviation = deviation;
+    mMean = mean;
+
+    LOGI("mean %.4f, deviation %.4f", mMean, mDeviation);
 
+    return INFERENCE_ENGINE_ERROR_NONE;
+}
+
+int InferenceEngineVision::SetInputTensorParamNode(std::string node)
+{
+    LOGE("ENTER");
+    int ret = mCommonEngine->SetInputTensorParamNode(node);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE)
+        LOGE("Fail to SetInputTensorParamNode");
+    LOGE("LEAVE");
     return ret;
 }
 
-int InferenceEngineVision::SetOutputTensorParamThresHold(double threshold)
+int InferenceEngineVision::SetTargetDevice(inference_target_type_e type)
 {
-    int ret = engine->SetOutputTensorParamThresHold(threshold);
+    int ret = mCommonEngine->SetTargetDevice(type);
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to SetOutputTensorParamThresHold");
+        LOGE("Fail to SetTargetDevice");
 
     return ret;
 }
 
+int InferenceEngineVision::SetOutputTensorParamThresHold(double threshold)
+{
+    mThreshold = threshold;
+
+    LOGI("threshold %.4f", mThreshold);
+
+    return INFERENCE_ENGINE_ERROR_NONE;
+}
+
 int InferenceEngineVision::SetOutputTensorParamNumbers(int numbers)
 {
-    int ret = engine->SetOutputTensorParamNumbers(numbers);
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to SetOuputTensorParamNumbers");
+    mOutputNumbers = numbers;
 
-    return ret;
+    LOGI("outputNumber %d", mOutputNumbers);
+
+    return INFERENCE_ENGINE_ERROR_NONE;
 }
 
-int InferenceEngineVision::SetOutputTensorParamType(int type)
+int InferenceEngineVision::SetOutputTensorParamNodes(std::vector<std::string> nodes)
 {
-    int ret = engine->SetOutputTensorParamType(type);
+    LOGI("ENTER");
+    int ret = mCommonEngine->SetOutputTensorParamNodes(nodes);
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to SetOutputTensorParamType");
+        LOGE("Fail to SetOutputTensorParamNodes");
+    LOGI("LEAVE");
+    return ret;
+}
+
+int InferenceEngineVision::Load()
+{
+    LOGI("ENTER");
+    int ret = mCommonEngine->Load();
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("Fail to load InferenceEngineVision");
+        return ret;
+    }
+
+    // Get the input layer type, then wrap the engine's input buffer in mInputBuffer.
+    InputAttrType attrType = static_cast<InputAttrType>(mCommonEngine->GetInputLayerAttrType());
+    if (attrType == InputAttrUInt8) {
+        mMatType = CV_8UC3;
+        LOGI("InputType is UINT8");
+    }
+    else if (attrType == InputAttrFloat32) {
+        mMatType = CV_32FC3;
+        LOGI("InputType FLOAT32");
+    }
+    else {
+        LOGE("Not supported");
+        ret = INFERENCE_ENGINE_ERROR_NOT_SUPPORTED_FORMAT;
+        return ret;
+    }
+
+    tensor_t inputData;
+    std::vector<int> info{1, mMatType, mInputSize.height, mInputSize.width};
+    inputData.dimInfo.push_back(info);
+
+    // Some plug-ins (e.g. OpenCV) don't allocate memory for the input while
+    // loading models, but others (e.g. TFLite) do. Thus, SetInputDataBuffer()
+    // is implemented in plug-ins such as OpenCV, but left empty in plug-ins
+    // such as TFLite.
+    ret = mCommonEngine->SetInputDataBuffer(inputData);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("Fail to SetInputData");
+        return ret;
+    }
+
+    void *dataPtr = mCommonEngine->GetInputDataPtr();
+    if (dataPtr == nullptr) {
+        LOGE("input data address is null");
+        return INFERENCE_ENGINE_ERROR_INTERNAL;
+    }
+
+    mInputBuffer = cv::Mat(mInputSize.height, mInputSize.width, mMatType, dataPtr);
 
     return ret;
 }
 
+int InferenceEngineVision::SetInput(cv::Mat cvImg)
+{
+    mSourceSize = cvImg.size();
+    int width = mInputSize.width;
+    int height = mInputSize.height;
+
+    // Pre-process: color conversion, resize, type conversion, normalization.
+    cv::Mat sample;
+    if (cvImg.channels() == 3 && mCh == 1)
+        cv::cvtColor(cvImg, sample, cv::COLOR_BGR2GRAY);
+    else
+        sample = cvImg;
+
+    // size
+    cv::Mat sampleResized;
+    if (sample.size() != cv::Size(width, height))
+        cv::resize(sample, sampleResized, cv::Size(width, height));
+    else
+        sampleResized = sample;
+
+    // type
+    cv::Mat sampleFloat;
+    if (mCh == 3)
+        sampleResized.convertTo(sampleFloat, CV_32FC3);
+    else
+        sampleResized.convertTo(sampleFloat, CV_32FC1);
+
+    // normalize
+    cv::Mat sampleNormalized;
+    cv::Mat meanMat;
+    if (mCh == 3)
+        meanMat = cv::Mat(sampleFloat.size(), CV_32FC3, cv::Scalar((float)mMean, (float)mMean, (float)mMean));
+    else
+        meanMat = cv::Mat(sampleFloat.size(), CV_32FC1, cv::Scalar((float)mMean));
+
+    cv::subtract(sampleFloat, meanMat, sampleNormalized);
+
+    sampleNormalized /= (float)mDeviation;
+
+    sampleNormalized.convertTo(mInputBuffer, mMatType);
+
+    return INFERENCE_ENGINE_ERROR_NONE;
+}
+
 int InferenceEngineVision::Run(cv::Mat tensor)
 {
-    int ret = engine->Run(tensor);
+    LOGI("ENTER");
+    int ret = SetInput(tensor);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE)
+        LOGE("Fail to SetInput InferenceEngineVision");
+
+    ret = mCommonEngine->Run();
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
         LOGE("Fail to run InferenceEngineVision");
 
+    LOGI("LEAVE");
     return ret;
 }
 
 int InferenceEngineVision::GetInferenceResult(ImageClassificationResults& results)
 {
-    int ret = engine->GetInferenceResult(results);
+    // Will contain the top N results, sorted into descending order below.
+    std::vector<std::pair<float, int>> top_results;
+    std::priority_queue<std::pair<float, int>,
+        std::vector<std::pair<float, int>>,
+        std::greater<std::pair<float, int>>> top_result_pq;
+    float value;
+
+    tensor_t outputData;
+    int ret = mCommonEngine->GetInferenceResult(outputData);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("fail to GetInferenceResults with ImageClassificationResults");
+        return ret;
+    }
+
+    std::vector<std::vector<int>> inferDimInfo(outputData.dimInfo);
+    std::vector<void*> inferResults(outputData.data.begin(), outputData.data.end());
+
+    long count = inferDimInfo[0][1];
+    LOGI("count: %ld", count);
+
+    float *prediction = reinterpret_cast<float*>(inferResults[0]);
+    for (int i = 0; i < count; ++i) {
+        value = prediction[i];
+        // Push every value; the threshold is applied when copying out below.
+        top_result_pq.push(std::pair<float, int>(value, i));
+
+        // If at capacity, kick the smallest value out.
+        if (top_result_pq.size() > (size_t)mOutputNumbers) {
+            top_result_pq.pop();
+        }
+    }
+
+    // Copy to output vector and reverse into descending order.
+    while (!top_result_pq.empty()) {
+        top_results.push_back(top_result_pq.top());
+        top_result_pq.pop();
+    }
+    std::reverse(top_results.begin(), top_results.end());
+
+    int classIdx = -1;
+    results.number_of_classes = 0;
+    for (int idx = 0; idx < (int)top_results.size(); ++idx) {
+        if (top_results[idx].first < mThreshold)
+            continue;
+        LOGI("idx:%d", idx);
+        LOGI("classIdx: %d", top_results[idx].second);
+        LOGI("classProb: %f", top_results[idx].first);
+
+        classIdx = top_results[idx].second;
+        results.indices.push_back(classIdx);
+        results.confidences.push_back(top_results[idx].first);
+        results.names.push_back(mUserListName[classIdx]);
+        results.number_of_classes++;
+    }
 
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to GetClassficationResults");
-    // NULL CHECK?
     return ret;
 }
 
 int InferenceEngineVision::GetInferenceResult(ObjectDetectionResults& results)
 {
-    int ret = engine->GetInferenceResult(results);
+    tensor_t outputData;
+    int ret = mCommonEngine->GetInferenceResult(outputData);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("fail to GetInferenceResults with ObjectDetectionResults");
+        return ret;
+    }
 
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to GetObjectDetectionResults");
+    std::vector<std::vector<int>> inferDimInfo(outputData.dimInfo);
+    std::vector<void*> inferResults(outputData.data.begin(), outputData.data.end());
+
+    float* boxes = reinterpret_cast<float*>(inferResults[0]);
+    float* classes = reinterpret_cast<float*>(inferResults[1]);
+    float* scores = reinterpret_cast<float*>(inferResults[2]);
+    int number_of_detections = (int)(*reinterpret_cast<float*>(inferResults[3]));
+
+    int left, top, right, bottom;
+    cv::Rect loc;
+
+    results.number_of_objects = 0;
+    for (int idx = 0; idx < number_of_detections; ++idx) {
+        if (scores[idx] < mThreshold)
+            continue;
+
+        left =   (int)(boxes[idx*4 + 1] * mSourceSize.width);
+        top  =   (int)(boxes[idx*4 + 0] * mSourceSize.height);
+        right  = (int)(boxes[idx*4 + 3] * mSourceSize.width);
+        bottom = (int)(boxes[idx*4 + 2] * mSourceSize.height);
+
+        loc.x = left;
+        loc.y = top;
+        loc.width = right - left + 1;
+        loc.height = bottom - top + 1;
+
+        results.indices.push_back((int)classes[idx]);
+        results.confidences.push_back(scores[idx]);
+        results.names.push_back(mUserListName[(int)classes[idx]]);
+        results.locations.push_back(loc);
+        results.number_of_objects++;
+
+        LOGI("objectClass: %d", (int)classes[idx]);
+        LOGI("confidence:%f", scores[idx]);
+        LOGI("left:%d, top:%d, right:%d, bottom:%d", left, top, right, bottom);
+    }
 
     return ret;
 }
 
 int InferenceEngineVision::GetInferenceResult(FaceDetectionResults& results)
 {
-    int ret = engine->GetInferenceResult(results);
+    tensor_t outputData;
+    int ret = mCommonEngine->GetInferenceResult(outputData);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("fail to GetInferenceResults with FaceDetectionResults");
+        return ret;
+    }
 
-    if (ret != INFERENCE_ENGINE_ERROR_NONE)
-        LOGE("Fail to GetFaceDetectionResults");
+    std::vector<std::vector<int>> inferDimInfo(outputData.dimInfo);
+    std::vector<void*> inferResults(outputData.data.begin(), outputData.data.end());
+
+    float* boxes = reinterpret_cast<float*>(inferResults[0]);
+    float* classes = reinterpret_cast<float*>(inferResults[1]);
+    float* scores = reinterpret_cast<float*>(inferResults[2]);
+
+    int number_of_detections = (int)(*reinterpret_cast<float*>(inferResults[3]));
+    int left, top, right, bottom;
+    cv::Rect loc;
+
+    results.number_of_faces = 0;
+    for (int idx = 0; idx < number_of_detections; ++idx) {
+        if (scores[idx] < mThreshold)
+            continue;
+
+        left =   (int)(boxes[idx*4 + 1] * mSourceSize.width);
+        top  =   (int)(boxes[idx*4 + 0] * mSourceSize.height);
+        right  = (int)(boxes[idx*4 + 3] * mSourceSize.width);
+        bottom = (int)(boxes[idx*4 + 2] * mSourceSize.height);
+
+        loc.x = left;
+        loc.y = top;
+        loc.width = right - left + 1;
+        loc.height = bottom - top + 1;
+
+        results.confidences.push_back(scores[idx]);
+        results.locations.push_back(loc);
+        results.number_of_faces++;
+
+        LOGI("confidence:%f", scores[idx]);
+        LOGI("class: %f", classes[idx]);
+        LOGI("left:%f, top:%f, right:%f, bottom:%f", boxes[idx*4 + 1], boxes[idx*4 + 0], boxes[idx*4 + 3], boxes[idx*4 + 2]);
+        LOGI("left:%d, top:%d, right:%d, bottom:%d", left, top, right, bottom);
+    }
 
     return ret;
 }
 
 int InferenceEngineVision::GetInferenceResult(FacialLandMarkDetectionResults& results)
 {
-    int ret = engine->GetInferenceResult(results);
+
+    tensor_t outputData;
+    int ret = mCommonEngine->GetInferenceResult(outputData);
+    if (ret != INFERENCE_ENGINE_ERROR_NONE) {
+        LOGE("fail to GetInferenceResults with FacialLandMarkDetectionResults");
+        return ret;
+    }
+
+    std::vector<std::vector<int>> inferDimInfo(outputData.dimInfo);
+    std::vector<void*> inferResults(outputData.data.begin(), outputData.data.end());
+
+    long number_of_detections = inferDimInfo[0][1];
+    float* loc = reinterpret_cast<float*>(inferResults[0]);
+
     if (ret != INFERENCE_ENGINE_ERROR_NONE)
         LOGE("Fail to GetFacialLandMarkDetectionResults");
 
-    return ret;
-}
+    cv::Point point(0,0);
+    results.number_of_landmarks = 0;
+    LOGI("imgW:%d, imgH:%d", mSourceSize.width, mSourceSize.height);
+    for (int idx = 0; idx < number_of_detections; idx += 2) {
+        point.x = (int)(loc[idx] * mSourceSize.width);
+        point.y = (int)(loc[idx+1] * mSourceSize.height);
 
-int InferenceEngineVision::GetNumberOfOutputs()
-{
-    return engine->GetNumberOfOutputs();
-}
+        results.locations.push_back(point);
+        results.number_of_landmarks++;
 
-void InferenceEngineVision::SetUserListName(std::string userlist)
-{
-    ;
+        LOGI("x:%d, y:%d", point.x, point.y);
+    }
+
+    return ret;
 }
+
 } /* Vision */
 } /* InferenceEngineInterface */