Add NNFW runtime support 68/236168/4
author      Inki Dae <inki.dae@samsung.com>
            Mon, 15 Jun 2020 09:25:23 +0000 (18:25 +0900)
committer   Inki Dae <inki.dae@samsung.com>
            Tue, 16 Jun 2020 06:56:47 +0000 (15:56 +0900)
This patch drops the fixed values that were used so far so that the
NNFW runtime can be supported. To do so, it updates the tensor buffer
information according to a given model and adds a ConvertTensorType
function, which converts an NNStreamer tensor data type to the
corresponding MediaVision inference engine one.

Change-Id: I28d80698feebe9efbb076bb8d979b0ce0d849fee
Signed-off-by: Inki Dae <inki.dae@samsung.com>
src/inference_engine_mlapi.cpp
src/inference_engine_mlapi_private.h
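
The gist of the change, sketched outside the patch: instead of filling
inference_engine_tensor_info with hard-coded values, the plugin now asks
the ML Single API for the tensor layout of the loaded model. The snippet
below is a minimal, standalone illustration of that query flow, assuming
a placeholder model path ("model.tflite") and abbreviated error handling;
it is not code from this patch.

    #include <cstdio>

    #include <nnstreamer.h>
    #include <nnstreamer-single.h>

    int main()
    {
        ml_single_h single_h = NULL;
        ml_tensors_info_h in_info = NULL;

        // Open the model through the NNFW tensor filter.
        int ret = ml_single_open(&single_h, "model.tflite", NULL, NULL,
                                 ML_NNFW_TYPE_NNFW, ML_NNFW_HW_ANY);
        if (ret != ML_ERROR_NONE)
            return -1;

        // Query the input tensor layout from the model itself.
        if (ml_single_get_input_info(single_h, &in_info) == ML_ERROR_NONE) {
            unsigned int cnt = 0;

            ml_tensors_info_get_count(in_info, &cnt);

            for (unsigned int i = 0; i < cnt; ++i) {
                ml_tensor_type_e type;
                unsigned int dim[ML_TENSOR_RANK_LIMIT];
                size_t elems = 1;

                ml_tensors_info_get_tensor_type(in_info, i, &type);
                ml_tensors_info_get_tensor_dimension(in_info, i, dim);

                // Element count is the product of all rank slots.
                for (unsigned int d = 0; d < ML_TENSOR_RANK_LIMIT; ++d)
                    elems *= dim[d];

                std::printf("tensor %u: type %d, %zu elements\n",
                            i, static_cast<int>(type), elems);
            }

            ml_tensors_info_destroy(in_info);
        }

        ml_single_close(single_h);

        return 0;
    }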

index ddb650707dd1622500cdbc2aff067932c940d6b3..7052b75763a036e5bcd94d756566bdaa7a7bd490 100644 (file)
@@ -52,6 +52,8 @@ namespace MLAPIImpl
 
                mDesignated_outputs.clear();
                std::vector<std::string>().swap(mDesignated_outputs);
+
+               ml_single_close(mSingle);
        }
 
        int InferenceMLAPI::SetPrivateData(void *data)
@@ -103,7 +105,7 @@ namespace MLAPIImpl
        {
                LOGI("ENTER");
 
-               std::string model_str("");
+               std::string model_str(model_paths[0]);
 
                // TODO. Set NNFW backend type and HW type properly.
 
@@ -127,7 +129,7 @@ namespace MLAPIImpl
 
                        // ML Single API of MLAPI requires model_paths rule like below,
                        // "so library file path,nb model file path" or vise versa.
-                       model_str += model_paths[0] + "," + model_paths[1];
+                       model_str += "," + model_paths[1];
                        break;
                case INFERENCE_BACKEND_NNFW:
                        nnfw_type = ML_NNFW_TYPE_NNFW;
@@ -143,7 +145,6 @@ namespace MLAPIImpl
                                return INFERENCE_ENGINE_ERROR_INVALID_PARAMETER;
                        }
 
-                       model_str += model_paths[0];
                        LOGI("NNFW tensor filter will be used.");
                        break;
                // TODO.
@@ -186,22 +187,7 @@ namespace MLAPIImpl
        {
                LOGI("ENTER");
 
-               // Output tensor buffers will be allocated by a backend plugin of ML Single API of nnstreamer
-               // So add a null tensor buffer object. This buffer will be updated at Run callback.
-
-               // Caution. this tensor buffer will be checked by upper framework to verity if
-               //                      the tensor buffer object is valid or not so fill dummy data to the tensor buffer.
-
-               // TODO. Consider multiple output tensors.
-
-               inference_engine_tensor_buffer tensor_buf = {
-                       0,
-               };
-               tensor_buf.data_type = INFERENCE_TENSOR_DATA_TYPE_FLOAT16;
-               tensor_buf.buffer = (void *) 1;
-               tensor_buf.size = 1;
-               tensor_buf.owner_is_backend = 1;
-               buffers.push_back(tensor_buf);
+               // TODO. Implement this function according to a given ML Single API backend properly.
 
                LOGI("LEAVE");
 
@@ -233,10 +219,11 @@ namespace MLAPIImpl
                LOGI("input tensor count = %u", cnt);
 
                for (unsigned int i = 0; i < cnt; ++i) {
+                       inference_engine_tensor_info tensor_info;
                        ml_tensor_type_e in_type;
-                       unsigned int in_dim;
+                       unsigned int in_dim[ML_TENSOR_RANK_LIMIT];
                        char *in_name = NULL;
-                       size_t in_size;
+                       size_t in_size = 1;
 
                        ret = ml_tensors_info_get_tensor_type(in_info, i, &in_type);
                        if (ret != ML_ERROR_NONE) {
@@ -247,14 +234,26 @@ namespace MLAPIImpl
 
                        LOGI("input tensor type = %d", in_type);
 
-                       ret = ml_tensors_info_get_tensor_dimension(in_info, i, &in_dim);
+                       int type = ConvertTensorType(in_type);
+                       if (type == -1) {
+                               return INFERENCE_ENGINE_ERROR_NOT_SUPPORTED;
+                       }
+
+                       ret = ml_tensors_info_get_tensor_dimension(in_info, i, in_dim);
                        if (ret != ML_ERROR_NONE) {
                                LOGE("Failed to request ml_tensors_info_get_tensor_dimension(%d).",
                                         ret);
                                return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
                        }
 
-                       LOGI("input tensor dimension = %u", in_dim);
+                       LOGI("Input tensor dimension:");
+                       for (unsigned int shape_idx = 0; shape_idx < ML_TENSOR_RANK_LIMIT; ++shape_idx) {
+                               tensor_info.shape.push_back(in_dim[shape_idx]);
+                               in_size *= static_cast<size_t>(in_dim[shape_idx]);
+                               LOGI("%u", in_dim[shape_idx]);
+                       }
+
+                       LOGI("input tensor size = %zu", in_size);
 
                        ret = ml_tensors_info_get_tensor_name(in_info, i, &in_name);
                        if (ret != ML_ERROR_NONE) {
@@ -265,27 +264,16 @@ namespace MLAPIImpl
 
                        LOGI("input tensor name = %s", in_name);
 
-                       ret = ml_tensors_info_get_tensor_size(in_info, i, &in_size);
-                       if (ret != ML_ERROR_NONE) {
-                               LOGE("Failed to request ml_tensors_info_get_tensor_size(%d).",
-                                        ret);
-                               return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
-                       }
+                       tensor_info.data_type = static_cast<inference_tensor_data_type_e>(type);
+                       tensor_info.size = in_size;
 
-                       LOGI("input tensor size = %u", in_size);
+                       property.tensor_infos.push_back(tensor_info);
 
                        // TODO. Compare tensor info from engine to one from a given property.
                }
 
                property.layer_names = mInputProperty.layer_names;
 
-               std::vector<inference_engine_tensor_info>::iterator iter;
-               for (iter = mInputProperty.tensor_infos.begin();
-                        iter != mInputProperty.tensor_infos.end(); iter++) {
-                       inference_engine_tensor_info tensor_info = *iter;
-                       property.tensor_infos.push_back(tensor_info);
-               }
-
                LOGI("LEAVE");
 
                return INFERENCE_ENGINE_ERROR_NONE;
@@ -296,16 +284,95 @@ namespace MLAPIImpl
        {
                LOGI("ENTER");
 
-               property.layer_names = mOutputProperty.layer_names;
+               ml_tensors_info_h out_info = NULL;
+
+               // TODO. Need to check if model file loading is done.
+
+               int ret = ml_single_get_output_info(mSingle, &out_info);
+               if (ret != ML_ERROR_NONE) {
+                       LOGE("Failed to request ml_single_get_output_info(%d).", ret);
+                       return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
+               }
+
+               unsigned int cnt;
+               ret = ml_tensors_info_get_count(out_info, &cnt);
+               if (ret != ML_ERROR_NONE) {
+                       LOGE("Failed to request ml_tensors_info_get_count(%d).", ret);
+                       return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
+               }
+
+               LOGI("output tensor count = %u", cnt);
+
+               for (unsigned int i = 0; i < cnt; ++i) {
+                       inference_engine_tensor_info tensor_info;
+                       ml_tensor_type_e out_type;
+                       unsigned int out_dim[ML_TENSOR_RANK_LIMIT];
+                       char *out_name = NULL;
+                       size_t out_size = 1;
+
+                       ret = ml_tensors_info_get_tensor_type(out_info, i, &out_type);
+                       if (ret != ML_ERROR_NONE) {
+                               LOGE("Failed to request ml_tensors_info_get_tensor_type(%d).",
+                                        ret);
+                               return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
+                       }
+
+                       LOGI("output tensor type = %d", out_type);
 
-               inference_engine_tensor_info tensor_info;
+                       int type = ConvertTensorType(out_type);
+                       if (type == -1) {
+                               return INFERENCE_ENGINE_ERROR_NOT_SUPPORTED;
+                       }
+
+                       ret = ml_tensors_info_get_tensor_dimension(out_info, i, out_dim);
+                       if (ret != ML_ERROR_NONE) {
+                               LOGE("Failed to request ml_tensors_info_get_tensor_dimension(%d).",
+                                        ret);
+                               return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
+                       }
+
+                       int shape_size = 0;
+
+                       LOGI("Output tensor dimension:");
+
+                       for (unsigned int shape_idx = 0; shape_idx < ML_TENSOR_RANK_LIMIT; ++shape_idx) {
+                               out_size *= static_cast<size_t>(out_dim[shape_idx]);
 
-               // TODO. Set tensor info from a given ML Single API of nnstreamer backend instead of fixed one.
+                               if (out_dim[shape_idx] == 1 && shape_size == 0)
+                                       shape_size = shape_idx;
 
-               tensor_info.data_type = INFERENCE_TENSOR_DATA_TYPE_FLOAT16;
-               tensor_info.shape = { 1, 1001 };
-               tensor_info.size = 1001;
-               property.tensor_infos.push_back(tensor_info);
+                               LOGI("%d", out_dim[shape_idx]);
+                       }
+
+                       LOGI("Shape size of output tensor : %d", shape_size);
+                       LOGI("Reversed output tensor dimension:");
+
+                       // Reverse shape order.
+                       for (int idx = shape_size; idx >= 0; --idx) {
+                               tensor_info.shape.push_back(out_dim[idx]);
+                               LOGI("%u", out_dim[idx]);
+                       }
+
+                       LOGI("output tensor size = %zu", out_size);
+
+                       ret = ml_tensors_info_get_tensor_name(out_info, i, &out_name);
+                       if (ret != ML_ERROR_NONE) {
+                               LOGE("Failed to request ml_tensors_info_get_tensor_name(%d).",
+                                        ret);
+                               return INFERENCE_ENGINE_ERROR_INVALID_OPERATION;
+                       }
+
+                       LOGI("output tensor name = %s", out_name);
+
+                       tensor_info.data_type = static_cast<inference_tensor_data_type_e>(type);
+                       tensor_info.size = out_size;
+
+                       property.tensor_infos.push_back(tensor_info);
+
+                       // TODO. Compare tensor info from engine to one from a given property.
+               }
+
+               property.layer_names = mOutputProperty.layer_names;
 
                LOGI("LEAVE");
 
@@ -397,6 +464,27 @@ namespace MLAPIImpl
                return INFERENCE_ENGINE_ERROR_NONE;
        }
 
+       int InferenceMLAPI::ConvertTensorType(int tensor_type)
+       {
+               LOGI("ENTER");
+
+               switch (tensor_type) {
+               case ML_TENSOR_TYPE_FLOAT32:
+                       return INFERENCE_TENSOR_DATA_TYPE_FLOAT32;
+               case ML_TENSOR_TYPE_UINT8:
+                       return INFERENCE_TENSOR_DATA_TYPE_UINT8;
+               case ML_TENSOR_TYPE_UINT16:
+                       return INFERENCE_TENSOR_DATA_TYPE_UINT16;
+               default:
+                       LOGE("Tensor type(%d) is invalid.", tensor_type);
+                       return -1;
+               }
+
+               LOGI("LEAVE");
+
+               return -1;
+       }
+
        int InferenceMLAPI::Run(
                        std::vector<inference_engine_tensor_buffer> &input_buffers,
                        std::vector<inference_engine_tensor_buffer> &output_buffers)
@@ -462,7 +550,6 @@ namespace MLAPIImpl
                }
 
                LOGI("Output tensor = %u", output_buffers[0].size);
-
                LOGI("LEAVE");
 
                return INFERENCE_ENGINE_ERROR_NONE;
index 91b1ab2a31b6baab8fa1ec1fdef1a9eede591673..6612eb763171de5b5bfbf880ac97bb82272a6c89 100644 (file)
@@ -76,6 +76,7 @@ namespace MLAPIImpl
                int CheckTensorBuffers(
                                std::vector<inference_engine_tensor_buffer> &input_buffers,
                                std::vector<inference_engine_tensor_buffer> &output_buffers);
+               int ConvertTensorType(int tensor_type);
 
                int mPluginType;
                int mTargetDevice;
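
For context, the conversion pattern that ConvertTensorType() introduces can
be reduced to the standalone sketch below: each NNStreamer tensor type is
mapped to the engine's data type, and an out-of-band value (-1) marks types
without a counterpart so that callers can bail out with
INFERENCE_ENGINE_ERROR_NOT_SUPPORTED. The enum values here are simplified
stand-ins, not the real definitions from the ML API or inference engine
headers.

    #include <cstdio>

    // Simplified stand-ins for ml_tensor_type_e and
    // inference_tensor_data_type_e.
    enum SketchMlType { SK_ML_FLOAT32, SK_ML_UINT8, SK_ML_UINT16, SK_ML_INT64 };
    enum SketchEngineType { SK_ENGINE_FLOAT32, SK_ENGINE_UINT8, SK_ENGINE_UINT16 };

    // Return the engine data type for a supported NNStreamer type,
    // or -1 so the caller can reject unsupported tensors.
    static int ConvertTensorTypeSketch(int ml_type)
    {
        switch (ml_type) {
        case SK_ML_FLOAT32:
            return SK_ENGINE_FLOAT32;
        case SK_ML_UINT8:
            return SK_ENGINE_UINT8;
        case SK_ML_UINT16:
            return SK_ENGINE_UINT16;
        default:
            return -1;
        }
    }

    int main()
    {
        std::printf("UINT8 -> %d\n", ConvertTensorTypeSketch(SK_ML_UINT8));
        std::printf("INT64 -> %d\n", ConvertTensorTypeSketch(SK_ML_INT64));
        return 0;
    }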