}
};
-enum class ResultType { NONE, OBJECT_DETECTION, FACE_DETECTION, FACE_LANDMARK };
+// Tag stored in BaseResultType::_type; IMAGE_CLASSIFICATION is the tag IcResultType passes to its base.
+enum class ResultType { NONE, OBJECT_DETECTION, FACE_DETECTION, FACE_LANDMARK, IMAGE_CLASSIFICATION };
struct BaseResultType {
ResultType _type { ResultType::NONE };
}
};
+/**
+ * Result holder for image classification: a list of label strings, tagged
+ * with ResultType::IMAGE_CLASSIFICATION in the base part.
+ */
+struct IcResultType : public BaseResultType {
+	std::vector<std::string> _labels;
+
+	IcResultType() : BaseResultType(ResultType::IMAGE_CLASSIFICATION)
+	{}
+
+	/** Returns a shared copy of this result, typed as the base class. */
+	std::shared_ptr<BaseResultType> clone() override
+	{
+		std::shared_ptr<BaseResultType> copied = std::make_shared<IcResultType>(*this);
+		return copied;
+	}
+};
+
enum class ServiceType { NONE, AUTO_ZOOM };
enum class InputFeedType { NONE, CAMERA, SCREEN_CAPTURE };
--- /dev/null
+/**
+ * Copyright (c) 2024 Samsung Electronics Co., Ltd All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#ifndef __MV_IMAGE_CLASSIFICATION_H__
+#define __MV_IMAGE_CLASSIFICATION_H__
+
+#include "IInferenceTaskInterface.h"
+#include "mv_image_classification_internal.h"
+#include "SingleoCommonTypes.h"
+
+namespace singleo
+{
+namespace inference
+{
+namespace backends
+{
+/**
+ * Image classification inference task implemented on top of the
+ * mv_image_classification C API.
+ *
+ * The object owns the native handle: it is created in the constructor and
+ * destroyed in the destructor. Copying is therefore disabled, because a copy
+ * would hand the same handle to mv_image_classification_destroy() twice.
+ */
+class MvImageClassification : public IInferenceTaskInterface
+{
+private:
+	mv_image_classification_h _handle {}; // native handle owned by this object
+	IcResultType _output_data {}; // storage behind the reference returned by result()
+
+public:
+	/** Creates the native handle; throws std::runtime_error on failure. */
+	MvImageClassification();
+	virtual ~MvImageClassification();
+
+	// Non-copyable: the handle has exactly one owner.
+	MvImageClassification(const MvImageClassification &) = delete;
+	MvImageClassification &operator=(const MvImageClassification &) = delete;
+
+	/** Configures the native handle; throws std::runtime_error on failure. */
+	void configure() override;
+
+	/** Prepares the native handle; throws std::runtime_error on failure. */
+	void prepare() override;
+
+	/**
+	 * Runs inference on the given input.
+	 *
+	 * @param input Must be an ImageDataType whose _data_type is DataType::IMAGE.
+	 * @param async Not read by this backend.
+	 * @throws std::invalid_argument if the data type is not DataType::IMAGE.
+	 * @throws std::runtime_error may be thrown when a Media Vision call fails.
+	 */
+	void invoke(BaseDataType &input, bool async) override;
+
+	/**
+	 * Queries the handle for the latest labels and frame number.
+	 *
+	 * @return Reference to a member of this object; it is overwritten by the
+	 *         next call and must not outlive this object.
+	 * @throws std::runtime_error if the result cannot be fetched.
+	 */
+	BaseResultType &result() override;
+};
+
+} // backends
+} // inference
+} // singleo
+
+#endif
--- /dev/null
+/**
+ * Copyright (c) 2024 Samsung Electronics Co., Ltd All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <stdexcept>
+#include "MvImageClassification.h"
+#include "SingleoLog.h"
+
+using namespace std;
+
+namespace singleo
+{
+namespace inference
+{
+namespace backends
+{
+/**
+ * Creates the native image classification handle.
+ *
+ * @throws std::runtime_error if mv_image_classification_create() returns
+ *         anything other than MEDIA_VISION_ERROR_NONE.
+ */
+MvImageClassification::MvImageClassification()
+{
+	if (mv_image_classification_create(&_handle) != MEDIA_VISION_ERROR_NONE)
+		throw std::runtime_error("Fail to create image classification handle.");
+}
+
+/**
+ * Releases the native image classification handle.
+ *
+ * A destructor must not throw, so a failed release is only logged.
+ */
+MvImageClassification::~MvImageClassification()
+{
+	const int ret = mv_image_classification_destroy(_handle);
+	if (ret != MEDIA_VISION_ERROR_NONE) {
+		SINGLEO_LOGE("Fail to destroy image classification handle (%d).", ret);
+	}
+}
+
+/**
+ * Runs the configure step on the image classification handle.
+ *
+ * @throws std::runtime_error if mv_image_classification_configure() returns
+ *         anything other than MEDIA_VISION_ERROR_NONE.
+ */
+void MvImageClassification::configure()
+{
+	const bool configured = mv_image_classification_configure(_handle) == MEDIA_VISION_ERROR_NONE;
+
+	if (!configured)
+		throw std::runtime_error("Fail to configure image classification.");
+}
+
+/**
+ * Runs the prepare step on the image classification handle.
+ *
+ * @throws std::runtime_error if mv_image_classification_prepare() returns
+ *         anything other than MEDIA_VISION_ERROR_NONE.
+ */
+void MvImageClassification::prepare()
+{
+	const int status = mv_image_classification_prepare(_handle);
+
+	if (status == MEDIA_VISION_ERROR_NONE)
+		return;
+
+	throw std::runtime_error("Fail to prepare image classification.");
+}
+
+/**
+ * Runs image classification on the given input through
+ * mv_image_classification_inference().
+ *
+ * The pixel buffer is wrapped in a temporary Media Vision source, which is
+ * released on every path out of this function. A failure while filling the
+ * source or running inference is logged and then propagated to the caller,
+ * so a failed call is never reported as success.
+ *
+ * @param input Must be an ImageDataType whose _data_type is DataType::IMAGE.
+ *              NOTE(review): the source is always filled as RGB888 while the
+ *              buffer size is computed from byte_per_pixel - confirm callers
+ *              only pass 3-byte-per-pixel RGB data.
+ * @param async Not read here; the same inference call is used either way.
+ * @throws std::bad_cast if input is not an ImageDataType.
+ * @throws std::invalid_argument if the data type is not DataType::IMAGE.
+ * @throws std::runtime_error if any Media Vision call fails.
+ */
+void MvImageClassification::invoke(BaseDataType &input, bool async)
+{
+	ImageDataType &data = dynamic_cast<ImageDataType &>(input);
+
+	if (data._data_type != DataType::IMAGE) {
+		SINGLEO_LOGE("Invalid input type.");
+		throw std::invalid_argument("Input type not support.");
+	}
+
+	mv_source_h mv_src {};
+
+	int ret = mv_create_source(&mv_src);
+	if (ret != MEDIA_VISION_ERROR_NONE)
+		throw std::runtime_error("Fail to create mv source.");
+
+	try {
+		ret = mv_source_fill_by_buffer(mv_src, data.ptr, data.width * data.height * data.byte_per_pixel, data.width,
+									   data.height, MEDIA_VISION_COLORSPACE_RGB888);
+		if (ret != MEDIA_VISION_ERROR_NONE)
+			throw std::runtime_error("Fail to convert to mv source.");
+
+		ret = mv_image_classification_inference(_handle, mv_src);
+		if (ret != MEDIA_VISION_ERROR_NONE)
+			throw std::runtime_error("Fail to invoke image classification.");
+	} catch (const std::runtime_error &e) {
+		SINGLEO_LOGE("%s", e.what());
+		// Release the source before propagating; its own status is ignored so
+		// the caller sees the original failure.
+		mv_destroy_source(mv_src);
+		throw;
+	}
+
+	ret = mv_destroy_source(mv_src);
+	if (ret != MEDIA_VISION_ERROR_NONE)
+		throw std::runtime_error("Fail to destroy mv source.");
+}
+
+/**
+ * Fetches the current classification labels and frame number from the handle.
+ *
+ * Labels are collected into a local vector first and swapped into the member
+ * only after every label has been read, so a failure part-way through leaves
+ * the previously stored result untouched.
+ *
+ * @return Reference to the internal result object; it is overwritten by the
+ *         next call and must not outlive this object.
+ * @throws std::runtime_error if the result count or a label cannot be
+ *         fetched, or if a label comes back as a null pointer.
+ */
+BaseResultType &MvImageClassification::result()
+{
+	unsigned long frame_number = 0;
+	unsigned int result_cnt = 0;
+
+	int ret = mv_image_classification_get_result_count(_handle, &frame_number, &result_cnt);
+	if (ret != MEDIA_VISION_ERROR_NONE)
+		throw std::runtime_error("Fail to get image classification result count.");
+
+	std::vector<std::string> labels;
+	labels.reserve(result_cnt);
+
+	for (unsigned int idx = 0; idx < result_cnt; ++idx) {
+		const char *label = nullptr;
+
+		ret = mv_image_classification_get_label(_handle, idx, &label);
+		// A null label cannot be turned into a std::string, so treat it as a failure too.
+		if (ret != MEDIA_VISION_ERROR_NONE || label == nullptr)
+			throw std::runtime_error("Fail to get image classification label.");
+
+		labels.emplace_back(label);
+	}
+
+	_output_data._labels.swap(labels);
+	_output_data._frame_number = frame_number;
+
+	return _output_data;
+}
+
+}
+}
+}