[Tensor] Support multiple data types in copyData

author Donghyeon Jeong <dhyeon.jeong@samsung.com>

Thu, 2 Nov 2023 00:50:45 +0000 (09:50 +0900)

committer Jijoong Moon <jijoong.moon@samsung.com>

Fri, 3 Nov 2023 10:29:05 +0000 (19:29 +0900)
author Donghyeon Jeong <dhyeon.jeong@samsung.com>
Thu, 2 Nov 2023 00:50:45 +0000 (09:50 +0900)
committer Jijoong Moon <jijoong.moon@samsung.com>
Fri, 3 Nov 2023 10:29:05 +0000 (19:29 +0900)
diff --git a/nntrainer/tensor/tensor.cpp b/nntrainer/tensor/tensor.cpp

index f2e7e79de709d3b013e6e1eb31c155558e6d73f6..5ee888f9c81c9d8d73006a0f075ec7c950e8f73e 100644 (file)
--- a/nntrainer/tensor/tensor.cpp
+++ b/nntrainer/tensor/tensor.cpp
@@ -3041,17 +3041,46 @@ void Tensor::copyData(const Tensor &from) {
    if (size() != from.size())
      throw std::invalid_argument("Size of tensor to copy must match");
  
-  if (getDataType() != from.getDataType())
-    throw std::invalid_argument("Data type of tensor to copy must match");
-
-  if (getDataType() == ml::train::TensorDim::DataType::FP32) {
-    copy(from.getData<float>());
-  } else if (getDataType() == ml::train::TensorDim::DataType::FP16) {
+  if (getDataType() == from.getDataType()) {
+    if (getDataType() == ml::train::TensorDim::DataType::FP32) {
+      copy(from.getData<float>());
+    } else if (getDataType() == ml::train::TensorDim::DataType::FP16) {
  #ifdef ENABLE_FP16
-    copy(from.getData<_FP16>());
+      copy(from.getData<_FP16>());
  #else
-    throw std::invalid_argument("Error: enable-fp16 is not enabled");
+      throw std::invalid_argument("Error: enable-fp16 is not enabled");
+#endif
+    } else {
+      copy(from.getData<uint8_t>());
+    }
+  } else {
+    if (getDataType() == ml::train::TensorDim::DataType::FP32) {
+      if (from.getDataType() == ml::train::TensorDim::DataType::FP16) {
+#ifdef ENABLE_FP16
+        scopy(size(), from.getData<_FP16>(), 1, getData<float>(), 1);
+#else
+        throw std::invalid_argument("Error: enable-fp16 is not enabled");
  #endif
+      } else if (from.getDataType() == ml::train::TensorDim::DataType::QINT8) {
+        scopy_int8_to_float32(from.size(), from.getData<uint8_t>(), 1,
+                              getData<float>(), 1);
+      } else if (from.getDataType() == ml::train::TensorDim::DataType::QINT4) {
+        scopy_int4_to_float32((from.size() + 1) / 2, from.getData<uint8_t>(), 1,
+                              getData<float>(), 1);
+      }
+    } else if (getDataType() == ml::train::TensorDim::DataType::FP16) {
+#ifdef ENABLE_FP16
+      if (from.getDataType() == ml::train::TensorDim::DataType::QINT8) {
+        scopy_int8_to_float16(from.size(), from.getData<uint8_t>(), 1,
+                              getData<_FP16>(), 1);
+      } else if (from.getDataType() == ml::train::TensorDim::DataType::QINT4) {
+        scopy_int4_to_float16((from.size() + 1) / 2, from.getData<uint8_t>(), 1,
+                              getData<_FP16>(), 1);
+      }
+#else
+      throw std::invalid_argument("Error: enable-fp16 is not enabled");
+#endif
+    }
    }
  }
  
@@ -3124,16 +3153,6 @@ void Tensor::save(std::ostream &file) {
      << " is too big. It cannot be represented by std::streamsize";
  
    if (this->getDataType() == ml::train::TensorDim::DataType::FP32) {
-
-    // std::vector<_FP16> temp(size());
-    // for (unsigned int i = 0; i < size(); ++i) {
-    //   temp[i] = static_cast<_FP16>(getData()[i]);
-    // }
-
-    // checkedWrite(file, (char *)temp.data(),
-    //              static_cast<std::streamsize>(size() * sizeof(_FP16)),
-    //              "[Tensor::save] operation failed");
-
      checkedWrite(file, (char *)getData(), sz,
                   "[Tensor::save] operation failed");
    } else if (this->getDataType() == ml::train::TensorDim::DataType::FP16) {
@@ -3684,40 +3703,6 @@ void Tensor::setZeroPoints(std::vector<uint8_t> zp) {
  
  std::vector<uint8_t> Tensor::getZeroPoints() const { return zero_points; }
  
-void Tensor::flate(Tensor &output) const {
-  if (output.getDataType() == Tdatatype::FP32) {
-    float *o_data = output.getData<float>();
-    const uint8_t *data = getData<uint8_t>();
-
-    if (getDataType() == Tdatatype::QINT4) {
-      for (unsigned int i = 0; i < (output.getDim().getDataLen() + 1) / 2;
-           ++i) {
-        unsigned int idx = i * 2;
-        o_data[idx] = data[i] >> 4;
-        if (idx + 1 < output.getDim().getDataLen())
-          o_data[idx + 1] = data[i] & 0x0f;
-      }
-    } else if (getDataType() == Tdatatype::QINT8) {
-      for (unsigned int i = 0; i < output.getDim().getDataLen(); ++i) {
-        o_data[i] = data[i];
-      }
-    }
-  } else if (output.getDataType() == Tdatatype::FP16) {
-#ifdef ENABLE_FP16
-    _FP16 *o_data = output.getData<_FP16>();
-    const uint8_t *data = getData<uint8_t>();
-
-    if (getDataType() == Tdatatype::QINT8) {
-      for (unsigned int i = 0; i < output.getDim().getDataLen(); ++i) {
-        o_data[i] = data[i];
-      }
-    }
-#else
-    throw std::invalid_argument("enble-fp16 is not set");
-#endif
-  }
-}
-
  void Tensor::dequantize(Tensor &output, unsigned int axis) const {
    if (getDataType() == Tdatatype::FP32 || getDataType() == Tdatatype::FP16) {
      throw std::invalid_argument("Error: Tensor cannot be dequantized");
@@ -3764,16 +3749,10 @@ void Tensor::dequantize(Tensor &output, unsigned int axis) const {
    size_t h = (axis == 2) ? zero_points.size() : 1;
    size_t w = (axis == 3) ? zero_points.size() : 1;
  
+  output.copyData(*this);
+
    if (output.getDataType() == Tdatatype::FP16) {
  #ifdef ENABLE_FP16
-    if (getDataType() == Tdatatype::QINT4) {
-      scopy_int4_to_float16((size() + 1) / 2, getData<uint8_t>(), 1,
-                            output.getData<_FP16>(), 1);
-    } else if (getDataType() == Tdatatype::QINT8) {
-      // @todo scopy for qint8
-      flate(output);
-    }
-
      std::vector<_FP16> zero_points_16(zero_points.begin(), zero_points.end());
      Tensor zero_points_fp16_tensor(
        {{b, c, h, w}, {getFormat(), Tdatatype::FP16}}, zero_points_16.data());
@@ -3789,9 +3768,6 @@ void Tensor::dequantize(Tensor &output, unsigned int axis) const {
      throw std::invalid_argument("enble-fp16 is not set");
  #endif
    } else if (output.getDataType() == Tdatatype::FP32) {
-    // @todo need scopy for uint8 to float
-    flate(output);
-
      std::vector<float> zero_points_32(zero_points.begin(), zero_points.end());
      Tensor zero_points_fp32_tensor(
        {{b, c, h, w}, {getFormat(), Tdatatype::FP32}}, zero_points_32.data());
diff --git a/nntrainer/tensor/tensor.h b/nntrainer/tensor/tensor.h

index 8a1cab2828e2de1397effe39f519f21e680d8bbb..43aececcecd734e3909ab39ca4a627434c996046 100644 (file)
--- a/nntrainer/tensor/tensor.h
+++ b/nntrainer/tensor/tensor.h
@@ -2004,12 +2004,6 @@ public:
     */
    void dequantize(Tensor &output, unsigned int axis) const;
  
-  /**
-   * @brief      copy QINT Tensor and save to output tensor
-   * @param[out] output Tensor to store the result
-   */
-  void flate(Tensor &output) const;
-
    static constexpr float epsilon = 1e-5;
  
  private:
author	Donghyeon Jeong <dhyeon.jeong@samsung.com>
	Thu, 2 Nov 2023 00:50:45 +0000 (09:50 +0900)
committer	Jijoong Moon <jijoong.moon@samsung.com>
	Fri, 3 Nov 2023 10:29:05 +0000 (19:29 +0900)
nntrainer/tensor/tensor.cpp		patch | blob | history
nntrainer/tensor/tensor.h		patch | blob | history