[Tensor] Operational Improvements and Functionality Simplification

author Donghyeon Jeong <dhyeon.jeong@samsung.com>

Fri, 12 Jul 2024 07:33:11 +0000 (16:33 +0900)

committer Jijoong Moon <jijoong.moon@samsung.com>

Fri, 26 Jul 2024 01:27:26 +0000 (10:27 +0900)
author Donghyeon Jeong <dhyeon.jeong@samsung.com>
Fri, 12 Jul 2024 07:33:11 +0000 (16:33 +0900)
committer Jijoong Moon <jijoong.moon@samsung.com>
Fri, 26 Jul 2024 01:27:26 +0000 (10:27 +0900)
diff --git a/nntrainer/tensor/float_tensor.cpp b/nntrainer/tensor/float_tensor.cpp

index 5ac40ca7817e5bef18bbac70fccfca164bf67e07..d1a697ec5b0c00ccfa380eaca47d84716fbb2b77 100644 (file)
--- a/nntrainer/tensor/float_tensor.cpp
+++ b/nntrainer/tensor/float_tensor.cpp
@@ -814,6 +814,18 @@ void FloatTensor::copyData(const Tensor &from) {
    }
  }
  
+void FloatTensor::copy_with_stride(const Tensor &input, Tensor &output) {
+  for (unsigned int b = 0; b < output.batch(); ++b) {
+    for (unsigned int c = 0; c < output.channel(); ++c) {
+      for (unsigned int h = 0; h < output.height(); ++h) {
+        for (unsigned int w = 0; w < output.width(); ++w) {
+          output.setValue(b, c, h, w, input.getValue<float>(b, c, h, w));
+        }
+      }
+    }
+  }
+}
+
  std::vector<unsigned int> FloatTensor::argmax() const {
    std::vector<unsigned int> result;
    const float *data = (float *)getData();
@@ -1061,12 +1073,11 @@ std::vector<Tensor> FloatTensor::split(std::vector<size_t> sizes, int axis) {
    return ret;
  }
  
-Tensor FloatTensor::cat(const std::vector<Tensor> &tensors, int axis) {
+Tensor FloatTensor::concat(const std::vector<Tensor> &tensors, int axis) {
    if (axis == -1) {
      axis = 3;
    }
  
-  Tensor ret;
    auto ref_dim = tensors.front().getDim();
    bool is_format_nchw = (ref_dim.getFormat() == Tformat::NCHW);
    ref_dim.setTensorDim(axis, 1);
@@ -1106,7 +1117,7 @@ Tensor FloatTensor::cat(const std::vector<Tensor> &tensors, int axis) {
    auto ret_dim = ref_dim;
    ret_dim.setTensorDim(axis, axis_dim);
  
-  ret = Tensor(ret_dim);
+  Tensor ret = Tensor(ret_dim);
  
    std::array<unsigned, 4> loc = {0, 0, 0, 0};
    for (auto &t : tensors) {
diff --git a/nntrainer/tensor/float_tensor.h b/nntrainer/tensor/float_tensor.h

index 1adfebb2264af73aa7036070b462d89ce8f2f12a..68e09468663ae4c633af3086c2c968743a79431f 100644 (file)
--- a/nntrainer/tensor/float_tensor.h
+++ b/nntrainer/tensor/float_tensor.h
@@ -363,7 +363,7 @@ public:
    /**
-   * @copydoc Tensor::cat(const std::vector<Tensor> &tensors, int axis)
+   * @copydoc Tensor::concat(const std::vector<Tensor> &tensors, int axis)
     */
-  static Tensor cat(const std::vector<Tensor> &tensors, int axis);
+  Tensor concat(const std::vector<Tensor> &tensors, int axis) override;
  
    /**
     * @copydoc Tensor::copy(const Tensor &from)
@@ -375,6 +375,13 @@ public:
     */
    void copyData(const Tensor &from);
  
+  /**
+   * @brief      Copy input into output element by element (b, c, h, w)
+   * @param[in]  input Tensor to be copied
+   * @param[out] output output Tensor
+   */
+  void copy_with_stride(const Tensor &input, Tensor &output) override;
+
    /**
     * @copydoc Tensor::argmax()
     */
diff --git a/nntrainer/tensor/half_tensor.cpp b/nntrainer/tensor/half_tensor.cpp

index 26ac4e8546369d54ba2ebb98b2ced98eada80d24..b76393d8c781d84a0d0dba7652102ffc18f735cd 100644 (file)
--- a/nntrainer/tensor/half_tensor.cpp
+++ b/nntrainer/tensor/half_tensor.cpp
@@ -887,11 +887,10 @@ std::vector<Tensor> HalfTensor::split(std::vector<size_t> sizes, int axis) {
    return ret;
  }
  
-Tensor HalfTensor::cat(const std::vector<Tensor> &tensors, int axis) {
+Tensor HalfTensor::concat(const std::vector<Tensor> &tensors, int axis) {
    if (axis == -1) {
      axis = 3;
    }
-  Tensor ret;
    auto ref_dim = tensors.front().getDim();
    bool is_format_nchw = (ref_dim.getFormat() == Tformat::NCHW);
    ref_dim.setTensorDim(axis, 1);
@@ -931,7 +930,7 @@ Tensor HalfTensor::cat(const std::vector<Tensor> &tensors, int axis) {
    auto ret_dim = ref_dim;
    ret_dim.setTensorDim(axis, axis_dim);
  
-  ret = Tensor(ret_dim);
+  Tensor output = Tensor(ret_dim);
  
    std::array<unsigned, 4> loc = {0, 0, 0, 0};
    for (auto &t : tensors) {
@@ -950,7 +949,7 @@ Tensor HalfTensor::cat(const std::vector<Tensor> &tensors, int axis) {
      }
  
      for (size_t i = 0u, sz = t.size(); i < sz; ++i) {
-      iter_value(loc, start_loc, ret, tensor_dim_arr) = t.getValue<_FP16>(i);
+      iter_value(loc, start_loc, output, tensor_dim_arr) = t.getValue<_FP16>(i);
      }
  
      if (is_format_nchw) {
@@ -965,7 +964,7 @@ Tensor HalfTensor::cat(const std::vector<Tensor> &tensors, int axis) {
        }
      }
    }
-  return ret;
+  return output;
  }
  
  void HalfTensor::print(std::ostream &out) const {
@@ -1060,6 +1059,18 @@ void HalfTensor::copyData(const Tensor &from) {
    }
  }
  
+void HalfTensor::copy_with_stride(const Tensor &input, Tensor &output) {
+  for (unsigned int b = 0; b < output.batch(); ++b) {
+    for (unsigned int c = 0; c < output.channel(); ++c) {
+      for (unsigned int h = 0; h < output.height(); ++h) {
+        for (unsigned int w = 0; w < output.width(); ++w) {
+          output.setValue(b, c, h, w, input.getValue<_FP16>(b, c, h, w));
+        }
+      }
+    }
+  }
+}
+
  std::vector<unsigned int> HalfTensor::argmax() const {
    std::vector<unsigned int> result;
    const _FP16 *data = (_FP16 *)getData();
diff --git a/nntrainer/tensor/half_tensor.h b/nntrainer/tensor/half_tensor.h

index 439882076ce3149ff7ce8aefb6f77caa10a852b4..77bf5fdf55c3682ab9ea847b3fc10261ff085bf4 100644 (file)
--- a/nntrainer/tensor/half_tensor.h
+++ b/nntrainer/tensor/half_tensor.h
@@ -353,7 +353,7 @@ public:
    /**
-   * @copydoc Tensor::cat(const std::vector<Tensor> &tensors, int axis)
+   * @copydoc Tensor::concat(const std::vector<Tensor> &tensors, int axis)
     */
-  static Tensor cat(const std::vector<Tensor> &tensors, int axis);
+  Tensor concat(const std::vector<Tensor> &tensors, int axis) override;
  
    /**
     * @copydoc Tensor::copy(const Tensor &from)
@@ -365,6 +365,13 @@ public:
     */
    void copyData(const Tensor &from);
  
+  /**
+   * @brief      Copy input into output element by element (b, c, h, w)
+   * @param[in]  input Tensor to be copied
+   * @param[out] output output Tensor
+   */
+  void copy_with_stride(const Tensor &input, Tensor &output) override;
+
    /**
     * @copydoc Tensor::argmax()
     */
diff --git a/nntrainer/tensor/tensor.cpp b/nntrainer/tensor/tensor.cpp

index 2c815e2913006ab33434e2917c4e98661937b378..dfb0be0433d04ebbfa2b1ef4977662aaa69c7e26 100644 (file)
--- a/nntrainer/tensor/tensor.cpp
+++ b/nntrainer/tensor/tensor.cpp
@@ -818,27 +818,19 @@ std::vector<Tensor> Tensor::split(std::vector<size_t> sizes, int axis) {
    return itensor->split(sizes, axis);
  }
  
-Tensor Tensor::cat(const std::vector<Tensor> &tensors, int axis) {
+Tensor Tensor::concat(const std::vector<Tensor> &tensors, int axis) {
    NNTR_THROW_IF(!(-1 <= axis && axis < 4), std::invalid_argument)
      << "cannot split axis of axis: " << axis;
  
    NNTR_THROW_IF(tensors.empty(), std::invalid_argument)
      << "given tensor vector is empty";
  
-  Tensor output;
-  Tdatatype dtype = tensors.front().getDim().getDataType();
-
-  if (dtype == Tdatatype::FP32) {
-    output = FloatTensor::cat(tensors, axis);
-  } else if (dtype == ml::train::TensorDim::DataType::FP16) {
-#ifdef ENABLE_FP16
-    output = HalfTensor::cat(tensors, axis);
-#else
-    throw std::invalid_argument("Error: enable-fp16 is not enabled");
-#endif
-  }
+  return itensor->concat(tensors, axis);
+}
  
-  return output;
+Tensor Tensor::cat(const std::vector<Tensor> &tensors, int axis) {
+  Tensor input = tensors[0];
+  return input.concat(tensors, axis);
  }
  
  void Tensor::print(std::ostream &out) const {
@@ -874,18 +866,8 @@ void Tensor::copy(const Tensor &from) {
      // if tensor size and data type match, copy data
      itensor->copy(from);
    } else {
-    // replace with a new tensor that are the same with the given tensor
-    if (from.getDataType() == ml::train::TensorDim::DataType::FP32) {
-      Tensor t = Tensor(from.getDim(), from.getData<float>());
-      swap(t, *this);
-    } else if (from.getDataType() == ml::train::TensorDim::DataType::FP16) {
-#ifdef ENABLE_FP16
-      Tensor t = Tensor(from.getDim(), from.getData<_FP16>());
-      swap(t, *this);
-#else
-      throw std::invalid_argument("Error: enable-fp16 is not enabled");
-#endif
-    }
+    Tensor t = Tensor(from.getDim(), from.getData<char>());
+    swap(t, *this);
    }
  }
  
@@ -893,37 +875,13 @@ void Tensor::copyData(const Tensor &from) { itensor->copyData(from); }
  
  void Tensor::copy_with_stride(const Tensor &from) {
    if (itensor->getDim() == from.getDim()) {
-    // if the tensor dim matches, copy the data
-    for (unsigned int b = 0; b < batch(); ++b) {
-      for (unsigned int c = 0; c < channel(); ++c) {
-        for (unsigned int h = 0; h < height(); ++h) {
-          for (unsigned int w = 0; w < width(); ++w) {
-            setValue(b, c, h, w, from.getValue<float>(b, c, h, w));
-          }
-        }
-      }
-    }
+    // If the tensor dims match, copy the data. This also applies to
+    // non-contiguous tensors.
+    itensor->copy_with_stride(from, *this);
    } else {
      // replace with a new tensor that has the same data as the given tensor
      Tensor t = Tensor(from.getDim(), true);
-    for (unsigned int b = 0; b < t.batch(); ++b) {
-      for (unsigned int c = 0; c < t.channel(); ++c) {
-        for (unsigned int h = 0; h < t.height(); ++h) {
-          for (unsigned int w = 0; w < t.width(); ++w) {
-            if (getDataType() == ml::train::TensorDim::DataType::FP32) {
-              t.setValue(b, c, h, w, from.getValue<float>(b, c, h, w));
-            } else if (getDataType() == ml::train::TensorDim::DataType::FP16) {
-              /// @todo remove #ifdef ENABLE_FP16
-#ifdef ENABLE_FP16
-              t.setValue(b, c, h, w, from.getValue<_FP16>(b, c, h, w));
-#else
-              throw std::invalid_argument("Error: enable-fp16 is not enabled");
-#endif
-            }
-          }
-        }
-      }
-    }
+    itensor->copy_with_stride(from, t);
      swap(t, *this);
    }
  }
diff --git a/nntrainer/tensor/tensor.h b/nntrainer/tensor/tensor.h

index bfd98978405e8b0a21688e000641951c74ff3d7e..4e8765849fbe5dff9bc6b816345f058fc6ee5e48 100644 (file)
--- a/nntrainer/tensor/tensor.h
+++ b/nntrainer/tensor/tensor.h
@@ -1145,6 +1145,15 @@ public:
     */
    std::vector<Tensor> split(std::vector<size_t> sizes, int axis = 0);
  
+  /**
+   * @brief concatenate tensors along axis
+   *
+   * @param tensors tensors to be concatenated to the first tensor
+   * @param axis axis
+   * @return Tensor concatenated tensor
+   */
+  Tensor concat(const std::vector<Tensor> &tensors, int axis = 0);
+
    /**
     * @brief concatenate tensors along axis
     *
diff --git a/nntrainer/tensor/tensor_base.h b/nntrainer/tensor/tensor_base.h

index 1831de0a8fac93f3f780d7607ce1ab3b254e7549..c3b4bfb87547e94922d113340f14e32a88ea883e 100644 (file)
--- a/nntrainer/tensor/tensor_base.h
+++ b/nntrainer/tensor/tensor_base.h
@@ -396,6 +396,11 @@ public:
     */
    virtual std::vector<Tensor> split(std::vector<size_t> sizes, int axis) = 0;
  
+  /**
+   * @copydoc Tensor::concat(const std::vector<Tensor> &tensors, int axis)
+   */
+  virtual Tensor concat(const std::vector<Tensor> &tensors, int axis) = 0;
+
    /**
     * @copydoc Tensor::print(std::ostream &out)
     */
@@ -431,6 +436,13 @@ public:
     */
    virtual void copyData(const Tensor &from) = 0;
  
+  /**
+   * @brief      Copy input into output element by element
+   * @param[in]  input Tensor to be copied
+   * @param[out] output output Tensor
+   */
+  virtual void copy_with_stride(const Tensor &input, Tensor &output) = 0;
+
    /**
     * @copydoc Tensor::argmax()
     */
author	Donghyeon Jeong <dhyeon.jeong@samsung.com>
	Fri, 12 Jul 2024 07:33:11 +0000 (16:33 +0900)
committer	Jijoong Moon <jijoong.moon@samsung.com>
	Fri, 26 Jul 2024 01:27:26 +0000 (10:27 +0900)
nntrainer/tensor/float_tensor.cpp		patch \| blob \| history
nntrainer/tensor/float_tensor.h		patch \| blob \| history
nntrainer/tensor/half_tensor.cpp		patch \| blob \| history
nntrainer/tensor/half_tensor.h		patch \| blob \| history
nntrainer/tensor/tensor.cpp		patch \| blob \| history
nntrainer/tensor/tensor.h		patch \| blob \| history
nntrainer/tensor/tensor_base.h		patch \| blob \| history