split off Reshape for common layers

author Jonathan L Long <jonlong@cs.berkeley.edu>

Thu, 11 Sep 2014 05:42:45 +0000 (22:42 -0700)

committer Evan Shelhamer <shelhamer@imaginarynumber.net>

Thu, 18 Sep 2014 19:41:46 +0000 (12:41 -0700)
author Jonathan L Long <jonlong@cs.berkeley.edu>
Thu, 11 Sep 2014 05:42:45 +0000 (22:42 -0700)
committer Evan Shelhamer <shelhamer@imaginarynumber.net>
Thu, 18 Sep 2014 19:41:46 +0000 (12:41 -0700)
diff --git a/include/caffe/common_layers.hpp b/include/caffe/common_layers.hpp

index deb4a57..1f945ca 100644 (file)
--- a/include/caffe/common_layers.hpp
+++ b/include/caffe/common_layers.hpp
@@ -40,6 +40,8 @@ class ArgMaxLayer : public Layer<Dtype> {
        : Layer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
      return LayerParameter_LayerType_ARGMAX;
@@ -81,6 +83,8 @@ class ConcatLayer : public Layer<Dtype> {
        : Layer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
      return LayerParameter_LayerType_CONCAT;
@@ -159,6 +163,8 @@ class EltwiseLayer : public Layer<Dtype> {
        : Layer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
      return LayerParameter_LayerType_ELTWISE;
@@ -198,7 +204,7 @@ class FlattenLayer : public Layer<Dtype> {
   public:
    explicit FlattenLayer(const LayerParameter& param)
        : Layer<Dtype>(param) {}
-  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
@@ -251,6 +257,8 @@ class InnerProductLayer : public Layer<Dtype> {
        : Layer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
      return LayerParameter_LayerType_INNER_PRODUCT;
@@ -285,7 +293,7 @@ class MVNLayer : public Layer<Dtype> {
   public:
    explicit MVNLayer(const LayerParameter& param)
        : Layer<Dtype>(param) {}
-  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
@@ -319,7 +327,7 @@ class SilenceLayer : public Layer<Dtype> {
   public:
    explicit SilenceLayer(const LayerParameter& param)
        : Layer<Dtype>(param) {}
-  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {}
  
    virtual inline LayerParameter_LayerType type() const {
@@ -351,7 +359,7 @@ class SoftmaxLayer : public Layer<Dtype> {
   public:
    explicit SoftmaxLayer(const LayerParameter& param)
        : Layer<Dtype>(param) {}
-  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
@@ -388,6 +396,8 @@ class CuDNNSoftmaxLayer : public SoftmaxLayer<Dtype> {
        : SoftmaxLayer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
    virtual ~CuDNNSoftmaxLayer();
  
   protected:
@@ -413,7 +423,7 @@ class SplitLayer : public Layer<Dtype> {
   public:
    explicit SplitLayer(const LayerParameter& param)
        : Layer<Dtype>(param) {}
-  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
@@ -448,6 +458,8 @@ class SliceLayer : public Layer<Dtype> {
        : Layer<Dtype>(param) {}
    virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top);
+  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top);
  
    virtual inline LayerParameter_LayerType type() const {
      return LayerParameter_LayerType_SLICE;
diff --git a/src/caffe/layers/argmax_layer.cpp b/src/caffe/layers/argmax_layer.cpp

index 4b67f24..0d1a107 100644 (file)
--- a/src/caffe/layers/argmax_layer.cpp
+++ b/src/caffe/layers/argmax_layer.cpp
@@ -16,6 +16,11 @@ void ArgMaxLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
    CHECK_GE(top_k_, 1) << " top k must not be less than 1.";
    CHECK_LE(top_k_, bottom[0]->count() / bottom[0]->num())
        << "top_k must be less than or equal to the number of classes.";
+}
+
+template <typename Dtype>
+void ArgMaxLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
    if (out_max_val_) {
      // Produces max_ind and max_val
      (*top)[0]->Reshape(bottom[0]->num(), 2, top_k_, 1);
diff --git a/src/caffe/layers/concat_layer.cpp b/src/caffe/layers/concat_layer.cpp

index 73d28b1..10a11f1 100644 (file)
--- a/src/caffe/layers/concat_layer.cpp
+++ b/src/caffe/layers/concat_layer.cpp
@@ -14,7 +14,11 @@ void ConcatLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      "concat_dim should be >= 0";
    CHECK_LE(concat_dim_, 1) <<
      "For now concat_dim <=1, it can only concat num and channels";
+}
  
+template <typename Dtype>
+void ConcatLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
    // Initialize with the first blob.
    count_ = bottom[0]->count();
    num_ = bottom[0]->num();
diff --git a/src/caffe/layers/cudnn_softmax_layer.cpp b/src/caffe/layers/cudnn_softmax_layer.cpp

index 6dab2d6..79ba523 100644 (file)
--- a/src/caffe/layers/cudnn_softmax_layer.cpp
+++ b/src/caffe/layers/cudnn_softmax_layer.cpp
@@ -17,12 +17,20 @@ void CuDNNSoftmaxLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
    SoftmaxLayer<Dtype>::LayerSetUp(bottom, top);
    // Initialize CUDNN.
    CUDNN_CHECK(cudnnCreate(&handle_));
+  cudnn::createTensor4dDesc<Dtype>(&bottom_desc_);
+  cudnn::createTensor4dDesc<Dtype>(&top_desc_);
+}
+
+template <typename Dtype>
+void CuDNNSoftmaxLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
+  SoftmaxLayer<Dtype>::Reshape(bottom, top);
    int N = bottom[0]->num();
    int K = bottom[0]->channels();
    int H = bottom[0]->height();
    int W = bottom[0]->width();
-  cudnn::createTensor4dDesc<Dtype>(&bottom_desc_, N, K, H, W);
-  cudnn::createTensor4dDesc<Dtype>(&top_desc_, N, K, H, W);
+  cudnn::setTensor4dDesc<Dtype>(&bottom_desc_, N, K, H, W);
+  cudnn::setTensor4dDesc<Dtype>(&top_desc_, N, K, H, W);
  }
  
  template <typename Dtype>
diff --git a/src/caffe/layers/eltwise_layer.cpp b/src/caffe/layers/eltwise_layer.cpp

index ca157a8..569560f 100644 (file)
--- a/src/caffe/layers/eltwise_layer.cpp
+++ b/src/caffe/layers/eltwise_layer.cpp
@@ -17,6 +17,20 @@ void EltwiseLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        == EltwiseParameter_EltwiseOp_PROD
        && this->layer_param().eltwise_param().coeff_size())) <<
        "Eltwise layer only takes coefficients for summation.";
+  op_ = this->layer_param_.eltwise_param().operation();
+  // Blob-wise coefficients for the elementwise operation.
+  coeffs_ = vector<Dtype>(bottom.size(), 1);
+  if (this->layer_param().eltwise_param().coeff_size()) {
+    for (int i = 0; i < bottom.size(); ++i) {
+      coeffs_[i] = this->layer_param().eltwise_param().coeff(i);
+    }
+  }
+  stable_prod_grad_ = this->layer_param_.eltwise_param().stable_prod_grad();
+}
+
+template <typename Dtype>
+void EltwiseLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
    const int num = bottom[0]->num();
    const int channels = bottom[0]->channels();
    const int height = bottom[0]->height();
@@ -28,15 +42,6 @@ void EltwiseLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      CHECK_EQ(width, bottom[i]->width());
    }
    (*top)[0]->Reshape(num, channels, height, width);
-  op_ = this->layer_param_.eltwise_param().operation();
-  // Blob-wise coefficients for the elementwise operation.
-  coeffs_ = vector<Dtype>(bottom.size(), 1);
-  if (this->layer_param().eltwise_param().coeff_size()) {
-    for (int i = 0; i < bottom.size(); ++i) {
-      coeffs_[i] = this->layer_param().eltwise_param().coeff(i);
-    }
-  }
-  stable_prod_grad_ = this->layer_param_.eltwise_param().stable_prod_grad();
    // If max operation, we will initialize the vector index part.
    if (this->layer_param_.eltwise_param().operation() ==
        EltwiseParameter_EltwiseOp_MAX && top->size() == 1) {
diff --git a/src/caffe/layers/flatten_layer.cpp b/src/caffe/layers/flatten_layer.cpp

index 8c1fc74..65310cd 100644 (file)
--- a/src/caffe/layers/flatten_layer.cpp
+++ b/src/caffe/layers/flatten_layer.cpp
@@ -7,7 +7,7 @@
  namespace caffe {
  
  template <typename Dtype>
-void FlattenLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+void FlattenLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {
    int channels_out = bottom[0]->channels() * bottom[0]->height()
        * bottom[0]->width();
diff --git a/src/caffe/layers/inner_product_layer.cpp b/src/caffe/layers/inner_product_layer.cpp

index 3ba0e1f..ecd05a0 100644 (file)
--- a/src/caffe/layers/inner_product_layer.cpp
+++ b/src/caffe/layers/inner_product_layer.cpp
@@ -14,11 +14,8 @@ void InnerProductLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {
    const int num_output = this->layer_param_.inner_product_param().num_output();
    bias_term_ = this->layer_param_.inner_product_param().bias_term();
-  // Figure out the dimensions
-  M_ = bottom[0]->num();
-  K_ = bottom[0]->count() / bottom[0]->num();
    N_ = num_output;
-  (*top)[0]->Reshape(bottom[0]->num(), num_output, 1, 1);
+  K_ = bottom[0]->count() / bottom[0]->num();
    // Check if we need to set up the weights
    if (this->blobs_.size() > 0) {
      LOG(INFO) << "Skipping parameter initialization";
@@ -42,12 +39,22 @@ void InnerProductLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
        bias_filler->Fill(this->blobs_[1].get());
      }
    }  // parameter initialization
-  // Setting up the bias multiplier
+  this->param_propagate_down_.resize(this->blobs_.size(), true);
+}
+
+template <typename Dtype>
+void InnerProductLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
+  // Figure out the dimensions
+  M_ = bottom[0]->num();
+  CHECK_EQ(bottom[0]->count() / bottom[0]->num(), K_) << "Input size "
+    "incompatible with inner product parameters.";
+  (*top)[0]->Reshape(bottom[0]->num(), N_, 1, 1);
+  // Set up the bias multiplier
    if (bias_term_) {
      bias_multiplier_.Reshape(1, 1, 1, M_);
      caffe_set(M_, Dtype(1), bias_multiplier_.mutable_cpu_data());
    }
-  this->param_propagate_down_.resize(this->blobs_.size(), true);
  }
  
  template <typename Dtype>
diff --git a/src/caffe/layers/mvn_layer.cpp b/src/caffe/layers/mvn_layer.cpp

index 4d90702..6a57b3e 100644 (file)
--- a/src/caffe/layers/mvn_layer.cpp
+++ b/src/caffe/layers/mvn_layer.cpp
@@ -8,7 +8,7 @@
  namespace caffe {
  
  template <typename Dtype>
-void MVNLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+void MVNLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {
    (*top)[0]->Reshape(bottom[0]->num(), bottom[0]->channels(),
        bottom[0]->height(), bottom[0]->width());
diff --git a/src/caffe/layers/slice_layer.cpp b/src/caffe/layers/slice_layer.cpp

index 9fa1275..ed679a9 100644 (file)
--- a/src/caffe/layers/slice_layer.cpp
+++ b/src/caffe/layers/slice_layer.cpp
@@ -18,6 +18,11 @@ void SliceLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
    std::copy(slice_param.slice_point().begin(),
        slice_param.slice_point().end(),
        std::back_inserter(slice_point_));
+}
+
+template <typename Dtype>
+void SliceLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
+      vector<Blob<Dtype>*>* top) {
    count_ = 0;
    num_ = bottom[0]->num();
    channels_ = bottom[0]->channels();
@@ -50,7 +55,6 @@ void SliceLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
           count_ += (*top)[i]->count();
        }
      }
-
    } else {
      if (slice_dim_ == 0) {
        CHECK_EQ(num_ % top->size(), 0)
diff --git a/src/caffe/layers/softmax_layer.cpp b/src/caffe/layers/softmax_layer.cpp

index 952db74..60668a3 100644 (file)
--- a/src/caffe/layers/softmax_layer.cpp
+++ b/src/caffe/layers/softmax_layer.cpp
@@ -8,7 +8,7 @@
  namespace caffe {
  
  template <typename Dtype>
-void SoftmaxLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+void SoftmaxLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {
    (*top)[0]->Reshape(bottom[0]->num(), bottom[0]->channels(),
        bottom[0]->height(), bottom[0]->width());
diff --git a/src/caffe/layers/split_layer.cpp b/src/caffe/layers/split_layer.cpp

index 3bed347..40d3600 100644 (file)
--- a/src/caffe/layers/split_layer.cpp
+++ b/src/caffe/layers/split_layer.cpp
@@ -7,7 +7,7 @@
  namespace caffe {
  
  template <typename Dtype>
-void SplitLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+void SplitLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
        vector<Blob<Dtype>*>* top) {
    count_ = bottom[0]->count();
    for (int i = 0; i < top->size(); ++i) {
author	Jonathan L Long <jonlong@cs.berkeley.edu>
	Thu, 11 Sep 2014 05:42:45 +0000 (22:42 -0700)
committer	Evan Shelhamer <shelhamer@imaginarynumber.net>
	Thu, 18 Sep 2014 19:41:46 +0000 (12:41 -0700)
include/caffe/common_layers.hpp		patch \| blob \| history
src/caffe/layers/argmax_layer.cpp		patch \| blob \| history
src/caffe/layers/concat_layer.cpp		patch \| blob \| history
src/caffe/layers/cudnn_softmax_layer.cpp		patch \| blob \| history
src/caffe/layers/eltwise_layer.cpp		patch \| blob \| history
src/caffe/layers/flatten_layer.cpp		patch \| blob \| history
src/caffe/layers/inner_product_layer.cpp		patch \| blob \| history
src/caffe/layers/mvn_layer.cpp		patch \| blob \| history
src/caffe/layers/slice_layer.cpp		patch \| blob \| history
src/caffe/layers/softmax_layer.cpp		patch \| blob \| history
src/caffe/layers/split_layer.cpp		patch \| blob \| history