accumulate gradients in inner product layer

author Sergio <sguada@gmail.com>

Sat, 27 Sep 2014 06:03:26 +0000 (23:03 -0700)

committer Evan Shelhamer <shelhamer@imaginarynumber.net>

Wed, 27 May 2015 21:07:20 +0000 (14:07 -0700)
author Sergio <sguada@gmail.com>
Sat, 27 Sep 2014 06:03:26 +0000 (23:03 -0700)
committer Evan Shelhamer <shelhamer@imaginarynumber.net>
Wed, 27 May 2015 21:07:20 +0000 (14:07 -0700)
diff --git a/src/caffe/layers/inner_product_layer.cpp b/src/caffe/layers/inner_product_layer.cpp

index 89e0c8f..83c3235 100644 (file)
--- a/src/caffe/layers/inner_product_layer.cpp
+++ b/src/caffe/layers/inner_product_layer.cpp
@@ -101,13 +101,13 @@ void InnerProductLayer<Dtype>::Backward_cpu(const vector<Blob<Dtype>*>& top,
      const Dtype* bottom_data = bottom[0]->cpu_data();
      // Gradient with respect to weight
      caffe_cpu_gemm<Dtype>(CblasTrans, CblasNoTrans, N_, K_, M_, (Dtype)1.,
-        top_diff, bottom_data, (Dtype)0., this->blobs_[0]->mutable_cpu_diff());
+        top_diff, bottom_data, (Dtype)1., this->blobs_[0]->mutable_cpu_diff());
    }
    if (bias_term_ && this->param_propagate_down_[1]) {
      const Dtype* top_diff = top[0]->cpu_diff();
      // Gradient with respect to bias
      caffe_cpu_gemv<Dtype>(CblasTrans, M_, N_, (Dtype)1., top_diff,
-        bias_multiplier_.cpu_data(), (Dtype)0.,
+        bias_multiplier_.cpu_data(), (Dtype)1.,
          this->blobs_[1]->mutable_cpu_diff());
    }
    if (propagate_down[0]) {
diff --git a/src/caffe/layers/inner_product_layer.cu b/src/caffe/layers/inner_product_layer.cu

index a9e1784..dd90cac 100644 (file)
--- a/src/caffe/layers/inner_product_layer.cu
+++ b/src/caffe/layers/inner_product_layer.cu
@@ -33,13 +33,13 @@ void InnerProductLayer<Dtype>::Backward_gpu(const vector<Blob<Dtype>*>& top,
      const Dtype* bottom_data = bottom[0]->gpu_data();
      // Gradient with respect to weight
      caffe_gpu_gemm<Dtype>(CblasTrans, CblasNoTrans, N_, K_, M_, (Dtype)1.,
-        top_diff, bottom_data, (Dtype)0., this->blobs_[0]->mutable_gpu_diff());
+        top_diff, bottom_data, (Dtype)1., this->blobs_[0]->mutable_gpu_diff());
    }
    if (bias_term_ && this->param_propagate_down_[1]) {
      const Dtype* top_diff = top[0]->gpu_diff();
      // Gradient with respect to bias
      caffe_gpu_gemv<Dtype>(CblasTrans, M_, N_, (Dtype)1., top_diff,
-        bias_multiplier_.gpu_data(), (Dtype)0.,
+        bias_multiplier_.gpu_data(), (Dtype)1.,
          this->blobs_[1]->mutable_gpu_diff());
    }
    if (propagate_down[0]) {
author	Sergio <sguada@gmail.com>
	Sat, 27 Sep 2014 06:03:26 +0000 (23:03 -0700)
committer	Evan Shelhamer <shelhamer@imaginarynumber.net>
	Wed, 27 May 2015 21:07:20 +0000 (14:07 -0700)
src/caffe/layers/inner_product_layer.cpp		patch \| blob \| history
src/caffe/layers/inner_product_layer.cu		patch \| blob \| history