Commit fb8c061

Use Blobs instead of SyncedMemorys for the bias_multiplier_'s.
1 parent d5351bc commit fb8c061

File tree: 5 files changed, +14 −22 lines

include/caffe/vision_layers.hpp
Lines changed: 2 additions & 2 deletions

@@ -55,7 +55,7 @@ class ConvolutionLayer : public Layer<Dtype> {
   int num_output_;
   int group_;
   Blob<Dtype> col_buffer_;
-  shared_ptr<SyncedMemory> bias_multiplier_;
+  shared_ptr<Blob<Dtype> > bias_multiplier_;
   bool bias_term_;
   int M_;
   int K_;
@@ -157,7 +157,7 @@ class InnerProductLayer : public Layer<Dtype> {
   int K_;
   int N_;
   bool bias_term_;
-  shared_ptr<SyncedMemory> bias_multiplier_;
+  shared_ptr<Blob<Dtype> > bias_multiplier_;
 };

 // Forward declare PoolingLayer and SplitLayer for use in LRNLayer.
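The header change above is what lets the casts in the later hunks disappear: SyncedMemory hands out raw void* storage, so every caller had to reinterpret_cast, whereas Blob<Dtype> wraps the same storage with typed Dtype* accessors for both the CPU and GPU copies. A minimal sketch of the relevant interfaces, simplified from the actual Caffe headers:

// Simplified sketch of the two storage types; the real Caffe classes
// carry more members, but the return types are the point here.
class SyncedMemory {
 public:
  explicit SyncedMemory(size_t size);
  const void* cpu_data();      // untyped: callers must reinterpret_cast
  void* mutable_cpu_data();
  const void* gpu_data();
  void* mutable_gpu_data();
};

template <typename Dtype>
class Blob {
 public:
  Blob(int num, int channels, int height, int width);
  const Dtype* cpu_data() const;   // typed: no cast at the call site
  Dtype* mutable_cpu_data();
  const Dtype* gpu_data() const;   // same typing for the GPU pointer
  Dtype* mutable_gpu_data();
};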

src/caffe/layers/conv_layer.cpp
Lines changed: 4 additions & 8 deletions

@@ -78,12 +78,8 @@ void ConvolutionLayer<Dtype>::SetUp(const vector<Blob<Dtype>*>& bottom,
   }
   // Set up the bias filler
   if (bias_term_) {
-    bias_multiplier_.reset(new SyncedMemory(N_ * sizeof(Dtype)));
-    Dtype* bias_multiplier_data =
-        reinterpret_cast<Dtype*>(bias_multiplier_->mutable_cpu_data());
-    for (int i = 0; i < N_; ++i) {
-      bias_multiplier_data[i] = 1.;
-    }
+    bias_multiplier_.reset(new Blob<Dtype>(1, 1, 1, N_));
+    caffe_set(N_, Dtype(1), bias_multiplier_->mutable_cpu_data());
   }
   this->param_propagate_down_.resize(this->blobs_.size(), true);
 }
@@ -114,7 +110,7 @@ Dtype ConvolutionLayer<Dtype>::Forward_cpu(const vector<Blob<Dtype>*>& bottom,
     if (bias_term_) {
       caffe_cpu_gemm<Dtype>(CblasNoTrans, CblasNoTrans, num_output_,
           N_, 1, (Dtype)1., this->blobs_[1]->cpu_data(),
-          reinterpret_cast<const Dtype*>(bias_multiplier_->cpu_data()),
+          bias_multiplier_->cpu_data(),
           (Dtype)1., top_data + (*top)[i]->offset(n));
     }
   }
@@ -148,7 +144,7 @@ void ConvolutionLayer<Dtype>::Backward_cpu(const vector<Blob<Dtype>*>& top,
     for (int n = 0; n < num_; ++n) {
       caffe_cpu_gemv<Dtype>(CblasNoTrans, num_output_, N_,
           1., top_diff + top[0]->offset(n),
-          static_cast<const Dtype*>(bias_multiplier_->cpu_data()), 1.,
+          bias_multiplier_->cpu_data(), 1.,
           bias_diff);
     }
   }
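For readers following the math: bias_multiplier_ is an N_-long vector of ones, so the forward caffe_cpu_gemm is a rank-1 product that broadcasts each of the num_output_ bias values across all N_ spatial positions, and the backward caffe_cpu_gemv sums top_diff over those positions. A plain-loop sketch of what the two BLAS calls compute (illustrative only; the names mirror the diff but these helper functions are hypothetical):

// Forward bias term: top(c, s) += bias(c) * ones(s), i.e. a broadcast add.
void add_conv_bias(float* top_data, const float* bias,
                   int num_output, int N) {
  for (int c = 0; c < num_output; ++c)
    for (int s = 0; s < N; ++s)
      top_data[c * N + s] += bias[c];
}

// Backward bias term: bias_diff(c) += sum_s top_diff(c, s); multiplying by
// the ones vector is exactly a row-wise sum. The += matches beta = 1. in
// the gemv call, which accumulates across the images in the batch loop.
void conv_bias_gradient(float* bias_diff, const float* top_diff,
                        int num_output, int N) {
  for (int c = 0; c < num_output; ++c)
    for (int s = 0; s < N; ++s)
      bias_diff[c] += top_diff[c * N + s];
}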

src/caffe/layers/conv_layer.cu
Lines changed: 2 additions & 2 deletions

@@ -35,7 +35,7 @@ Dtype ConvolutionLayer<Dtype>::Forward_gpu(const vector<Blob<Dtype>*>& bottom,
     if (bias_term_) {
       caffe_gpu_gemm<Dtype>(CblasNoTrans, CblasNoTrans, num_output_,
           N_, 1, (Dtype)1., this->blobs_[1]->gpu_data(),
-          reinterpret_cast<const Dtype*>(bias_multiplier_->gpu_data()),
+          bias_multiplier_->gpu_data(),
           (Dtype)1., top_data + (*top)[i]->offset(n));
     }
   }
@@ -69,7 +69,7 @@ void ConvolutionLayer<Dtype>::Backward_gpu(const vector<Blob<Dtype>*>& top,
     for (int n = 0; n < num_; ++n) {
       caffe_gpu_gemv<Dtype>(CblasNoTrans, num_output_, N_,
           1., top_diff + top[0]->offset(n),
-          static_cast<const Dtype*>(bias_multiplier_->gpu_data()), 1.,
+          bias_multiplier_->gpu_data(), 1.,
           bias_diff);
     }
   }
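Note that SetUp only ever writes the ones through mutable_cpu_data(); the GPU hunks above still see correct values because a Blob's underlying SyncedMemory tracks where the data was last touched and copies host-to-device on the first gpu_data() call. A heavily simplified sketch of that lazy-sync idea (assumed behavior, not the real implementation):

// Lazy host/device sync: data lives where it was written last and is
// copied across on first access from the other side.
enum Head { UNINITIALIZED, HEAD_AT_CPU, HEAD_AT_GPU, SYNCED };

struct LazySyncedBuffer {
  const void* gpu_data() {
    if (head_ == HEAD_AT_CPU) {
      // cudaMemcpy(gpu_ptr_, cpu_ptr_, size_, cudaMemcpyHostToDevice);
      head_ = SYNCED;
    }
    return gpu_ptr_;
  }
  void* mutable_cpu_data() {
    head_ = HEAD_AT_CPU;  // the GPU copy is now stale until re-synced
    return cpu_ptr_;
  }
  Head head_ = UNINITIALIZED;
  void* cpu_ptr_ = nullptr;
  void* gpu_ptr_ = nullptr;
  size_t size_ = 0;
};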

src/caffe/layers/inner_product_layer.cpp
Lines changed: 4 additions & 8 deletions

@@ -47,12 +47,8 @@ void InnerProductLayer<Dtype>::SetUp(const vector<Blob<Dtype>*>& bottom,
   }  // parameter initialization
   // Setting up the bias multiplier
   if (bias_term_) {
-    bias_multiplier_.reset(new SyncedMemory(M_ * sizeof(Dtype)));
-    Dtype* bias_multiplier_data =
-        reinterpret_cast<Dtype*>(bias_multiplier_->mutable_cpu_data());
-    for (int i = 0; i < M_; ++i) {
-      bias_multiplier_data[i] = 1.;
-    }
+    bias_multiplier_.reset(new Blob<Dtype>(1, 1, 1, M_));
+    caffe_set(M_, Dtype(1), bias_multiplier_->mutable_cpu_data());
   }
   this->param_propagate_down_.resize(this->blobs_.size(), true);
 }
@@ -67,7 +63,7 @@ Dtype InnerProductLayer<Dtype>::Forward_cpu(const vector<Blob<Dtype>*>& bottom,
       bottom_data, weight, (Dtype)0., top_data);
   if (bias_term_) {
     caffe_cpu_gemm<Dtype>(CblasNoTrans, CblasNoTrans, M_, N_, 1, (Dtype)1.,
-        reinterpret_cast<const Dtype*>(bias_multiplier_->cpu_data()),
+        bias_multiplier_->cpu_data(),
         this->blobs_[1]->cpu_data(), (Dtype)1., top_data);
   }
   return Dtype(0);
@@ -88,7 +84,7 @@ void InnerProductLayer<Dtype>::Backward_cpu(const vector<Blob<Dtype>*>& top,
     const Dtype* top_diff = top[0]->cpu_diff();
     // Gradient with respect to bias
     caffe_cpu_gemv<Dtype>(CblasTrans, M_, N_, (Dtype)1., top_diff,
-        reinterpret_cast<const Dtype*>(bias_multiplier_->cpu_data()), (Dtype)0.,
+        bias_multiplier_->cpu_data(), (Dtype)0.,
         this->blobs_[1]->mutable_cpu_diff());
   }
   if (propagate_down[0]) {
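The inner product case is the transpose of the convolution one: here the ones vector has length M_ (the batch size), so the forward GEMM computes ones(M_ × 1) · bias(1 × N_) and broadcasts the per-output bias down the batch, while the CblasTrans gemv in the backward pass sums top_diff over the batch. An illustrative loop equivalent (hypothetical helpers, not from this commit):

// Forward: top(m, j) += bias(j) for every example m in the batch.
void add_ip_bias(float* top_data, const float* bias, int M, int N) {
  for (int m = 0; m < M; ++m)
    for (int j = 0; j < N; ++j)
      top_data[m * N + j] += bias[j];
}

// Backward: bias_diff(j) = sum_m top_diff(m, j); beta = (Dtype)0. in the
// gemv above means the result overwrites rather than accumulates.
void ip_bias_gradient(float* bias_diff, const float* top_diff,
                      int M, int N) {
  for (int j = 0; j < N; ++j) bias_diff[j] = 0;
  for (int m = 0; m < M; ++m)
    for (int j = 0; j < N; ++j)
      bias_diff[j] += top_diff[m * N + j];
}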

src/caffe/layers/inner_product_layer.cu
Lines changed: 2 additions & 2 deletions

@@ -23,7 +23,7 @@ Dtype InnerProductLayer<Dtype>::Forward_gpu(const vector<Blob<Dtype>*>& bottom,
       bottom_data, weight, (Dtype)0., top_data);
   if (bias_term_) {
     caffe_gpu_gemm<Dtype>(CblasNoTrans, CblasNoTrans, M_, N_, 1, (Dtype)1.,
-        reinterpret_cast<const Dtype*>(bias_multiplier_->gpu_data()),
+        bias_multiplier_->gpu_data(),
         this->blobs_[1]->gpu_data(), (Dtype)1., top_data);
   }
   return Dtype(0);
@@ -44,7 +44,7 @@ void InnerProductLayer<Dtype>::Backward_gpu(const vector<Blob<Dtype>*>& top,
     const Dtype* top_diff = top[0]->gpu_diff();
     // Gradient with respect to bias
     caffe_gpu_gemv<Dtype>(CblasTrans, M_, N_, (Dtype)1., top_diff,
-        reinterpret_cast<const Dtype*>(bias_multiplier_->gpu_data()), (Dtype)0.,
+        bias_multiplier_->gpu_data(), (Dtype)0.,
         this->blobs_[1]->mutable_gpu_diff());
   }
   if (propagate_down[0]) {
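Finally, a quick spot check of the new setup idiom, written against the Blob API shown in the header hunk (the test scaffolding here is hypothetical and not part of this commit):

// After the two-line SetUp idiom, the multiplier should be all ones.
shared_ptr<Blob<float> > mult(new Blob<float>(1, 1, 1, 5));
caffe_set(5, 1.0f, mult->mutable_cpu_data());
for (int i = 0; i < mult->count(); ++i) {
  CHECK_EQ(mult->cpu_data()[i], 1.0f);  // typed access, no cast needed
}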
