Skip to content

Commit c647d9c

Browse files
committed
add message ParamSpec to replace param name, blobs_lr, weight_decay, ...
1 parent 18f1926 commit c647d9c

File tree

8 files changed

+526
-438
lines changed

8 files changed

+526
-438
lines changed

src/caffe/net.cpp

Lines changed: 23 additions & 59 deletions
Original file line number | Diff line number | Diff line change
@@ -112,36 +112,19 @@ void Net<Dtype>::Init(const NetParameter& in_param) {
112112
memory_used_ += top_vecs_[layer_id][top_id]->count();
113113
}
114114
DLOG(INFO) << "Memory required for data: " << memory_used_ * sizeof(Dtype);
115-
const int blobs_lr_size = layer_param.blobs_lr_size();
115+
const int param_size = layer_param.param_size();
116116
const int num_param_blobs = layers_[layer_id]->blobs().size();
117-
CHECK(blobs_lr_size == num_param_blobs || blobs_lr_size == 0)
118-
<< "Incorrect blobs lr size: should be either 0 "
119-
<< "or the same as the number of the layer's parameter blobs.";
120-
if (blobs_lr_size) {
121-
// Check if this layer needs backward operation itself
122-
for (int param_id = 0; param_id < blobs_lr_size; ++param_id) {
123-
const bool param_need_backward = layer_param.blobs_lr(param_id) > 0;
124-
need_backward |= param_need_backward;
125-
layers_[layer_id]->set_param_propagate_down(param_id,
126-
param_need_backward);
127-
}
128-
} else if (layers_[layer_id]->blobs().size()) {
129-
// catch: if a layer param does not specify blobs_lr, we should assume the
130-
// learning rate to be 1. Thus we will need to perform backward.
131-
need_backward = true;
132-
for (int param_id = 0; param_id < blobs_lr_size; ++param_id) {
133-
layers_[layer_id]->set_param_propagate_down(param_id, true);
134-
}
117+
CHECK_LE(param_size, num_param_blobs)
118+
<< "Too many params specified for layer " << layer_param.name();
119+
ParamSpec default_param_spec;
120+
for (int param_id = 0; param_id < num_param_blobs; ++param_id) {
121+
const ParamSpec* param_spec = (param_id < param_size) ?
122+
&layer_param.param(param_id) : &default_param_spec;
123+
const bool param_need_backward = param_spec->lr_mult() > 0;
124+
need_backward |= param_need_backward;
125+
layers_[layer_id]->set_param_propagate_down(param_id,
126+
param_need_backward);
135127
}
136-
const int param_size = layer_param.param_size();
137-
CHECK(param_size == num_param_blobs || param_size == 0)
138-
<< "Incorrect param size: should be either 0 or the same as "
139-
"the number of the layer's parameter blobs: " << num_param_blobs;
140-
const int param_share_mode_size = layer_param.param_share_mode_size();
141-
CHECK(param_share_mode_size == num_param_blobs ||
142-
param_share_mode_size == 0)
143-
<< "Incorrect param_share_mode size: should be either 0 or the same as "
144-
"the number of the layer's parameter blobs: " << num_param_blobs;
145128
for (int param_id = 0; param_id < num_param_blobs; ++param_id) {
146129
AppendParam(param, layer_id, param_id);
147130
}
@@ -407,7 +390,8 @@ void Net<Dtype>::AppendParam(const NetParameter& param, const int layer_id,
407390
const int param_id) {
408391
const LayerParameter& layer_param = layers_[layer_id]->layer_param();
409392
const int param_size = layer_param.param_size();
410-
string param_name = param_size ? layer_param.param(param_id) : "";
393+
string param_name =
394+
(param_size > param_id) ? layer_param.param(param_id).name() : "";
411395
if (param_name.size()) {
412396
param_display_names_.push_back(param_name);
413397
} else {
@@ -441,10 +425,9 @@ void Net<Dtype>::AppendParam(const NetParameter& param, const int layer_id,
441425
Blob<Dtype>* this_blob = layers_[layer_id]->blobs()[param_id].get();
442426
Blob<Dtype>* owner_blob =
443427
layers_[owner_layer_id]->blobs()[owner_param_id].get();
444-
const int param_share_mode_size = layer_param.param_share_mode_size();
445-
if (param_share_mode_size > param_id &&
446-
(layer_param.param_share_mode(param_id) ==
447-
LayerParameter_DimCheckMode_PERMISSIVE)) {
428+
const int param_size = layer_param.param_size();
429+
if (param_size > param_id && (layer_param.param(param_id).share_mode() ==
430+
ParamSpec_DimCheckMode_PERMISSIVE)) {
448431
// Permissive dimension checking -- only check counts are the same.
449432
CHECK_EQ(this_blob->count(), owner_blob->count())
450433
<< "Shared parameter blobs must have the same count.";
@@ -467,34 +450,15 @@ void Net<Dtype>::AppendParam(const NetParameter& param, const int layer_id,
467450
template <typename Dtype>
468451
void Net<Dtype>::GetLearningRateAndWeightDecay() {
469452
LOG(INFO) << "Collecting Learning Rate and Weight Decay.";
453+
ParamSpec default_param_spec;
470454
for (int i = 0; i < layers_.size(); ++i) {
471455
vector<shared_ptr<Blob<Dtype> > >& layer_blobs = layers_[i]->blobs();
472-
// push the learning rate mutlipliers
473-
if (layers_[i]->layer_param().blobs_lr_size()) {
474-
CHECK_EQ(layers_[i]->layer_param().blobs_lr_size(), layer_blobs.size());
475-
for (int j = 0; j < layer_blobs.size(); ++j) {
476-
float local_lr = layers_[i]->layer_param().blobs_lr(j);
477-
CHECK_GE(local_lr, 0.);
478-
params_lr_.push_back(local_lr);
479-
}
480-
} else {
481-
for (int j = 0; j < layer_blobs.size(); ++j) {
482-
params_lr_.push_back(1.);
483-
}
484-
}
485-
// push the weight decay multipliers
486-
if (layers_[i]->layer_param().weight_decay_size()) {
487-
CHECK_EQ(layers_[i]->layer_param().weight_decay_size(),
488-
layer_blobs.size());
489-
for (int j = 0; j < layer_blobs.size(); ++j) {
490-
float local_decay = layers_[i]->layer_param().weight_decay(j);
491-
CHECK_GE(local_decay, 0.);
492-
params_weight_decay_.push_back(local_decay);
493-
}
494-
} else {
495-
for (int j = 0; j < layer_blobs.size(); ++j) {
496-
params_weight_decay_.push_back(1.);
497-
}
456+
for (int j = 0; j < layer_blobs.size(); ++j) {
457+
const ParamSpec* param_spec =
458+
(layers_[i]->layer_param().param_size() > j) ?
459+
&layers_[i]->layer_param().param(j) : &default_param_spec;
460+
params_lr_.push_back(param_spec->lr_mult());
461+
params_weight_decay_.push_back(param_spec->decay_mult());
498462
}
499463
}
500464
}

src/caffe/proto/caffe.proto

Lines changed: 30 additions & 22 deletions
Original file line number | Diff line number | Diff line change
@@ -209,6 +209,31 @@ message NetStateRule {
209209
repeated string not_stage = 5;
210210
}
211211

212+
// Specifies training parameters (multipliers on global learning constants,
213+
// and the name and other settings used for weight sharing).
214+
message ParamSpec {
215+
// The names of the parameter blobs -- useful for sharing parameters among
216+
// layers, but never required otherwise. To share a parameter between two
217+
// layers, give it a (non-empty) name.
218+
optional string name = 1;
219+
220+
// Whether to require shared weights to have the same shape, or just the same
221+
// count -- defaults to STRICT if unspecified.
222+
optional DimCheckMode share_mode = 2;
223+
enum DimCheckMode {
224+
// STRICT (default) requires that num, channels, height, width each match.
225+
STRICT = 0;
226+
// PERMISSIVE requires only the count (num*channels*height*width) to match.
227+
PERMISSIVE = 1;
228+
}
229+
230+
// The multiplier on the global learning rate for this parameter.
231+
optional float lr_mult = 3 [default = 1.0];
232+
233+
// The multiplier on the global weight decay for this parameter.
234+
optional float decay_mult = 4 [default = 1.0];
235+
}
236+
212237
// NOTE
213238
// Update the next available ID when you add a new LayerParameter field.
214239
//
@@ -224,29 +249,12 @@ message LayerParameter {
224249
// to each top blob.
225250
repeated float loss_weight = 5;
226251

227-
// The blobs containing the numeric parameters of the layer
228-
repeated BlobProto blobs = 6;
252+
// Specifies training parameters (multipliers on global learning constants,
253+
// and the name and other settings used for weight sharing).
254+
repeated ParamSpec param = 6;
229255

230-
// The names of the parameter blobs -- useful for sharing parameters among
231-
// layers (but never required).
232-
repeated string param = 7;
233-
234-
// Whether to require shared weights to have the same shape, or just the same
235-
// count -- defaults to STRICT if unspecified.
236-
repeated DimCheckMode param_share_mode = 8;
237-
enum DimCheckMode {
238-
// STRICT (default) requires that num, channels, height, width each match.
239-
STRICT = 0;
240-
// PERMISSIVE requires only the count (num*channels*height*width) to match.
241-
PERMISSIVE = 1;
242-
}
243-
244-
// The ratio that is multiplied on the global learning rate. If you want to
245-
// set the learning ratio for one blob, you need to set it for all blobs.
246-
repeated float blobs_lr = 9;
247-
248-
// The weight decay that is multiplied on the global weight decay.
249-
repeated float weight_decay = 10;
256+
// The blobs containing the numeric parameters of the layer.
257+
repeated BlobProto blobs = 7;
250258

251259
// Rules controlling whether and when a layer is included in the network,
252260
// based on the current NetState. You may specify a non-zero number of rules

src/caffe/test/test_gradient_based_solver.cpp

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -64,7 +64,7 @@ class GradientBasedSolverTest : public MultiDeviceTest<TypeParam> {
6464
"lr_policy: 'fixed' "
6565
"net_param { "
6666
" name: 'TestNetwork' "
67-
" layers: { "
67+
" layer { "
6868
" name: 'data' "
6969
" type: 'DummyData' "
7070
" dummy_data_param { "
@@ -83,7 +83,7 @@ class GradientBasedSolverTest : public MultiDeviceTest<TypeParam> {
8383
" top: 'data' "
8484
" top: 'targets' "
8585
" } "
86-
" layers: { "
86+
" layer { "
8787
" name: 'innerprod' "
8888
" type: 'InnerProduct' "
8989
" inner_product_param { "
@@ -100,7 +100,7 @@ class GradientBasedSolverTest : public MultiDeviceTest<TypeParam> {
100100
" bottom: 'data' "
101101
" top: 'innerprod' "
102102
" } "
103-
" layers: { "
103+
" layer { "
104104
" name: 'loss' "
105105
" type: 'EuclideanLoss' "
106106
" bottom: 'innerprod' "

0 commit comments

Comments (0)