BVLC · nickcarlevaris · Feb 16, 2015 · Feb 17, 2015 · tnarihi · Feb 16, 2015
diff --git a/include/caffe/filler.hpp b/include/caffe/filler.hpp
@@ -157,6 +157,27 @@ class XavierFiller : public Filler<Dtype> {
   }
 };
 
+/**
+ * @brief Fills a Blob with values @f$ x \sim N(0, \sigma^2) @f$ where
+ *        @f$ \sigma = \sqrt{2 / n} @f$ and @f$ n @f$ is the number of incoming
+ *        nodes (count / num), based on the paper [He, Zhang, Ren and Sun 2015]
+ */
+template <typename Dtype>
+class MSRFiller : public Filler<Dtype> {
+ public:
+  explicit MSRFiller(const FillerParameter& param) : Filler<Dtype>(param) {}
+  virtual void Fill(Blob<Dtype>* blob) {
+    CHECK(blob->count());  // refuse to fill an empty blob
+    // Reject the unsupported sparse option before touching the blob's data.
+    CHECK_EQ(this->filler_param_.sparse(), -1)
+         << "Sparsity not supported by this Filler.";
+    const int fan_in = blob->count() / blob->num();
+    const Dtype stddev = sqrt(Dtype(2) / fan_in);
+    caffe_rng_gaussian<Dtype>(blob->count(), Dtype(0), stddev,
+        blob->mutable_cpu_data());
+  }
+};
+
 
 /**
  * @brief Get a specific filler from the specification given in FillerParameter.
@@ -177,6 +198,8 @@ Filler<Dtype>* GetFiller(const FillerParameter& param) {
     return new UniformFiller<Dtype>(param);
   } else if (type == "xavier") {
     return new XavierFiller<Dtype>(param);
+  } else if (type == "msr") {
+    return new MSRFiller<Dtype>(param);
   } else {
     CHECK(false) << "Unknown filler name: " << param.type();
   }

diff --git a/src/caffe/test/test_filler.cpp b/src/caffe/test/test_filler.cpp
@@ -142,4 +142,40 @@ TYPED_TEST(GaussianFillerTest, TestFill) {
   EXPECT_LE(var, target_var * 5.);
 }
 
+// Fixture: fills a Blob built with dimensions (1000, 3, 4, 5) via MSRFiller.
+template <typename Dtype>
+class MSRFillerTest : public ::testing::Test {
+ protected:
+  MSRFillerTest()
+      : blob_(new Blob<Dtype>(1000, 3, 4, 5)), filler_param_(),
+        filler_(new MSRFiller<Dtype>(filler_param_)) {
+    filler_->Fill(blob_);
+  }
+  virtual ~MSRFillerTest() { delete blob_; }
+  Blob<Dtype>* const blob_;  // raw owner; released in the destructor
+  FillerParameter filler_param_;  // value-initialized, no fields set
+  shared_ptr<MSRFiller<Dtype> > filler_;
+};
+
+TYPED_TEST_CASE(MSRFillerTest, TestDtypes);
+
+// Checks that the filled values have ~zero mean and std of sqrt(2 / fan_in).
+TYPED_TEST(MSRFillerTest, TestFill) {
+  ASSERT_TRUE(this->blob_);  // the blob is dereferenced immediately below
+  const int count = this->blob_->count();
+  const TypeParam* data = this->blob_->cpu_data();
+  double sum = 0., sum_sq = 0.;  // double limits rounding error
+  for (int i = 0; i < count; ++i) {
+    sum += data[i];
+    sum_sq += static_cast<double>(data[i]) * data[i];
+  }
+  const double mean = sum / count;
+  const double stddev = sqrt(sum_sq / count - mean * mean);
+  const int fan_in = count / this->blob_->num();  // same ratio the filler uses
+  const double target_std = sqrt(2.0 / fan_in);
+  // 0.01 is >10x the sampling error yet rejects a sqrt(1 / fan_in) scale.
+  EXPECT_NEAR(mean, 0.0, 0.01);
+  EXPECT_NEAR(stddev, target_std, 0.01);
+}
+
 }  // namespace caffe