Skip to content

Commit a123334

Browse files
committed
add div layer with broadcasting
1 parent 6e254ae commit a123334

File tree

5 files changed

+244
-0
lines changed

5 files changed

+244
-0
lines changed

FEATURES.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@ atan_layer
1010
batch_to_space_nd_layer
1111
crop_and_resize
1212
depth_to_space_layer
13+
div_layer
1314
expand_dims_nd_layer
1415
gather_layer
1516
gather_nd_layer

include/caffe/layers/div_layer.hpp

Lines changed: 48 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,48 @@
1+
#ifndef CAFFE_DIV_LAYER_HPP_
#define CAFFE_DIV_LAYER_HPP_

#include <vector>

#include "caffe/blob.hpp"
#include "caffe/layer.hpp"
#include "caffe/proto/caffe.pb.h"

namespace caffe {

/**
 * @brief Computes an elementwise division top = bottom[0] / divisor, with
 *        NumPy/TensorFlow-style broadcasting.
 *
 * The divisor is bottom[1] when two bottoms are given; otherwise it is read
 * from this->blobs_[0] (a parameter blob loaded with the layer).
 *
 * Broadcasting rule: two dimensions are compatible if they are equal or
 * either is 1. Shapes are aligned starting from the right-most dimension
 * and compared towards the left-most one.
 */
template <typename Dtype>
class DivLayer : public Layer<Dtype> {
 public:
  explicit DivLayer(const LayerParameter& param)
      : Layer<Dtype>(param) {}
  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);

  virtual inline const char* type() const { return "Div"; }
  virtual inline int MinBottomBlobs() const { return 1; }
  virtual inline int ExactNumTopBlobs() const { return 1; }

 protected:
  virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);

  /// @brief Not implemented -- this layer is forward-only.
  virtual void Backward_cpu(const vector<Blob<Dtype>*>& top,
      const vector<bool>& propagate_down,
      const vector<Blob<Dtype>*>& bottom) {
    NOT_IMPLEMENTED;
  }

  // bottom[0]->num_axes() - divisor->num_axes(); sign tells which operand
  // has the higher rank.
  int dim_diff_;
  // Rank of the broadcast (top) shape: max of the two operand ranks.
  int dim_;
  // True when either operand has zero axes (a scalar blob of shape ()).
  bool is_scalar_;
};

}  // namespace caffe

#endif  // CAFFE_DIV_LAYER_HPP_

include/caffe/util/math_functions.hpp

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,6 +46,9 @@ inline void caffe_memset(const size_t N, const int alpha, void* X) {
4646
template <typename Dtype>
4747
void caffe_add_scalar(const int N, const Dtype alpha, Dtype *X);
4848

49+
template <typename Dtype>
50+
void caffe_div_scalar(const int N, const Dtype alpha, Dtype *X);
51+
4952
template <typename Dtype>
5053
void caffe_scal(const int N, const Dtype alpha, Dtype *X);
5154

src/caffe/layers/div_layer.cpp

Lines changed: 178 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,178 @@
1+
#include <algorithm>
2+
#include <functional>
3+
#include <utility>
4+
#include <vector>
5+
6+
#include "caffe/layers/div_layer.hpp"
7+
8+
namespace caffe {
9+
template <typename Dtype>
10+
void DivLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
11+
const vector<Blob<Dtype>*>& top) {
12+
CHECK_NE(top[0], bottom[0]) << this->type() << " Layer does not allow in-place computation.";
13+
is_scalar_=false;
14+
Blob<Dtype>* divisor = (bottom.size() > 1) ? bottom[1] : this->blobs_[0].get();
15+
16+
if(bottom[0]->num_axes()==0 || divisor->num_axes()==0)
17+
is_scalar_=true;
18+
dim_diff_ = bottom[0]->num_axes() - divisor->num_axes();
19+
dim_ = bottom[0]->num_axes() >= divisor->num_axes() ? bottom[0]->num_axes() : divisor->num_axes();
20+
vector<int> top_shape(dim_, 1);
21+
if(dim_diff_ == 0)
22+
{
23+
if(!is_scalar_)
24+
{
25+
for(int i=0;i<dim_;i++)
26+
{
27+
CHECK(bottom[0]->shape(i)==divisor->shape(i) || bottom[0]->shape(i)==1 || divisor->shape(i)==1)
28+
<< "Dimensions must be equal or 1 in the bottoms!";
29+
top_shape[i] = bottom[0]->shape(i) >= divisor->shape(i) ? bottom[0]->shape(i): divisor->shape(i);
30+
}
31+
}
32+
}
33+
else if(dim_diff_ > 0) //bottom0 has more axes than bottom1
34+
{
35+
if(!is_scalar_)
36+
{
37+
for(int i=0;i<dim_diff_;i++)
38+
top_shape[i] = bottom[0]->shape(i);
39+
for(int i=dim_diff_; i<dim_; i++)
40+
top_shape[i] = bottom[0]->shape(i) >= divisor->shape(i-dim_diff_) ? bottom[0]->shape(i): divisor->shape(i-dim_diff_);
41+
}
42+
else //bottom1 is a scalar
43+
{
44+
for(int i=0;i<dim_;i++)
45+
top_shape[i] = bottom[0]->shape(i);
46+
}
47+
}
48+
else //dim_diff_<0, bottom1 has more axes than bottom0
49+
{
50+
if(!is_scalar_)
51+
{
52+
for(int i=0;i<-dim_diff_;i++)
53+
top_shape[i] = divisor->shape(i);
54+
for(int i=-dim_diff_; i<dim_; i++)
55+
top_shape[i] = bottom[0]->shape(i+dim_diff_) >= divisor->shape(i) ? bottom[0]->shape(i+dim_diff_): divisor->shape(i);
56+
}
57+
else //bottom0 is a scalar
58+
{
59+
for(int i=0;i<dim_;i++)
60+
top_shape[i] = divisor->shape(i);
61+
}
62+
}
63+
64+
top[0]->Reshape(top_shape);
65+
}
66+
67+
template <typename Dtype>
68+
void DivLayer<Dtype>::Forward_cpu(const vector<Blob<Dtype>*>& bottom,
69+
const vector<Blob<Dtype>*>& top) {
70+
const Dtype* bottom0_data = bottom[0]->cpu_data();
71+
Blob<Dtype>* divisor = (bottom.size() > 1) ? bottom[1] : this->blobs_[0].get();
72+
const Dtype* bottom1_data = divisor->cpu_data();
73+
Dtype* top_data = top[0]->mutable_cpu_data();
74+
int count = top[0]->count();
75+
76+
// Assume top index (x,y,z) with top shape (A, B, C)
77+
// top offset d = xBC + yC + z
78+
// So to count the bottom index, should first figure out x, y, z
79+
// x = d / BC
80+
// y = (d % BC) / C
81+
// z = d % C
82+
// Then consider bottom shape (A', B', C'), while A = A' or 1
83+
// So bottom offset = x'B'C' + y'C' + z', while x' = x or 0
84+
if(!is_scalar_)
85+
{
86+
for(int d=0; d<count; d++)
87+
{
88+
int offset0 = 0;
89+
int offset1 = 0;
90+
91+
if(dim_diff_ == 0)
92+
{
93+
for(int i=0;i<dim_-1;i++)
94+
{
95+
int num = (d % top[0]->count(i)) / top[0]->count(i+1);
96+
int n0 = 1 == bottom[0]->shape(i) ? 0 : num;
97+
int n1 = 1 == divisor->shape(i) ? 0 : num;
98+
offset0 += n0 * bottom[0]->count(i+1);
99+
offset1 += n1 * divisor->count(i+1);
100+
}
101+
int z = d % top[0]->shape(dim_-1);
102+
int z0 = 1 == bottom[0]->shape(dim_-1) ? 0 : z;
103+
int z1 = 1 == divisor->shape(dim_-1) ? 0 : z;
104+
offset0 += z0;
105+
offset1 += z1;
106+
}
107+
else if(dim_diff_ > 0) //bottom0 has more axes than bottom1
108+
{
109+
for(int i=0;i<dim_diff_;i++)
110+
{
111+
int num = (d % top[0]->count(i)) / top[0]->count(i+1);
112+
int n0 = 1 == bottom[0]->shape(i) ? 0 : num;
113+
offset0 += n0 * bottom[0]->count(i+1);
114+
}
115+
for(int i=dim_diff_;i<dim_-1;i++)
116+
{
117+
int num = (d % top[0]->count(i)) / top[0]->count(i+1);
118+
int n0 = 1 == bottom[0]->shape(i) ? 0 : num;
119+
int n1 = 1 == divisor->shape(i-dim_diff_) ? 0 : num;
120+
offset0 += n0 * bottom[0]->count(i+1);
121+
offset1 += n1 * divisor->count(i-dim_diff_+1);
122+
}
123+
int z = d % top[0]->shape(dim_-1);
124+
int z0 = 1 == bottom[0]->shape(dim_-1) ? 0 : z;
125+
int z1 = 1 == divisor->shape(dim_-dim_diff_-1) ? 0 : z;
126+
offset0 += z0;
127+
offset1 += z1;
128+
}
129+
else //dim_diff_<0, bottom1 has more axes than bottom0
130+
{
131+
for(int i=0;i<-dim_diff_;i++)
132+
{
133+
int num = (d % top[0]->count(i)) / top[0]->count(i+1);
134+
int n1 = 1 == divisor->shape(i) ? 0 : num;
135+
offset1 += n1 * divisor->count(i+1);
136+
}
137+
for(int i=-dim_diff_;i<dim_-1;i++)
138+
{
139+
int num = (d % top[0]->count(i)) / top[0]->count(i+1);
140+
int n0 = 1 == bottom[0]->shape(i+dim_diff_) ? 0 : num;
141+
int n1 = 1 == divisor->shape(i) ? 0 : num;
142+
offset0 += n0 * bottom[0]->count(i+dim_diff_+1);
143+
offset1 += n1 * divisor->count(i+1);
144+
}
145+
int z = d % top[0]->shape(dim_-1);
146+
int z0 = 1 == bottom[0]->shape(dim_+dim_diff_-1) ? 0 : z;
147+
int z1 = 1 == divisor->shape(dim_-1) ? 0 : z;
148+
offset0 += z0;
149+
offset1 += z1;
150+
}
151+
152+
top_data[d] = bottom0_data[offset0] / bottom1_data[offset1];
153+
}
154+
}
155+
else //is scalar with shape ()
156+
{
157+
if(divisor->num_axes()==0) //bottom1 is a scalar
158+
{
159+
caffe_copy(count, bottom0_data, top_data);
160+
Dtype scalar = bottom1_data[0];
161+
caffe_div_scalar(count, scalar, top_data);
162+
}
163+
else //bottom0 is a scalar
164+
{
165+
Dtype scalar = bottom0_data[0];
166+
for(int d=0; d<count; d++)
167+
{
168+
top_data[d] = scalar / bottom1_data[d];
169+
}
170+
}
171+
}
172+
}
173+
174+
175+
INSTANTIATE_CLASS(DivLayer);  // instantiate the float and double versions
REGISTER_LAYER_CLASS(Div);    // expose the layer as type "Div" in the factory
177+
178+
} // namespace caffe

src/caffe/util/math_functions.cpp

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -82,6 +82,20 @@ void caffe_add_scalar(const int N, const double alpha, double* Y) {
8282
}
8383
}
8484

85+
template <>
86+
void caffe_div_scalar(const int N, const float alpha, float* Y) {
87+
for (int i = 0; i < N; ++i) {
88+
Y[i] /= alpha;
89+
}
90+
}
91+
92+
template <>
93+
void caffe_div_scalar(const int N, const double alpha, double* Y) {
94+
for (int i = 0; i < N; ++i) {
95+
Y[i] /= alpha;
96+
}
97+
}
98+
8599
template <typename Dtype>
86100
void caffe_copy(const int N, const Dtype* X, Dtype* Y) {
87101
if (X != Y) {

0 commit comments

Comments
 (0)