foss-for-synopsys-dwc-arc-processors
diff --git a/‎data/VOC0712/create_data.sh‎
Lines changed: 2 additions & 2 deletions b/‎data/VOC0712/create_data.sh‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎include/caffe/data_transformer.hpp‎
Lines changed: 3 additions & 1 deletion b/‎include/caffe/data_transformer.hpp‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎include/caffe/layers/annotated_data_layer.hpp‎
Lines changed: 1 addition & 0 deletions b/‎include/caffe/layers/annotated_data_layer.hpp‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎include/caffe/layers/reorg_layer.hpp‎
Lines changed: 113 additions & 0 deletions b/‎include/caffe/layers/reorg_layer.hpp‎
Lines changed: 113 additions & 0 deletions
diff --git a/‎include/caffe/layers/yolo_v2_loss_layer.hpp‎
Lines changed: 58 additions & 0 deletions b/‎include/caffe/layers/yolo_v2_loss_layer.hpp‎
Lines changed: 58 additions & 0 deletions
diff --git a/‎include/caffe/util/io.hpp‎
Lines changed: 8 additions & 6 deletions b/‎include/caffe/util/io.hpp‎
Lines changed: 8 additions & 6 deletions
diff --git a/‎include/caffe/util/yolo_preprocess.hpp‎
Lines changed: 65 additions & 0 deletions b/‎include/caffe/util/yolo_preprocess.hpp‎
Lines changed: 65 additions & 0 deletions
diff --git a/‎scripts/create_annoset.py‎
Lines changed: 5 additions & 2 deletions b/‎scripts/create_annoset.py‎
Lines changed: 5 additions & 2 deletions
@@ -6,7 +6,7 @@ cd $root_dir
 redo=1
 data_root_dir="$HOME/data/VOCdevkit"
 dataset_name="VOC0712"
-mapfile="$root_dir/data/$dataset_name/labelmap_voc.prototxt"
+mapfile="$root_dir/data/$dataset_name/labelmap_yolo_voc.prototxt"
 anno_type="detection"
 db="lmdb"
 min_dim=0
@@ -21,5 +21,5 @@ then
 fi
 for subset in test trainval
 do
-  python $root_dir/scripts/create_annoset.py --anno-type=$anno_type --label-map-file=$mapfile --min-dim=$min_dim --max-dim=$max_dim --resize-width=$width --resize-height=$height --check-label $extra_cmd $data_root_dir $root_dir/data/$dataset_name/$subset.txt $data_root_dir/$dataset_name/$db/$dataset_name"_"$subset"_"$db examples/$dataset_name
+  python $root_dir/scripts/create_annoset.py --anno-type=$anno_type --label-map-file=$mapfile --min-dim=$min_dim --max-dim=$max_dim --resize-width=$width --resize-height=$height --check-label --caffe-yolo $extra_cmd $data_root_dir $root_dir/data/$dataset_name/$subset.txt $data_root_dir/$dataset_name/$db/$dataset_name"_"$subset"_"$db examples/$dataset_name
 done
@@ -258,7 +258,9 @@ class DataTransformer {
    */
   void Transform(const Datum& datum, Blob<Dtype>* transformed_blob,
                  NormalizedBBox* crop_bbox, bool* do_mirror);
-
+  void Transform_Yolo(const AnnotatedDatum& anno_datum,  // Declaration only; the definition is not part of this header hunk.
+                Blob<Dtype>* transformed_blob, NormalizedBBox* crop_bbox,  // NOTE(review): non-const pointers, presumably outputs -- confirm against the definition
+                RepeatedPtrField<AnnotationGroup>* transformed_anno_group_all);  // NOTE(review): name suggests it receives the transformed annotation groups -- confirm
   // Tranformation parameters
   TransformationParameter param_;
 
 
@@ -40,6 +40,7 @@ class AnnotatedDataLayer : public BasePrefetchingDataLayer<Dtype> {
   AnnotatedDatum_AnnotationType anno_type_;
   vector<BatchSampler> batch_samplers_;
   string label_map_file_;
+  vector<int> sides_;
 };
 
 }  // namespace caffe
 
@@ -0,0 +1,113 @@
+#ifndef CAFFE_REORG_LAYER_HPP_
+#define CAFFE_REORG_LAYER_HPP_
+
+#include <vector>
+
+#include "caffe/blob.hpp"
+#include "caffe/layer.hpp"
+#include "caffe/proto/caffe.pb.h"
+
+namespace caffe {
+
+/*
+ * @brief Layer whose type() string is "Reorg"; it takes exactly one bottom
+ * Blob and produces exactly one top Blob.
+ *
+ * NOTE(review): the wording previously here ("Reshapes the input Blob into an
+ * arbitrary-sized output Blob", with pointers to FlattenLayer and
+ * Blob::ShareData / Blob::ShareDiff) describes a plain reshape and does not
+ * match the stride_ / reverse_ members declared below. Presumably this layer
+ * performs the stride-based channel <-> spatial rearrangement implemented by
+ * reorg_cpu() later in this header -- confirm against the layer's source
+ * files, which are not part of this header.
+ */
+    template<typename Dtype>
+    class ReorgLayer : public Layer<Dtype> {
+    public:
+        explicit ReorgLayer(const LayerParameter &param)
+                : Layer<Dtype>(param) {}
+
+        virtual void LayerSetUp(const vector<Blob<Dtype> *> &bottom,
+                                const vector<Blob<Dtype> *> &top);
+
+        virtual void Reshape(const vector<Blob<Dtype> *> &bottom,
+                             const vector<Blob<Dtype> *> &top);
+
+        virtual inline const char *type() const { return "Reorg"; }  // layer type string
+
+        virtual inline int ExactNumBottomBlobs() const { return 1; }  // exactly one input blob
+
+        virtual inline int ExactNumTopBlobs() const { return 1; }  // exactly one output blob
+
+    protected:
+
+
+        virtual void Forward_cpu(const vector<Blob<Dtype> *> &bottom,
+                                 const vector<Blob<Dtype> *> &top);
+
+        virtual void Backward_cpu(const vector<Blob<Dtype> *> &top,
+                                  const vector<bool> &propagate_down, const vector<Blob<Dtype> *> &bottom);
+
+        virtual void Forward_gpu(const vector<Blob<Dtype> *> &bottom,
+                                 const vector<Blob<Dtype> *> &top);
+
+        virtual void Backward_gpu(const vector<Blob<Dtype> *> &top,
+                                  const vector<bool> &propagate_down, const vector<Blob<Dtype> *> &bottom);
+
+        int stride_;  // presumably the stride handed to reorg_cpu(); assigned outside this header -- TODO confirm
+        bool reverse_;  // presumably selects the direction of the rearrangement -- TODO confirm
+        int batch_num_;
+        int channels_;
+        int reorged_channels_;  // reorged_* members: presumably the top-blob counterparts of channels_/height_/width_ -- TODO confirm
+        int height_, width_;
+        int reorged_height_, reorged_width_;
+        Blob<Dtype> diff_;
+    };
+    template<typename Dtype>  // Same index mapping as the const-pointer/bool reorg_cpu overload that follows in this header.
+    void reorg_cpu(Dtype *x, int w, int h, int c, int batch, int stride, int forward, Dtype *out)  // NOTE(review): a call with non-const x and a bool flag is ambiguous between the two overloads
+    {
+        int b,i,j,k;
+        int out_c = c/(stride*stride);  // channel count of the spatially larger layout; stride == 0, or 0 < c < stride*stride (out_c == 0), divides by zero
+
+        for(b = 0; b < batch; ++b){
+            for(k = 0; k < c; ++k){
+                for(j = 0; j < h; ++j){
+                    for(i = 0; i < w; ++i){
+                        int in_index  = i + w*(j + h*(k + c*b));  // offset of (b, k, j, i) in a [batch][c][h][w] buffer
+                        int c2 = k % out_c;
+                        int offset = k / out_c;  // selects the sub-position inside a stride x stride cell
+                        int w2 = i*stride + offset % stride;
+                        int h2 = j*stride + offset / stride;
+                        int out_index = w2 + w*stride*(h2 + h*stride*(c2 + out_c*b));  // offset of (b, c2, h2, w2) in a [batch][out_c][h*stride][w*stride] buffer
+                        if(forward) out[out_index] = x[in_index];  // nonzero flag: x is in the [c][h][w] layout, out receives the larger layout
+                        else out[in_index] = x[out_index];  // zero flag: x is in the larger layout, out receives the [c][h][w] layout
+                    }
+                }
+            }
+        }
+    }
+    /**
+     * @brief Copies every element between a [b_n][b_c][b_h][b_w] layout and a
+     *        [b_n][b_c / (stride * stride)][b_h * stride][b_w * stride] layout.
+     *
+     * The loops walk the first layout; for each position the matching offset
+     * in the second layout is computed from the channel index and stride.
+     *
+     * @param bottom_data source buffer (read only)
+     * @param b_w width of the first layout
+     * @param b_h height of the first layout
+     * @param b_c channel count of the first layout
+     * @param b_n batch size
+     * @param stride spatial factor; stride == 0, or 0 < b_c < stride * stride,
+     *        leads to a division by zero in the body
+     * @param forward true: the source is in the first layout and the
+     *        destination receives the second; false: the reverse
+     * @param top_data destination buffer
+     */
+    template<typename Dtype>
+    void reorg_cpu(const Dtype *bottom_data, const int b_w, const int b_h,
+                   const int b_c, const int b_n, const int stride,
+                   const bool forward, Dtype *top_data) {
+        int t_c = b_c / (stride * stride);  // dimensions of the second (spatially larger) layout
+        int t_w = b_w * stride;
+        int t_h = b_h * stride;
+        for (int n = 0; n < b_n; n++) {
+            for (int c = 0; c < b_c; c++) {
+                for (int h = 0; h < b_h; h++) {
+                    for (int w = 0; w < b_w; w++) {
+                        int bottom_index = w + b_w * (h + b_h * (c + b_c * n));  // offset of (n, c, h, w) in the first layout
+                        int c2 = c % t_c;
+                        int offset = c / t_c;  // selects the sub-position inside a stride x stride cell
+                        int w2 = w * stride + offset % stride;
+                        int h2 = h * stride + offset / stride;
+                        int top_index = w2 + t_w * (h2 + t_h * (c2 + t_c * n));  // offset of (n, c2, h2, w2) in the second layout
+                        if (forward) top_data[top_index] = bottom_data[bottom_index];
+                        else
+                            top_data[bottom_index] = bottom_data[top_index];
+                    }
+                }
+            }
+        }
+    }
+
+
+}  // namespace caffe
+
+#endif  // CAFFE_REORG_LAYER_HPP_
@@ -0,0 +1,58 @@
+#ifndef YOLOV2LOSSLAYER_H
+#define YOLOV2LOSSLAYER_H
+
+#include <vector>
+#include <google/protobuf/repeated_field.h>
+
+#include "caffe/blob.hpp"
+#include "caffe/layer.hpp"
+#include "caffe/proto/caffe.pb.h"
+
+#include "caffe/layers/loss_layer.hpp"
+
+namespace caffe {
+    template <typename Dtype>  // The three helpers below are declarations only; their definitions are not part of this header.
+    Dtype Overlap(Dtype x1, Dtype w1, Dtype x2, Dtype w2);  // NOTE(review): presumably the 1-D overlap of two extents given as position/width pairs -- confirm
+    template <typename Dtype>
+    Dtype Calc_iou(const std::vector<Dtype>& box, const std::vector<Dtype>& truth);  // NOTE(review): presumably intersection-over-union of two boxes; element order of the vectors is not visible here
+    template <typename Dtype>
+    Dtype Calc_rmse(const std::vector<Dtype>& box, const std::vector<Dtype>& truth);  // NOTE(review): presumably a root-mean-square error between box and truth -- confirm
+    /**
+     * @brief Loss layer (derived from LossLayer) whose type() string is
+     *        "YoloV2Loss".
+     *
+     * Only the CPU forward/backward passes are declared in this header.
+     *
+     * NOTE(review): the constructor's initializer list covers the base class
+     * and diff_ only, so every scalar member below must be assigned elsewhere
+     * (presumably in LayerSetUp -- confirm in the implementation file).
+     * `seen` is also the only member without the trailing underscore used by
+     * the others.
+     */
+    template<typename Dtype>
+    class YoloV2LossLayer: public LossLayer<Dtype> {
+    public:
+        explicit YoloV2LossLayer(const LayerParameter& param)
+            : LossLayer<Dtype>(param), diff_() {}
+
+        virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
+              const vector<Blob<Dtype>*>& top);
+
+        virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
+              const vector<Blob<Dtype>*>& top);
+
+        virtual inline const char* type() const { return "YoloV2Loss"; }  // layer type string
+
+    protected:
+        virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom,
+              const vector<Blob<Dtype>*>& top);
+        virtual void Backward_cpu(const vector<Blob<Dtype>*>& top,
+              const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom);
+
+        vector<float> biases_;  // NOTE(review): presumably per-box prior sizes -- confirm against the layer parameter definition
+        int seen;  // not initialized by the constructor; naming differs from the other members
+        int side_;
+        int num_classes_;
+        int num_boxes_;
+        float box_scale_;  // the *_scale_ weights are stored as float regardless of Dtype
+        float class_scale_;
+        float object_scale_;
+        float noobject_scale_;
+        bool rescore_;
+        bool constraint_;
+        float thresh_;
+        
+        Blob<Dtype> diff_;  // value-initialized in the constructor's initializer list
+    };
+}
+
+#endif // YOLOV2LOSSLAYER_H
@@ -209,22 +209,24 @@ bool ReadRichImageToAnnotatedDatum(const string& filename,
     const string& labelname, const int height, const int width,
     const int min_dim, const int max_dim, const bool is_color,
     const std::string& encoding, const AnnotatedDatum_AnnotationType type,
-    const string& labeltype, const std::map<string, int>& name_to_label,
-    AnnotatedDatum* anno_datum);
+    const string& labeltype, const std::map<string,
+    int>& name_to_label, AnnotatedDatum* anno_datum,
+    const bool caffe_yolo = false);
 
 inline bool ReadRichImageToAnnotatedDatum(const string& filename,
     const string& labelname, const int height, const int width,
     const bool is_color, const std::string & encoding,
     const AnnotatedDatum_AnnotationType type, const string& labeltype,
-    const std::map<string, int>& name_to_label, AnnotatedDatum* anno_datum) {
+    const std::map<string, int>& name_to_label, AnnotatedDatum* anno_datum,
+    const bool caffe_yolo = false) {
   return ReadRichImageToAnnotatedDatum(filename, labelname, height, width, 0, 0,
-                      is_color, encoding, type, labeltype, name_to_label,
-                      anno_datum);
+                      is_color, encoding, type, labeltype,
+                      name_to_label, anno_datum, caffe_yolo);
 }
 
 bool ReadXMLToAnnotatedDatum(const string& labelname, const int img_height,
     const int img_width, const std::map<string, int>& name_to_label,
-    AnnotatedDatum* anno_datum);
+    AnnotatedDatum* anno_datum, const bool caffe_yolo = false);
 
 bool ReadJSONToAnnotatedDatum(const string& labelname, const int img_height,
     const int img_width, const std::map<string, int>& name_to_label,
 
@@ -0,0 +1,65 @@
+#ifndef YOLO_PREPROCESS_HPP
+#define YOLO_PREPROCESS_HPP
+
+#ifdef USE_OPENCV
+#include <opencv2/core/core.hpp>
+#include <opencv2/imgproc/imgproc.hpp>
+#endif  // USE_OPENCV
+
+#include "caffe/common.hpp"
+#include "caffe/proto/caffe.pb.h"
+
+namespace caffe {
+/*
+ * Declarations of the helper functions for this YOLO preprocessing header;
+ * none of the definitions are part of this file.
+ *
+ * The functions taking `float *m` / `float *im` receive a raw float buffer
+ * together with its width, height and channel count. NOTE(review): the
+ * memory layout of that buffer is not visible from these declarations --
+ * confirm against the definitions before relying on it.
+ *
+ * The helpers taking or returning cv::Mat are declared only when USE_OPENCV
+ * is defined.
+ */
+float rand_uniform(float min, float max);
+
+float rand_scale(float value_lower, float value_upper);
+
+void set_pixel(float *m, int w, int h, int ch, int x, int y, int c, float val);
+
+void set_pixel_with_scaling(float *m, int w, int h, int ch, int x, int y, int c,
+                            float val, float scale);
+
+float get_pixel(float *m, int w, int h, int ch, int x, int y, int c);
+
+void scale_image_channel(float *im, int w, int h, int ch, int c, float v);
+
+float three_way_max(float a, float b, float c);
+
+float three_way_min(float a, float b, float c);
+
+void rgb_to_hsv(float *im, int width, int height, int channels);
+
+void hsv_to_rgb(float *im, int width, int height, int channels);
+
+void constrain_image(float *im, int w, int h, int c);
+
+float constrain(float min, float max, float a);  // note the argument order: both bounds come before the value `a`
+
+void distort_image(float *im, int w, int h, int c, float hue, float sat,
+                   float val);
+
+void random_distort_image(float *im, int w, int h, int c, float hue,
+                          float saturation_lower, float saturation_upper,
+                          float exposure_lower, float exposure_upper);
+
+void flip_image(float *im, int w, int h, int c);
+
+#ifdef USE_OPENCV
+void bgr_to_rgb(cv::Mat im);  // NOTE(review): cv::Mat is passed by value; a cv::Mat copy shares pixel data, so in-place edits would reach the caller -- confirm intent
+
+cv::Mat hwc_to_chw(cv::Mat im);
+
+float get_pixel_image(const cv::Mat& m, int x, int y, int c);
+
+float get_pixel_extend(const cv::Mat& m, int x, int y, int c);
+
+float bilinear_interpolate(const cv::Mat& im, float x, float y, int c);
+
+void place_image(cv::Mat im, int w, int h, int dx, int dy, float *resized_image,
+                 int resize_w, int resize_h, float scale);
+#endif  // USE_OPENCV
+
+}  // namespace caffe
+
+#endif  // YOLO_PREPROCESS_HPP
@@ -47,7 +47,8 @@
       help="Randomly shuffle the order of images and their labels.")
   parser.add_argument("--check-label", default = False, action = "store_true",
       help="Check that there is no duplicated name/label.")
-
+  parser.add_argument("--caffe-yolo", default = False, action = "store_true",
+      help="Generate data to train converted Yolo model on Caffe.")
   args = parser.parse_args()
   root_dir = args.root
   list_file = args.listfile
@@ -69,6 +70,7 @@
   resize_width = args.resize_width
   shuffle = args.shuffle
   check_label = args.check_label
+  caffe_yolo = args.caffe_yolo
 
   # check if root directory exists
   if not os.path.exists(root_dir):
@@ -134,10 +136,11 @@
         " --encode_type={}" \
         " --encoded={}" \
         " --gray={}" \
+        " --caffe_yolo={}" \
         " {} {} {}" \
         .format(caffe_root, anno_type, label_type, label_map_file, check_label,
             min_dim, max_dim, resize_height, resize_width, backend, shuffle,
-            check_size, encode_type, encoded, gray, root_dir, list_file, out_dir)
+            check_size, encode_type, encoded, gray, caffe_yolo, root_dir, list_file, out_dir)
   elif anno_type == "classification":
     cmd = "{}/build/tools/convert_annoset" \
         " --anno_type={}" \