Moved files to fit new tfmodels file structure

jacob-zietek · jacob-zietek · commit aa724a5ee19c · 2023-02-10T16:32:49.000-05:00
diff --git a/official/projects/yolo/README.md b/official/projects/yolo/README.md
@@ -0,0 +1,93 @@
+DISCLAIMER: this YOLO implementation is still under development. No support will
+be provided during the development phase.
+
+# YOLO Object Detectors, You Only Look Once
+
+[![Paper](https://img.shields.io/badge/Paper-arXiv.1804.02767-B3181B?logo=arXiv)](https://arxiv.org/abs/1804.02767)
+[![Paper](https://img.shields.io/badge/Paper-arXiv.2004.10934-B3181B?logo=arXiv)](https://arxiv.org/abs/2004.10934)
+
+This repository is an unofficial implementation of the following papers.
+However, we spent painstaking hours ensuring that every aspect that we
+constructed matches the original papers and the original repository
+exactly.
+
+* YOLOv3: An Incremental Improvement: [YOLOv3: An Incremental Improvement](https://arxiv.org/abs/1804.02767)
+
+* YOLOv4: Optimal Speed and Accuracy of Object Detection: [YOLOv4: Optimal Speed and Accuracy of Object Detection](https://arxiv.org/abs/2004.10934)
+
+## Description
+
+YOLO v1, the original implementation, was released in 2015, providing a
+groundbreaking algorithm that would quickly process images and locate objects
+in a single pass through the detector. The original implementation used a
+backbone derived from state-of-the-art object classifiers of the time, like
+[GoogLeNet](https://arxiv.org/abs/1409.4842) and
+[VGG](https://arxiv.org/abs/1409.1556). More attention was given to the novel
+YOLO Detection head that allowed for Object Detection with a single pass of an
+image. Though limited, the network could predict up to 90 bounding boxes per
+image, and was tested for about 80 classes per box. Also, the model could only
+make predictions at one scale. These attributes caused YOLO v1 to be more
+limited and less versatile, so as the years passed, the developers continued to
+update and develop this model.
+
+YOLO v3 and v4 serve as the most up-to-date and capable versions of the YOLO
+network group. These models use a custom backbone called Darknet53 that uses
+knowledge gained from the ResNet paper to improve its predictions. The new
+backbone also allows for objects to be detected at multiple scales. As for the
+new detection head, the model now predicts the bounding boxes using a set of
+anchor box priors (Anchor Boxes) as suggestions. Multiscale predictions in
+combination with Anchor boxes allow for the network to make up to 1000 object
+predictions on a single image. Finally, the new loss function forces the network
+to make better predictions by using Intersection Over Union (IOU) to inform the
+model's confidence rather than relying on the mean squared error for the entire
+output.
+
+
+## Authors
+
+* Vishnu Samardh Banna ([@GitHub vishnubanna](https://github.com/vishnubanna))
+* Anirudh Vegesana ([@GitHub anivegesana](https://github.com/anivegesana))
+* Akhil Chinnakotla ([@GitHub The-Indian-Chinna](https://github.com/The-Indian-Chinna))
+* Tristan Yan ([@GitHub Tyan3001](https://github.com/Tyan3001))
+* Naveen Vivek ([@GitHub naveen-vivek](https://github.com/naveen-vivek))
+* Jacob Zietek ([@GitHub jacob-zietek](https://github.com/jacob-zietek))
+
+## Table of Contents
+
+* [Our Goal](#our-goal)
+* [Models in the library](#models-in-the-library)
+* [Requirements](#requirements)
+
+
+## Our Goal
+
+Our goal with this model conversion is to provide an implementation of the
+Backbone and YOLO Head. We have built the model in such a way that the YOLO
+head could be connected to a new, more powerful backbone if a person chose to.
+
+## Models in the library
+
+| Object Detectors | AP               | AP50             | Checkpoint Path  |
+| :--------------: | :--------------: | :--------------: | :--------------: |
+| Yolo-v3          |                  |                  |                  |
+| Yolo-v3 tiny     |                  |                  |                  |
+| Yolo-v3 spp      |                  |                  |                  |
+| Yolo-v4          |                  |                  |                  |
+| Yolo-v4 tiny     | 21.21            | 41.69            |                  |
+| Yolo-v4 csp      |                  |                  |                  |
+| Yolo-v4 large    |                  |                  |                  |
+
+| Classifiers      |
+| :--------------: |
+| Darknet53        |
+| CSPDarknet53     |
+
+## Models Zoo
+
+## Requirements
+[![TensorFlow 2.6](https://img.shields.io/badge/TensorFlow-2.6-FF6F00?logo=tensorflow)](https://github.com/tensorflow/tensorflow/releases/tag/v2.6.0)
+[![Python 3.8](https://img.shields.io/badge/Python-3.8-3776AB)](https://www.python.org/downloads/release/python-380/)
+
+
+DISCLAIMER: this YOLO implementation is still under development. No support
+will be provided during the development phase.
diff --git a/official/projects/yolo/configs/experiments/yolov4/yolov4_tiny_416_tpu.yaml b/official/projects/yolo/configs/experiments/yolov4/yolov4_tiny_416_tpu.yaml
@@ -0,0 +1,142 @@
+# --experiment_type=yolo_darknet
+# 21.21 AP
+# 41.68 AP50
+# 19.12 AP75
+# 29.59 APl
+# 23.94 APm
+# 9.67 APs
+
+runtime:  # execution settings for this experiment
+  distribution_strategy: tpu  # matches the `_tpu` suffix in this file's name
+  mixed_precision_dtype: float32  # same dtype as train_data/validation_data below
+task:  # model, loss, and input-pipeline settings for the YOLOv4-tiny experiment
+  smart_bias_lr: 0.0
+  model:
+    darknet_based_model: true
+    input_size: [416, 416, 3]  # presumably [height, width, channels] -- TODO confirm
+    backbone:
+      type: 'darknet'
+      darknet:
+        model_id: 'cspdarknettiny'
+        max_level: 5  # with min_level 4 this spans two levels (4 and 5)
+        min_level: 4
+    decoder:
+      type: yolo_decoder
+      yolo_decoder:
+        version: v4
+        type: tiny
+    head:
+      smart_bias: true
+    detection_generator:
+      box_type:
+        'all': original  # 'all' presumably applies the value to every level -- confirm
+      scale_xy:
+        'all': 1.05
+      max_boxes: 300  # same value as parser.max_num_instances below
+      nms_type: iou
+      iou_thresh: 0.001
+      nms_thresh: 0.60
+    loss:
+      use_scaled_loss: false
+      box_loss_type:
+        'all': ciou
+      ignore_thresh:
+        'all': 0.7
+      iou_normalizer:
+        'all': 0.07
+      cls_normalizer:
+        'all': 1.0
+      object_normalizer:
+        'all': 1.0
+      objectness_smooth:
+        'all': 0.0
+      max_delta:
+        'all': .inf  # YAML float infinity; presumably means "no cap" -- confirm
+    norm_activation:
+      activation: leaky
+      norm_epsilon: 0.00001
+      norm_momentum: 0.99
+      use_sync_bn: true
+    num_classes: 80
+    anchor_boxes:
+      anchors_per_scale: 3  # 6 boxes below / 3 per scale = 2 scales
+      boxes: [box: [10, 14], box: [23, 27], box: [37, 58],
+              box: [81, 82], box: [135, 169], box: [344, 319]]
+  train_data:
+    prefetch_buffer_size: 32
+    global_batch_size: 512
+    dtype: float32
+    input_path: 'gs://cam2-datasets/coco/train*'
+    is_training: true
+    drop_remainder: true
+    seed: 1000
+    parser:
+      mosaic:
+        mosaic_frequency: 0.0  # presumably disables mosaic augmentation -- confirm
+        mixup_frequency: 0.0  # presumably disables mixup augmentation -- confirm
+      max_num_instances: 300
+      letter_box: false
+      random_flip: true
+      aug_rand_saturation: 1.5
+      aug_rand_brightness: 1.5
+      aug_rand_hue: 0.1
+      aug_scale_min: 0.50
+      aug_scale_max: 1.5
+      aug_rand_translate: 0.0
+      jitter: 0.3
+      area_thresh: 0.0
+      random_pad: true
+      use_tie_breaker: false
+      best_match_only: false
+      anchor_thresh: 1.0
+  validation_data:
+    prefetch_buffer_size: 32
+    global_batch_size: 8
+    dtype: float32
+    input_path: 'gs://cam2-datasets/coco/val*'
+    is_training: false
+    drop_remainder: true
+    parser:  # these five keys carry the same values as in train_data.parser
+      max_num_instances: 300
+      letter_box: false
+      use_tie_breaker: false
+      best_match_only: false
+      anchor_thresh: 1.0
+  weight_decay: 0.000  # note: sgd_torch.weight_decay under trainer is 0.0005
+  init_checkpoint: null
+  init_checkpoint_modules: null
+  annotation_file: null
+trainer:  # training loop, checkpointing, and optimizer schedule
+  best_checkpoint_eval_metric: 'AP'
+  best_checkpoint_export_subdir: 'best_ckpt'
+  best_checkpoint_metric_comp: 'higher'
+  train_steps: 553126
+  validation_steps: 625  # 625 steps x validation global_batch_size 8 = 5000 examples
+  steps_per_loop: 920
+  summary_interval: 920  # equal to steps_per_loop
+  validation_interval: 9200  # 10 x steps_per_loop
+  checkpoint_interval: 920  # equal to steps_per_loop
+  optimizer_config:
+    ema:
+      average_decay: 0.9998
+      trainable_weights_only: false
+      dynamic_decay: true
+    learning_rate:
+      type: stepwise
+      stepwise:
+        boundaries: [442500, 497814]  # about 80% and 90% of train_steps
+        name: PiecewiseConstantDecay
+        values: [0.04176, 0.004176, 0.0004176]  # each value is 10x smaller than the last
+    optimizer:
+      type: sgd_torch
+      sgd_torch:
+        momentum: 0.9
+        momentum_start: 0.9
+        nesterov: true
+        warmup_steps: 2000  # same value as warmup.linear.warmup_steps below
+        weight_decay: 0.0005
+        name: SGD
+    warmup:
+      type: 'linear'
+      linear:
+        warmup_steps: 2000