feat: Add train and predict with yolo (#20)

rudeuns · web-flow · commit 397e5f4d3294 · 2024-01-08T21:15:22.000+09:00
#17
diff --git a/utils/coco2yolo.py b/utils/coco2yolo.py
@@ -0,0 +1,49 @@
+import os
+import json
+
+def main():
+    # 저장할 경로 입력
+    save_path = '/data/ephemeral/home/dataset/yolo/labels'
+    if not os.path.isdir('/data/ephemeral/home/dataset/yolo'):
+        os.mkdir('/data/ephemeral/home/dataset/yolo')
+    if not os.path.isdir(save_path):
+        os.mkdir(save_path)
+
+    # 읽어올 annotation 경로 입력
+    json_path = '/data/ephemeral/home/dataset/train.json'
+    with open(json_path, 'r') as f:
+        json_data = json.load(f)
+
+    print('start')
+
+    image_info_dict = dict()
+    for image_info in json_data['images']:
+        image_id = image_info['id']
+        image_info_dict[image_id] = image_info
+
+    yolo_info_dict = dict()
+    for anno_info in json_data['annotations']:
+        image_id = anno_info['image_id']
+        image_info = image_info_dict[image_id]
+        image_ww, image_hh = image_info['width'], image_info['height']
+        file_name = os.path.splitext(os.path.basename(image_info['file_name']))[0]
+
+        cate_id = anno_info['category_id']
+        xmin, ymin, ww, hh = anno_info['bbox']
+        cx, cy = xmin + (ww / 2), ymin + (hh / 2)
+        cx, cy, ww, hh = cx / image_ww, cy / image_hh, ww / image_ww, hh / image_hh
+
+        if file_name not in yolo_info_dict:
+            yolo_info_dict[file_name] = f'{cate_id} {cx} {cy} {ww} {hh}\n'
+        else:
+            yolo_info_dict[file_name] += f'{cate_id} {cx} {cy} {ww} {hh}\n'
+
+    for k, v in yolo_info_dict.items():
+        label_path = os.path.join(save_path, k + '.txt')
+        with open(label_path, 'w') as f:
+            f.write(v)
+
+    print('end')
+
+# Run the conversion only when this file is executed as a script.
+if __name__ == '__main__':
+    main()
diff --git a/yolo/custom.yaml b/yolo/custom.yaml
@@ -0,0 +1,125 @@
+# Ultralytics YOLO 🚀, AGPL-3.0 license
+# Default training settings and hyperparameters for medium-augmentation COCO training
+
+task: detect  # (str) YOLO task, i.e. detect, segment, classify, pose
+mode: train  # (str) YOLO mode, i.e. train, val, predict, export, track, benchmark
+
+# Train settings -------------------------------------------------------------------------------------------------------
+model:  # (str, optional) path to model file, i.e. yolov8n.pt, yolov8n.yaml
+data:  # (str, optional) path to data file, i.e. coco128.yaml
+epochs: 100  # (int) number of epochs to train for
+time:  # (float, optional) number of hours to train for, overrides epochs if supplied
+patience: 50  # (int) epochs to wait for no observable improvement for early stopping of training
+batch: 16  # (int) number of images per batch (-1 for AutoBatch)
+imgsz: 640  # (int | list) input images size as int for train and val modes, or list[w,h] for predict and export modes
+save: True  # (bool) save train checkpoints and predict results
+save_period: -1 # (int) Save checkpoint every x epochs (disabled if < 1)
+cache: False  # (bool) True/ram, disk or False. Use cache for data loading
+device:  # (int | str | list, optional) device to run on, i.e. cuda device=0 or device=0,1,2,3 or device=cpu
+workers: 8  # (int) number of worker threads for data loading (per RANK if DDP)
+project:  # (str, optional) project name
+name:  # (str, optional) experiment name, results saved to 'project/name' directory
+exist_ok: False  # (bool) whether to overwrite existing experiment
+pretrained: True  # (bool | str) whether to use a pretrained model (bool) or a model to load weights from (str)
+optimizer: auto  # (str) optimizer to use, choices=[SGD, Adam, Adamax, AdamW, NAdam, RAdam, RMSProp, auto]
+verbose: True  # (bool) whether to print verbose output
+seed: 0  # (int) random seed for reproducibility
+deterministic: True  # (bool) whether to enable deterministic mode
+single_cls: False  # (bool) train multi-class data as single-class
+rect: False  # (bool) rectangular training if mode='train' or rectangular validation if mode='val'
+cos_lr: False  # (bool) use cosine learning rate scheduler
+close_mosaic: 10  # (int) disable mosaic augmentation for final epochs (0 to disable)
+resume: False  # (bool) resume training from last checkpoint
+amp: True  # (bool) Automatic Mixed Precision (AMP) training, choices=[True, False], True runs AMP check
+fraction: 1.0  # (float) dataset fraction to train on (default is 1.0, all images in train set)
+profile: False  # (bool) profile ONNX and TensorRT speeds during training for loggers
+freeze: None  # (int | list, optional) freeze first n layers, or freeze list of layer indices during training
+multi_scale: False   # (bool) Whether to use multi-scale during training
+# Segmentation
+overlap_mask: True  # (bool) masks should overlap during training (segment train only)
+mask_ratio: 4  # (int) mask downsample ratio (segment train only)
+# Classification
+dropout: 0.0  # (float) use dropout regularization (classify train only)
+
+# Val/Test settings ----------------------------------------------------------------------------------------------------
+val: True  # (bool) validate/test during training
+split: val  # (str) dataset split to use for validation, i.e. 'val', 'test' or 'train'
+save_json: False  # (bool) save results to JSON file
+save_hybrid: False  # (bool) save hybrid version of labels (labels + additional predictions)
+conf: 0.05 # (float, optional) object confidence threshold for detection (default 0.25 predict, 0.001 val)
+iou: 0.5  # (float) intersection over union (IoU) threshold for NMS
+max_det: 300  # (int) maximum number of detections per image
+half: False  # (bool) use half precision (FP16)
+dnn: False  # (bool) use OpenCV DNN for ONNX inference
+plots: True  # (bool) save plots and images during train/val
+
+# Predict settings -----------------------------------------------------------------------------------------------------
+source:  # (str, optional) source directory for images or videos
+vid_stride: 1  # (int) video frame-rate stride
+stream_buffer: False  # (bool) buffer all streaming frames (True) or return the most recent frame (False)
+visualize: False  # (bool) visualize model features
+augment: False  # (bool) apply image augmentation to prediction sources
+agnostic_nms: False  # (bool) class-agnostic NMS
+classes:  # (int | list[int], optional) filter results by class, i.e. classes=0, or classes=[0,2,3]
+retina_masks: False  # (bool) use high-resolution segmentation masks
+embed:  # (list[int], optional) return feature vectors/embeddings from given layers
+
+# Visualize settings ---------------------------------------------------------------------------------------------------
+show: False  # (bool) show predicted images and videos if environment allows
+save_frames: False  # (bool) save predicted individual video frames
+save_txt: False  # (bool) save results as .txt file
+save_conf: False  # (bool) save results with confidence scores
+save_crop: False  # (bool) save cropped images with results
+show_labels: True  # (bool) show prediction labels, i.e. 'person'
+show_conf: True  # (bool) show prediction confidence, i.e. '0.99'
+show_boxes: True  # (bool) show prediction boxes
+line_width:   # (int, optional) line width of the bounding boxes. Scaled to image size if None.
+
+# Export settings ------------------------------------------------------------------------------------------------------
+format: torchscript  # (str) format to export to, choices at https://docs.ultralytics.com/modes/export/#export-formats
+keras: False  # (bool) use Keras
+optimize: False  # (bool) TorchScript: optimize for mobile
+int8: False  # (bool) CoreML/TF INT8 quantization
+dynamic: False  # (bool) ONNX/TF/TensorRT: dynamic axes
+simplify: False  # (bool) ONNX: simplify model
+opset:  # (int, optional) ONNX: opset version
+workspace: 4  # (int) TensorRT: workspace size (GB)
+nms: False  # (bool) CoreML: add NMS
+
+# Hyperparameters ------------------------------------------------------------------------------------------------------
+lr0: 0.01  # (float) initial learning rate (i.e. SGD=1E-2, Adam=1E-3)
+lrf: 0.01  # (float) final learning rate (lr0 * lrf)
+momentum: 0.937  # (float) SGD momentum/Adam beta1
+weight_decay: 0.0005  # (float) optimizer weight decay 5e-4
+warmup_epochs: 3.0  # (float) warmup epochs (fractions ok)
+warmup_momentum: 0.8  # (float) warmup initial momentum
+warmup_bias_lr: 0.1  # (float) warmup initial bias lr
+box: 7.5  # (float) box loss gain
+cls: 0.5  # (float) cls loss gain (scale with pixels)
+dfl: 1.5  # (float) dfl loss gain
+pose: 12.0  # (float) pose loss gain
+kobj: 1.0  # (float) keypoint obj loss gain
+label_smoothing: 0.0  # (float) label smoothing (fraction)
+nbs: 64  # (int) nominal batch size
+hsv_h: 0.015  # (float) image HSV-Hue augmentation (fraction)
+hsv_s: 0.7  # (float) image HSV-Saturation augmentation (fraction)
+hsv_v: 0.4  # (float) image HSV-Value augmentation (fraction)
+degrees: 0.0  # (float) image rotation (+/- deg)
+translate: 0.1  # (float) image translation (+/- fraction)
+scale: 0.5  # (float) image scale (+/- gain)
+shear: 0.0  # (float) image shear (+/- deg)
+perspective: 0.0  # (float) image perspective (+/- fraction), range 0-0.001
+flipud: 0.0  # (float) image flip up-down (probability)
+fliplr: 0.5  # (float) image flip left-right (probability)
+mosaic: 1.0  # (float) image mosaic (probability)
+mixup: 0.0  # (float) image mixup (probability)
+copy_paste: 0.0  # (float) segment copy-paste (probability)
+auto_augment: randaugment  # (str) auto augmentation policy for classification (randaugment, autoaugment, augmix)
+erasing: 0.4  # (float) probability of random erasing during classification training (0-1)
+crop_fraction: 1.0  # (float) image crop fraction for classification evaluation/inference (0-1)
+
+# Custom config.yaml ---------------------------------------------------------------------------------------------------
+cfg:  # (str, optional) for overriding defaults.yaml
+
+# Tracker settings ------------------------------------------------------------------------------------------------------
+tracker: botsort.yaml  # (str) tracker type, choices=[botsort.yaml, bytetrack.yaml]
diff --git a/yolo/datasets/recycle_det_42_1.yaml b/yolo/datasets/recycle_det_42_1.yaml
@@ -0,0 +1,15 @@
+train: /data/ephemeral/home/dataset/yolo/split/train_42_fold_1.txt 
+val: /data/ephemeral/home/dataset/yolo/split/val_42_fold_1.txt 
+
+nc: 10
+names:
+  0: General trash
+  1: Paper
+  2: Paper pack
+  3: Metal
+  4: Glass
+  5: Plastic
+  6: Styrofoam
+  7: Plastic bag
+  8: Battery
+  9: Clothing
diff --git a/yolo/datasets/recycle_det_42_2.yaml b/yolo/datasets/recycle_det_42_2.yaml
@@ -0,0 +1,15 @@
+train: /data/ephemeral/home/dataset/yolo/split/train_42_fold_2.txt 
+val: /data/ephemeral/home/dataset/yolo/split/val_42_fold_2.txt 
+
+nc: 10
+names:
+  0: General trash
+  1: Paper
+  2: Paper pack
+  3: Metal
+  4: Glass
+  5: Plastic
+  6: Styrofoam
+  7: Plastic bag
+  8: Battery
+  9: Clothing
diff --git a/yolo/datasets/recycle_det_42_3.yaml b/yolo/datasets/recycle_det_42_3.yaml
@@ -0,0 +1,15 @@
+train: /data/ephemeral/home/dataset/yolo/split/train_42_fold_3.txt 
+val: /data/ephemeral/home/dataset/yolo/split/val_42_fold_3.txt 
+
+nc: 10
+names:
+  0: General trash
+  1: Paper
+  2: Paper pack
+  3: Metal
+  4: Glass
+  5: Plastic
+  6: Styrofoam
+  7: Plastic bag
+  8: Battery
+  9: Clothing
diff --git a/yolo/datasets/recycle_det_42_4.yaml b/yolo/datasets/recycle_det_42_4.yaml
@@ -0,0 +1,15 @@
+train: /data/ephemeral/home/dataset/yolo/split/train_42_fold_4.txt 
+val: /data/ephemeral/home/dataset/yolo/split/val_42_fold_4.txt 
+
+nc: 10
+names:
+  0: General trash
+  1: Paper
+  2: Paper pack
+  3: Metal
+  4: Glass
+  5: Plastic
+  6: Styrofoam
+  7: Plastic bag
+  8: Battery
+  9: Clothing
diff --git a/yolo/datasets/recycle_det_42_5.yaml b/yolo/datasets/recycle_det_42_5.yaml
@@ -0,0 +1,15 @@
+train: /data/ephemeral/home/dataset/yolo/split/train_42_fold_5.txt 
+val: /data/ephemeral/home/dataset/yolo/split/val_42_fold_5.txt 
+
+nc: 10
+names:
+  0: General trash
+  1: Paper
+  2: Paper pack
+  3: Metal
+  4: Glass
+  5: Plastic
+  6: Styrofoam
+  7: Plastic bag
+  8: Battery
+  9: Clothing
diff --git a/yolo/predict.py b/yolo/predict.py
@@ -0,0 +1,51 @@
+from ultralytics import YOLO
+import argparse
+import pandas as pd
+import os
+
+def main(opt):
+    model = YOLO(opt.weight)
+    results = model(opt.source)
+
+    df = pd.DataFrame(columns=['PredictionString', 'image_id'])
+    prediction_arr = []
+    
+    for result in results:
+        for box in result.boxes:
+            c = int(box.cls)  
+            confidence = float(box.conf)
+            *xyxy, = box.xyxy
+
+            prediction_arr.append(str(c))
+            prediction_arr.append(str(confidence))
+            for coord in list(map(float, xyxy[0])):
+                prediction_arr.append(str(coord))
+
+        paths = result.path.split('/')
+        image_id = '/'.join(paths[-2:])
+        prediction_str = ' '.join(prediction_arr)
+
+        df = df.append(pd.DataFrame({'PredictionString':[prediction_str], 'image_id':[image_id]}), ignore_index=True)
+        prediction_arr = []
+        
+    save_dir = opt.save_dir
+    name = opt.name
+    if not os.path.isdir(save_dir):
+        os.mkdir(save_dir)
+
+    df.to_csv(os.path.join(save_dir, f'{name}.csv'), index=False)
+
+
+def parse_opt():
+    parser = argparse.ArgumentParser()
+
+    parser.add_argument('--weight', type=str, required=True)
+    parser.add_argument('--source', type=str, default='/data/ephemeral/home/dataset/test')
+    parser.add_argument('--save-dir', type=str, default='/data/ephemeral/home/level2-objectdetection-cv-03/yolo/results')
+    parser.add_argument('--name', type=str, required=True)
+
+    return parser.parse_args()
+
+# Script entry point: parse the CLI options, then run inference with them.
+if __name__ == '__main__':
+    opt = parse_opt()
+    main(opt)
diff --git a/yolo/predict.sh b/yolo/predict.sh
@@ -0,0 +1,5 @@
+python ./predict.py --weight '/data/ephemeral/home/level2-objectdetection-cv-03/yolo/runs/detect/yolov8s_42_1_e50_SGD/weights/best.pt' --name yolov8s_42_1_e50_SGD;
+python ./predict.py --weight '/data/ephemeral/home/level2-objectdetection-cv-03/yolo/runs/detect/yolov8s_42_2_e50_SGD/weights/best.pt' --name yolov8s_42_2_e50_SGD;
+python ./predict.py --weight '/data/ephemeral/home/level2-objectdetection-cv-03/yolo/runs/detect/yolov8s_42_3_e50_SGD/weights/best.pt' --name yolov8s_42_3_e50_SGD;
+python ./predict.py --weight '/data/ephemeral/home/level2-objectdetection-cv-03/yolo/runs/detect/yolov8s_42_4_e50_SGD/weights/best.pt' --name yolov8s_42_4_e50_SGD;
+python ./predict.py --weight '/data/ephemeral/home/level2-objectdetection-cv-03/yolo/runs/detect/yolov8s_42_5_e50_SGD/weights/best.pt' --name yolov8s_42_5_e50_SGD;
diff --git a/yolo/train.py b/yolo/train.py
@@ -0,0 +1,28 @@
+from ultralytics import YOLO
+import argparse
+
+def main(opt):
+    model = YOLO()
+    model.train(cfg='./custom.yaml', **vars(opt))
+
+def parse_opt():
+    parser = argparse.ArgumentParser()
+
+    parser.add_argument('--model', type=str, required=True)
+    parser.add_argument('--data', type=str, required=True)
+    parser.add_argument('--epochs', type=int, default=50)
+    parser.add_argument('--patience', type=int, default=50)
+    parser.add_argument('--batch', '--batch-size', type=int, default=16)
+    parser.add_argument('--imgsz', '--img-size', type=int, default=640)
+    parser.add_argument('--workers', type=int, default=8)
+    parser.add_argument('--project', type=str, default='')
+    parser.add_argument('--name', type=str, default='')
+    parser.add_argument('--optimizer', type=str, default='SGD')
+    parser.add_argument('--conf', type=float, default=0.05)
+    parser.add_argument('--iou', type=float, default=0.5)
+
+    return parser.parse_args()
+
+# Script entry point: parse the CLI options, then start training with them.
+if __name__ == '__main__':
+    opt = parse_opt()
+    main(opt)
diff --git a/yolo/train.sh b/yolo/train.sh
@@ -0,0 +1,5 @@
+python ./train.py --model yolov8s.pt --data /data/ephemeral/home/level2-objectdetection-cv-03/yolo/datasets/recycle_det_42_1.yaml --name yolov8s_42_1_e50_SGD;
+python ./train.py --model yolov8s.pt --data /data/ephemeral/home/level2-objectdetection-cv-03/yolo/datasets/recycle_det_42_2.yaml --name yolov8s_42_2_e50_SGD;
+python ./train.py --model yolov8s.pt --data /data/ephemeral/home/level2-objectdetection-cv-03/yolo/datasets/recycle_det_42_3.yaml --name yolov8s_42_3_e50_SGD;
+python ./train.py --model yolov8s.pt --data /data/ephemeral/home/level2-objectdetection-cv-03/yolo/datasets/recycle_det_42_4.yaml --name yolov8s_42_4_e50_SGD;
+python ./train.py --model yolov8s.pt --data /data/ephemeral/home/level2-objectdetection-cv-03/yolo/datasets/recycle_det_42_5.yaml --name yolov8s_42_5_e50_SGD;