Mikhail11235
diff --git a/‎.gitignore‎
Lines changed: 4 additions & 0 deletions b/‎.gitignore‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎api/m1_yolo/Dockerfile‎
Lines changed: 21 additions & 0 deletions b/‎api/m1_yolo/Dockerfile‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎api/m1_yolo/app/app.py‎
Lines changed: 26 additions & 0 deletions b/‎api/m1_yolo/app/app.py‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎api/m1_yolo/app/config.py‎
Lines changed: 26 additions & 0 deletions b/‎api/m1_yolo/app/config.py‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎api/m1_yolo/app/yolo.py‎
Lines changed: 122 additions & 0 deletions b/‎api/m1_yolo/app/yolo.py‎
Lines changed: 122 additions & 0 deletions
diff --git a/‎api/m1_yolo/model/coco.names‎
Lines changed: 80 additions & 0 deletions b/‎api/m1_yolo/model/coco.names‎
Lines changed: 80 additions & 0 deletions
@@ -0,0 +1,4 @@
+.idea
+*.DS_Store
+*.pyc
+*.log
@@ -0,0 +1,21 @@
+FROM python:3.7
+
+WORKDIR /opt/object_detection_video
+
+# Refresh the package index and install OpenCV's native runtime libraries in
+# ONE layer, so a cached (stale) index is never combined with a later install.
+RUN apt-get update \
+    && apt-get install -y ffmpeg libsm6 libxext6 \
+    && rm -rf /var/lib/apt/lists/*
+
+# Install Python dependencies before copying the sources so this layer stays
+# cached when only application code changes.
+RUN /usr/local/bin/python -m pip install --upgrade pip
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+COPY app /opt/object_detection_video/app/
+COPY model /opt/object_detection_video/model/
+
+# app/config.py stores uploads under videos/ and writes the result under
+# output/. Neither directory is copied into the image, so create them here;
+# otherwise the first request fails when it tries to open a file inside them.
+RUN mkdir -p /opt/object_detection_video/videos /opt/object_detection_video/output
+
+# Document the port uvicorn actually listens on (see CMD).
+EXPOSE 9000
+# Exec form: uvicorn runs as PID 1 and receives SIGTERM directly on `docker stop`.
+CMD ["uvicorn", "app.app:app", "--host", "0.0.0.0", "--port", "9000"]
+
@@ -0,0 +1,26 @@
+import fastapi
+from .config import VIDEO_PATH, OUTPUT_PATH
+from .yolo import detect_objects
+
+
+app = fastapi.FastAPI()
+
+
+@app.post("/m1_yolo")
+async def root(video: fastapi.UploadFile = fastapi.File(...), confidence: float = 0.5,
+               non_max_suppression: float = 0.5, video_source: str = "nodb"):
+    """Run YOLO object detection on an uploaded video and return the annotated video.
+
+    The upload is saved under VIDEO_PATH, processed by detect_objects (which writes
+    its result to OUTPUT_PATH), and the resulting file is sent back as an attachment.
+
+    Args:
+        video: the uploaded video file.
+        confidence: minimum class score for a detection to be kept.
+        non_max_suppression: threshold handed to non-max suppression.
+        video_source: "db" is reserved for loading the video from a database and is
+            not implemented; any other value uses the uploaded file.
+
+    Returns:
+        A fastapi.Response whose body is the bytes of the annotated MP4.
+
+    Raises:
+        fastapi.HTTPException: 501 when video_source is "db", 400 when the upload
+            carries no usable filename.
+    """
+    # Local imports keep this handler self-contained; both are standard library.
+    import os
+    import shutil
+
+    if video_source == "db":
+        # This branch used to fall through and hit an unbound `test_video` below.
+        raise fastapi.HTTPException(status_code=501, detail="video_source='db' is not implemented")
+
+    # The filename is client-controlled: keep only its last path component so it
+    # cannot point outside VIDEO_PATH.
+    test_video = os.path.basename(video.filename or "")
+    if test_video in ("", ".", ".."):
+        raise fastapi.HTTPException(status_code=400, detail="uploaded video has no usable filename")
+
+    input_path = VIDEO_PATH + test_video
+    with open(input_path, "wb") as f:
+        # Stream the upload to disk instead of loading it into memory in one piece.
+        shutil.copyfileobj(video.file, f)
+
+    print("[INFO] Processing Video....")
+    total, elap = detect_objects(input_path, confidence, non_max_suppression)
+
+    # `with` guarantees the handle is closed even if reading fails.
+    with open(OUTPUT_PATH, 'rb') as output_video:
+        video_bytes = output_video.read()
+
+    print(f"[INFO] The video has total of {total} frames")
+    print(f"[INFO] Time required to process a single frame: {round(elap / 60, 2)} minutes")
+    print(f"[INFO] Time required to process the entire video: {round((elap * total) / 60, 2)} minutes")
+    return fastapi.Response(content=video_bytes, media_type="video/mp4", headers={"filename": "output.mp4",
+                                                                                  "content-disposition": "attachment"})
@@ -0,0 +1,26 @@
+import numpy as np
+
+
+# Root of the application inside the Docker image (the Dockerfile's WORKDIR).
+DIR_PATH = '/opt/object_detection_video/'
+
+# Locations relative to DIR_PATH.
+model = 'model/yolov3.weights'
+model_config = 'model/yolov3.cfg'
+labels = 'model/coco.names'
+input_videos = 'videos/'
+output_video = 'output/output_video.mp4'
+
+# Absolute paths used by the rest of the application.
+MODEL_PATH = DIR_PATH + model
+CONFIG_PATH = DIR_PATH + model_config
+LABEL_PATH = DIR_PATH + labels
+OUTPUT_PATH = DIR_PATH + output_video
+# INPUT_PATH and VIDEO_PATH name the same directory; both are kept so that
+# existing imports of either name keep working.
+INPUT_PATH = DIR_PATH + input_videos
+VIDEO_PATH = DIR_PATH + input_videos
+
+# Class names, one per line, in the order of the network's class indices.
+# Read inside `with` so the file handle is closed as soon as the list is built.
+with open(LABEL_PATH, encoding='utf-8') as _label_file:
+    LABELS = _label_file.read().strip().split('\n')
+
+# One random colour per class, drawn once at import time.
+COLORS = np.random.randint(0, 255, size=(len(LABELS), 3), dtype='uint8')
+
+DEFAULT_CONFIDENCE = 0.5
+NMS_THRESHOLD = 0.3
+
@@ -0,0 +1,122 @@
+import numpy as np
+import imutils
+import cv2
+import time
+from .config import MODEL_PATH, CONFIG_PATH, OUTPUT_PATH, COLORS, LABELS
+
+
+def _extract_detections(layer_outputs, frame_width, frame_height, confidence_threshold):
+    """Collect boxes, confidences and class ids of detections above the confidence threshold."""
+    boxes = []
+    confidences = []
+    class_ids = []
+    # YOLO reports the box centre (x, y) followed by width and height, all
+    # relative to the image size; this scales them back to pixels.
+    scale = np.array([frame_width, frame_height, frame_width, frame_height])
+
+    for output in layer_outputs:
+        for detection in output:
+            # entries from index 5 onwards are the per-class scores
+            scores = detection[5:]
+            class_id = int(np.argmax(scores))
+            confidence = scores[class_id]
+
+            # filter out weak detections
+            if confidence > confidence_threshold:
+                (center_x, center_y, width, height) = (detection[0:4] * scale).astype('int')
+
+                # convert the centre point to the top-left corner of the box
+                x = int(center_x - (width / 2))
+                y = int(center_y - (height / 2))
+
+                boxes.append([x, y, int(width), int(height)])
+                confidences.append(float(confidence))
+                class_ids.append(class_id)
+
+    return boxes, confidences, class_ids
+
+
+def _draw_detections(frame, boxes, confidences, class_ids, keep):
+    """Draw a rectangle and a "label: confidence" caption on frame for every index in keep."""
+    for i in keep:
+        (x, y, w, h) = boxes[i]
+        color = [int(c) for c in COLORS[class_ids[i]]]
+        cv2.rectangle(frame, (x, y), (x + w, y + h), color, 2)
+        text = f"{LABELS[class_ids[i]]}: {confidences[i]}"
+        cv2.putText(frame, text, (x, y - 5), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
+
+
+def detect_objects(video, confidence_threshold, nms_threshold):
+    """Run YOLO over every frame of a video and write an annotated copy to OUTPUT_PATH.
+
+    The network is loaded from CONFIG_PATH / MODEL_PATH through cv2.dnn on each call.
+    Every frame is turned into a 416x416 blob, passed through the network, filtered by
+    confidence and non-max suppression, annotated, and written with the "mp4v" codec.
+
+    Args:
+        video: source handed to cv2.VideoCapture (the caller passes a file path).
+        confidence_threshold: minimum class score for a detection to be kept.
+        nms_threshold: threshold handed to cv2.dnn.NMSBoxes.
+
+    Returns:
+        (total, elap): total is the frame count reported by the capture, or -1 when it
+        cannot be read; elap is the duration in seconds of the network forward pass on
+        the first frame.
+
+    Raises:
+        ValueError: if nothing was written, i.e. no frame could be read from `video`
+            or the video writer could not be set up.
+    """
+    # Coerce once so a threshold that arrives as a string still compares correctly.
+    confidence_threshold = float(confidence_threshold)
+    nms_threshold = float(nms_threshold)
+
+    # load YOLO from cv2.dnn and keep only the names of its output layers
+    net = cv2.dnn.readNetFromDarknet(CONFIG_PATH, MODEL_PATH)
+    layer_names = net.getLayerNames()
+    # Depending on the OpenCV version the indices come back as a flat or an Nx1
+    # array; flattening handles both.
+    output_layers = [layer_names[i - 1] for i in np.array(net.getUnconnectedOutLayers()).flatten()]
+
+    vs = cv2.VideoCapture(video)
+    writer = None
+    (W, H) = (None, None)
+    # Defined up front so the final return can never hit an unbound name.
+    elap = 0.0
+
+    # try/finally so the capture and the writer are released even when a frame fails.
+    try:
+        fps = vs.get(cv2.CAP_PROP_FPS)
+        writer_width = int(vs.get(cv2.CAP_PROP_FRAME_WIDTH))
+        writer_height = int(vs.get(cv2.CAP_PROP_FRAME_HEIGHT))
+
+        # determine the total number of frames in the video
+        try:
+            total = int(vs.get(cv2.CAP_PROP_FRAME_COUNT))
+            print(f"[INFO] {total} frames in the video")
+        except (cv2.error, ValueError, OverflowError):
+            print("[INFO] could not determine the number of frames in the video")
+            total = -1
+
+        # loop over all frames of the video
+        while True:
+            (grabbed, frame) = vs.read()
+
+            # no frame grabbed means the end of the video was reached
+            if not grabbed:
+                break
+            # remember the frame dimensions from the first frame
+            if W is None or H is None:
+                (H, W) = frame.shape[:2]
+
+            # build the blob and run a forward pass, timing only the network
+            blob = cv2.dnn.blobFromImage(frame, 1 / 255.0, (416, 416), swapRB=True, crop=False)
+            start = time.time()
+            net.setInput(blob)
+            layer_outputs = net.forward(output_layers)
+            end = time.time()
+
+            boxes, confidences, class_ids = _extract_detections(layer_outputs, W, H, confidence_threshold)
+
+            # apply non-max suppression and draw whatever survives it
+            idxs = cv2.dnn.NMSBoxes(boxes, confidences, confidence_threshold, nms_threshold)
+            if len(idxs) > 0:
+                _draw_detections(frame, boxes, confidences, class_ids, np.array(idxs).flatten())
+
+            if writer is None:
+                # the writer is created lazily, once the first frame has been processed
+                fourcc = cv2.VideoWriter_fourcc(*"mp4v")
+                if not fourcc:
+                    break
+                writer = cv2.VideoWriter(OUTPUT_PATH, fourcc, fps, (writer_width, writer_height), True)
+
+                # the first frame's timing is the per-frame estimate that is returned
+                elap = (end - start)
+                if total > 0:
+                    print(f"[INFO] single frame took {round(elap / 60, 2)} minutes")
+                    print(f"[INFO] total estimated time to finish: {(elap * total) / 60} minutes")
+
+            writer.write(frame)
+    finally:
+        if writer is not None:
+            writer.release()
+        vs.release()
+
+    if writer is None:
+        # Previously this surfaced as an AttributeError on `writer.release()`.
+        raise ValueError(f"no output was written for {video!r}: no frame could be read "
+                         f"or the video writer could not be set up")
+
+    return total, elap
@@ -0,0 +1,80 @@
+person
+bicycle
+car
+motorbike
+aeroplane
+bus
+train
+truck
+boat
+traffic light
+fire hydrant
+stop sign
+parking meter
+bench
+bird
+cat
+dog
+horse
+sheep
+cow
+elephant
+bear
+zebra
+giraffe
+backpack
+umbrella
+handbag
+tie
+suitcase
+frisbee
+skis
+snowboard
+sports ball
+kite
+baseball bat
+baseball glove
+skateboard
+surfboard
+tennis racket
+bottle
+wine glass
+cup
+fork
+knife
+spoon
+bowl
+banana
+apple
+sandwich
+orange
+broccoli
+carrot
+hot dog
+pizza
+donut
+cake
+chair
+sofa
+pottedplant
+bed
+diningtable
+toilet
+tvmonitor
+laptop
+mouse
+remote
+keyboard
+cell phone
+microwave
+oven
+toaster
+sink
+refrigerator
+book
+clock
+vase
+scissors
+teddy bear
+hair drier
+toothbrush
-Original file line number
+Diff line change
@@ @@ -0,0 +1,4 @@ @@
 +.idea
 +*.DS_Store
 +*.pyc
 +*.log