Face_Recognition_TF/utils.py at main · PushpakBhoge/Face_Recognition_TF · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
from Inference.FaceDetector import FaceDetector
from Inference.FaceRecognizer import FaceRecognizer
from sklearn.svm import SVC
import numpy as np
import joblib
import json
import cv2
import os

class Detector:
    """Detect faces in an image, identify them and draw the results.

    Combines a ``FaceDetector`` (finds face boxes and crops them) with a
    ``FaceRecognizer`` (turns a face crop into an embedding and matches it).
    """

    def __init__(self):
        self.FaceDetect = FaceDetector()
        self.FaceRecog = FaceRecognizer()

    def get_people_names_svc(self, Model_dir, decode_json_dir, image, speed_up=True, downscale_by=4):
        """
        Identify every face in ``image`` with a saved SVC classifier.

        Arguments:
        Model_dir - path of the saved (joblib) SVC classifier file
        decode_json_dir - path of the JSON file that maps the classifier's
                            class ids (as strings) to person names
        image - image on which to predict
        speed_up - bool, forwarded to the face detector (whether to downscale
                    the image before detection)
        downscale_by - forwarded to the face detector as ``scale_factor``;
                    the bigger the number, the faster the results but the
                    lower the accuracy
        Output:
        results - a list with the following format
        [(confidence, person_name, box_co-ordinates),
        (confidence, person_name, box_co-ordinates), .........]

        confidence is always 100 (a placeholder, see below)
        box_co-ordinates = [xmin, ymin, xmax, ymax]

        """
        # Load the SVC classifier.
        # NOTE: joblib files are pickle-based, so loading one can execute
        # arbitrary code - only load classifier files from trusted sources.
        with open(Model_dir, "rb") as file:
            svc_clf = joblib.load(file)

        # Load the class-id -> person-name lookup table.
        with open(decode_json_dir, "r") as file:
            class_decode = json.load(file)

        # Get bounding boxes for faces.
        face_bboxes = self.FaceDetect.detect_faces(image, speed_up=speed_up,
                                                   scale_factor=downscale_by)

        # Get one face crop per bounding box.
        face_crops = self.FaceDetect.crop_faces(image, face_bboxes)

        # The classifier gives no score, so a constant is reported instead;
        # it only exists to keep the tuples compatible with draw_results().
        confidence = 100

        results = []
        for face_crop, box in zip(face_crops, face_bboxes):
            # Embedding of the cropped face.
            face_embd = self.FaceRecog.get_face_embedding(face_crop)
            # predict() returns a sequence of class ids; the first one is used.
            class_id = svc_clf.predict(face_embd)
            # JSON object keys are always strings, hence the str() conversion.
            person_name = class_decode[str(class_id[0])]
            results.append((confidence, person_name, box))
        return results

    def get_people_names(self, image, speed_up=True, downscale_by=4):
        """
        Identify every face in ``image`` with the recognizer's own matching.

        Arguments:
        image - numpy array of image
        speed_up - bool, forwarded to the face detector (whether to downscale
                    the image before detection)
        downscale_by - forwarded to the face detector as ``scale_factor``;
                    the bigger the number, the faster the results but the
                    lower the accuracy
        Output:
        results - a list with the following format
        [(distance, person_name, box_co-ordinates),
        (distance, person_name, box_co-ordinates), .........]

        box_co-ordinates = [xmin, ymin, xmax, ymax]

        """
        # Get bounding boxes for faces.
        face_bboxes = self.FaceDetect.detect_faces(image, speed_up=speed_up,
                                                   scale_factor=downscale_by)
        # Get one face crop per bounding box.
        face_crops = self.FaceDetect.crop_faces(image, face_bboxes)

        results = []
        for face_crop, box in zip(face_crops, face_bboxes):
            # Embedding of the cropped face.
            face_embd = self.FaceRecog.get_face_embedding(face_crop)
            # Whoisit() returns the matched name together with its distance.
            person_name, distance = self.FaceRecog.Whoisit(face_embd)
            results.append((distance, person_name, box))

        return results

    def draw_results(self, image, infer_results,
                     color=(255, 0, 0), box_thickness=None,
                     font_size=None, font_thickness=None,
                     offset=None):
        """
        Draw face boxes and labels on a copy of ``image``.

        Arguments:
        image - numpy array of image (RGB)
        infer_results - result list from .get_people_names() or
                        .get_people_names_svc()
        color - color of the bounding box as well as of the name
        box_thickness - thickness of the bounding box
        font_size - size of the font
        font_thickness - thickness of the font
        offset - distance between the top edge of the box and the name text
        (Every one of the above 4 options that is left as None is replaced by
        the value calculated by get_draw_settings() for this image)
        Output:
        A separate image instance (a numpy array) with the face boxes and
        person names drawn on it; the input image is not modified.

        """
        # Work on a copy so the caller's image stays untouched.
        img = image.copy()

        # Fill in only the settings the caller did not provide.
        if any(value is None for value in
               (offset, font_size, font_thickness, box_thickness)):
            settings = self.get_draw_settings(image.shape)
            if offset is None:
                offset = settings[0]
            if font_size is None:
                font_size = settings[1]
            if font_thickness is None:
                font_thickness = settings[2]
            if box_thickness is None:
                box_thickness = settings[3]

        for dist, name, box in infer_results:
            # Convert to plain ints so that float / numpy-scalar coordinates
            # are accepted by the cv2 drawing calls as pixel positions.
            x1, y1, x2, y2 = (int(coord) for coord in box)
            # Draw the bounding box.
            img = cv2.rectangle(img, (x1, y1), (x2, y2),
                                color=color, thickness=box_thickness)
            # Label: person name followed by the distance/confidence value.
            text = "{} {:.2f}".format(name, dist)
            # Put the label just above the top-left corner of the box.
            img = cv2.putText(img, text, (x1, y1 - offset),
                              cv2.FONT_HERSHEY_SIMPLEX, font_size,
                              color, font_thickness, cv2.LINE_AA)
        return img

    def get_draw_settings(self, image_shape):
        """
        Calculate drawing settings scaled to the size of the image.

        Arguments:
        image_shape - shape of the image; only its first entry is used, so
                      both (rows, cols, channels) and (rows, cols) shapes
                      are accepted
        Output:
        (offset, font_size, font_thickness, box_thickness) calculated with
        empirical relations derived from several hand-picked good settings.
        Both thickness values are at least 1.

        """
        # draw_results() passes ``image.shape``, whose first entry is the
        # number of rows (the image height).
        height = image_shape[0]
        offset = round(height / 150)
        font_size = round(height / 800, 2)
        # Never return a zero thickness for small images.
        font_thickness = max(1, round(height / 400))
        box_thickness = max(1, round(height / 300))
        return offset, font_size, font_thickness, box_thickness