Merge pull request #8 from louis-she/add-prediction-threshold

pengbo0054 · web-flow · commit 3f62b17660c0 · 2018-07-13T23:40:16.000+08:00
Replace top-k prediction selection with a score threshold (Config.PREDICTION_THRESHOLD)
diff --git a/config.py.example b/config.py.example
@@ -32,6 +32,7 @@ class Config(object):
     ANCHOR_STRIDE = [8, 16, 32, 64, 128]
     ANCHOR_SIZE = [32, 64, 128, 256, 512]
     NEG_POS_ANCHOR_NUM_RATIO = 3
-    
-    # nms threshold
-    NMS_THRESHOLD = 0.3
+
+    # prediction
+    NMS_THRESHOLD = 0.3
+    PREDICTION_THRESHOLD = 6
diff --git a/detector.py b/detector.py
@@ -16,11 +16,11 @@
 
 class Detector(object):
 
-    def __init__(self, model, image_size=Config.IMAGE_SIZE, keep=200):
+    def __init__(self, model, image_size=Config.IMAGE_SIZE, threshold=Config.PREDICTION_THRESHOLD):
         checkpoint = torch.load(seek_model(model))
         self.model = Net().to(device)
         self.model.load_state_dict(checkpoint['state_dict'], strict=True)
-        self.keep = keep
+        self.threshold = threshold
         self.image_size = image_size
 
     def infer(self, image):
@@ -39,10 +39,11 @@ def infer(self, image):
 
         # get sorted indices by score
         diff = predictions[:, 5] - predictions[:, 4]
-        scores, indices = torch.sort(diff, descending=True)
-        # sort and slice predictions
-        predictions = predictions[indices][:self.keep]
-        scores = scores[:self.keep]
+        scores, sorted_indices = torch.sort(diff, descending=True)
+        valid_indices = scores > self.threshold
+        scores = scores[valid_indices]
+
+        predictions = predictions[sorted_indices][valid_indices]
         # generate anchors then sort and slice
         anchor_configs = (
             Config.ANCHOR_STRIDE,
@@ -52,7 +53,7 @@ def infer(self, image):
         anchors = change_coordinate(np.vstack(
             list(map(lambda x: np.array(x), generate_anchors(*anchor_configs)))
         ))
-        anchors = torch.tensor(anchors[indices][:self.keep]).float().to(device)
+        anchors = torch.tensor(anchors)[sorted_indices][valid_indices].float().to(device)
 
         x = (predictions[:, 0] * anchors[:, 2] + anchors[:, 0]) * scale[1]
         y = (predictions[:, 1] * anchors[:, 3] + anchors[:, 1]) * scale[0]
@@ -62,10 +63,11 @@ def infer(self, image):
         bounding_boxes = torch.stack((x, y, w, h), dim=1).cpu().data.numpy()
         bounding_boxes = change_coordinate_inv(bounding_boxes)
         scores = scores.cpu().data.numpy()
-        bboxes_scores = np.hstack((bounding_boxes,np.array([scores]).T))
-        # TODO: do non-maximum suppression for bounding_boxes here
+        bboxes_scores = np.hstack((bounding_boxes, np.array([scores]).T))
+
+        # nms
         keep = nms(bboxes_scores)
-        
+
         return bounding_boxes[keep]
 
 def main(args):
diff --git a/inference.ipynb b/inference.ipynb