CoderBotOrg
diff --git a/cnn_classifier.py b/cnn_classifier.py
Lines changed: 27 additions & 74 deletions
diff --git a/cnn_manager.py b/cnn_manager.py
Lines changed: 14 additions & 6 deletions
diff --git a/cnn_models/models.json b/cnn_models/models.json
Lines changed: 1 addition & 1 deletion
@@ -29,7 +29,7 @@
 logger = logging.getLogger(__name__)
 
 class CNNClassifier(object):
-    def __init__(self, model_file, label_file, input_layer="input", output_layer="final_result", input_height=128, input_width=128, input_mean=127.5, input_std=127.5):
+    def __init__(self, model_file, label_file):
         logger.info(model_file)
         self._interpreter = Interpreter(model_path=model_file)
         self._interpreter.set_num_threads(4)
@@ -40,73 +40,20 @@ def __init__(self, model_file, label_file, input_layer="input", output_layer="fi
         self._input_height=self._input_details[0]['shape'][1]
         self._input_width=self._input_details[0]['shape'][2]
         self._floating_model = (self._input_details[0]['dtype'] == np.float32)
-        #input_name = "import/" + input_layer
-        #output_name = "import/" + output_layer
-        #self._input_operation = self._graph.get_operation_by_name(input_name)
-        #self._output_operation = self._graph.get_operation_by_name(output_name)
-        #self._session = tf.compat.v1.Session(graph=self._graph)
-        #self._graph_norm = tf.Graph()
-        #with self._graph_norm.as_default():
-        #    image_mat = tf.compat.v1.placeholder(tf.float32, None, name="image_rgb_in")
-        #    float_caster = tf.cast(image_mat, tf.float32)
-        #    dims_expander = tf.expand_dims(float_caster, 0)
-        #    resized = tf.compat.v1.image.resize_bilinear(dims_expander, [input_height, input_width])
-        #    normalized = tf.divide(tf.subtract(resized, [input_mean]), [input_std], name="image_norm_out")
-        #    self._input_operation_norm = self._graph_norm.get_operation_by_name("image_rgb_in")
-        #    self._output_operation_norm = self._graph_norm.get_operation_by_name("image_norm_out")
-        #self._sess_norm = tf.Session(graph=self._graph_norm)
 
     def close(self):
         pass
-        #self._session.close()
-        #self._sess_norm.close()
-
-    #def load_graph(self, model_file):
-    #   graph = tf.Graph()
-    #    graph_def = tf.compat.v1.GraphDef()
-    #
-    #    with open(model_file, "rb") as f:
-    #        graph_def.ParseFromString(f.read())
-    #    with graph.as_default():
-    #        tf.import_graph_def(graph_def)
-    #
-    #    return graph
-    #
-    #def read_tensor_from_image_file(self, file_name, input_height=299, input_width=299, input_mean=0, input_std=255):
-    #    input_name = "file_reader"
-    #    output_name = "normalized"
-    #
-    #    file_reader = tf.read_file(file_name, input_name)
-    #
-    #    if file_name.endswith(".png"):
-    #        image_reader = tf.image.decode_png(file_reader, channels=3, name='png_reader')
-    #    elif file_name.endswith(".gif"):
-    #        image_reader = tf.squeeze(tf.image.decode_gif(file_reader, name='gif_reader'))
-    #    elif file_name.endswith(".bmp"):
-    #        image_reader = tf.image.decode_bmp(file_reader, name='bmp_reader')
-    #    else:
-    #        image_reader = tf.image.decode_jpeg(file_reader, channels=3, name='jpeg_reader')
-    #
-    #    float_caster = tf.cast(image_reader, tf.float32)
-    #    dims_expander = tf.expand_dims(float_caster, 0);
-    #    resized = tf.image.resize_bilinear(dims_expander, [self.input_height, self.input_width])
-    #    normalized = tf.divide(tf.subtract(resized, [input_mean]), [input_std])
-    #    sess = tf.Session()
-    #
-    #    result = sess.run(normalized)
-    #    sess.close()
-    #
-    #    return result
-    #
-    #def read_tensor_from_image_mat(self, image_mat, input_height=299, input_width=299, input_mean=0, input_std=255):
-    #    result = self._sess_norm.run(self._output_operation_norm.outputs[0], {self._input_operation_norm.outputs[0]: image_mat})
-    #    return result
-    def read_tensor_from_image_mat(self, image_mat, input_height=299, input_width=299, input_mean=0, input_std=255):
+
+    def read_tensor_from_image_file(self, file_name):
+        """Read the image at file_name with cv2.imread and convert it via read_tensor_from_image_mat."""
+        return self.read_tensor_from_image_mat(cv2.imread(file_name))
+
+    def read_tensor_from_image_mat(self, image_mat):
         frame_rgb = cv2.cvtColor(image_mat, cv2.COLOR_BGR2RGB)
         frame_resized = cv2.resize(frame_rgb, (self._input_width, self._input_height))
         input_data = np.expand_dims(frame_resized, axis=0)
 
-            # Normalize pixel values if using a floating model (i.e. if model is non-quantized)
+        # Normalize pixel values if using a floating model (i.e. if model is non-quantized)
         if self._floating_model:
             input_mean = 127.5
             input_std = 127.5
@@ -124,33 +71,49 @@ def classify_image(self,
                        image_file_or_mat,
                        top_results=3):
+        """Classify an image and return the best-scoring labels.
+
+        image_file_or_mat: a str is loaded with read_tensor_from_image_file;
+            anything else is passed to read_tensor_from_image_mat.
+        top_results: maximum number of pairs returned.
+
+        Returns a list of (label, percent) tuples, highest percent first,
+        containing only scores above the confidence threshold (0.4 for
+        float outputs, 128 for integer outputs).
+        """
         input_image = None
-        #if isinstance(image_file_or_mat, str):
-        #    t = self.read_tensor_from_image_file(file_name=image_file_or_mat)
-        #else:
-        input_image = self.read_tensor_from_image_mat(image_file_or_mat)
+        if isinstance(image_file_or_mat, str):
+            input_image = self.read_tensor_from_image_file(file_name=image_file_or_mat)
+        else:
+            input_image = self.read_tensor_from_image_mat(image_file_or_mat)
 
         self._interpreter.set_tensor(self._input_details[0]['index'], input_image)
         self._interpreter.invoke()
-        scores = self._interpreter.get_tensor(self._output_details[0]['index'])[0] # Bounding box coordinates of detected objects
-
+        scores = self._interpreter.get_tensor(self._output_details[0]['index'])[0]
+
+        confidence = 0.4
+        base = 1
+        # Quantized models emit integer scores (scaled here as 0..255); detect
+        # them by dtype, since a float score can also be integral (0.0 or 1.0).
+        if np.issubdtype(scores.dtype, np.integer):
+            confidence = 128
+            base = 256
         pairs = []
         for i in range(0, len(scores)):
-            if scores[i] > 128:
+            if scores[i] > confidence:
                 object_name = self._labels[i]
-                pairs.append((object_name, int(100*scores[i]/256)))
+                pairs.append((object_name, int(100*float(scores[i])/base)))
 
         pairs = sorted(pairs, key=lambda x: x[1], reverse=True)[:top_results]
-        logger.info(str(pairs))
         return pairs
 
     def detect_objects(self,
                        image_file_or_mat,
                        top_results=3):
         input_image = None
-        #if isinstance(image_file_or_mat, str):
-        #    t = self.read_tensor_from_image_file(file_name=image_file_or_mat)
-        #else:
-        input_image = self.read_tensor_from_image_mat(image_file_or_mat)
+        if isinstance(image_file_or_mat, str):
+            input_image = self.read_tensor_from_image_file(file_name=image_file_or_mat)
+        else:
+            input_image = self.read_tensor_from_image_mat(image_file_or_mat)
 
         self._interpreter.set_tensor(self._input_details[0]['index'], input_image)
         self._interpreter.invoke()
 
@@ -63,6 +63,27 @@ def get_models(self):
     def get_model_status(self, model_name):
         return self._models[model_name]
 
+    @classmethod
+    def get_model_info(cls, architecture):
+        """Split an architecture identifier into its "_"-separated fields.
+
+        For "<prefix>/<name>" the segment after the first "/" is split; a
+        bare "<name>" without "/" is split as-is instead of raising
+        IndexError.
+        """
+        # [:2][-1] selects segment 1 when a "/" is present, else segment 0.
+        return architecture.split("/")[:2][-1].split("_")
+
+    @classmethod
+    def get_model_shape(cls, architecture):
+        """Return (size, size), where size is field 3 of get_model_info().
+
+        Raises IndexError when there are fewer than four fields and
+        ValueError when field 3 is not an integer.
+        """
+        size = int(cls.get_model_info(architecture)[3])
+        return (size, size)
+
     def _save_model_meta(self):
         f = open(MODEL_METADATA, "w")
         json.dump(self._models, f)
@@ -92,7 +103,7 @@ def train_new_model(self,
         self._trainers[model_name] = trainer
 
     def save_model_status(self, model_name, architecture, status):
-        model_info = architecture.split("_")
+        model_info = self.get_model_info(architecture)
         self._models[model_name] = {"status": status, "image_height": model_info[3], "image_width": model_info[3], "output_layer": "final_result"}
         self._save_model_meta()
 
@@ -104,10 +115,7 @@ def load_model(self, model_name):
         model_info = self._models.get(model_name)
         if model_info:
             return CNNClassifier(model_file=MODEL_PATH + "/" + model_name + ".tflite",
-                                 label_file=MODEL_PATH + "/" + model_name + ".txt",
-                                 output_layer=model_info["output_layer"],
-                                 input_height=int(model_info["image_height"]),
-                                 input_width=int(model_info["image_width"]))
+                                 label_file=MODEL_PATH + "/" + model_name + ".txt")
         return None
     class TrainThread(threading.Thread):
 
@@ -127,7 +135,7 @@ def update_train_status(self, model_name, status):
             model["status"] = status
 
         def run(self):
-            self.trainer = CNNTrainer(self.manager, self.architecture)
+            self.trainer = CNNTrainer(self.manager, self.architecture, CNNManager.get_model_shape(self.architecture))
             self.manager.save_model_status(self.model_name, self.architecture, 0)
             image_dir = self.prepare_images()
             logging.info("retrain")
 
@@ -1 +1 @@
-{"test_model_1": {"status": 0, "image_height": "128", "image_width": "128", "output_layer": "final_result"}, "mobilenet_v1_1_0_quant": {"status": 100, "image_height": 120, "output_layer": "final_result", "image_width": 160}, "v3-large_224_1.0_uint8": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}, "object_detection": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}}
+{"test_model_1": {"image_width": "160", "output_layer": "final_result", "status": 1, "image_height": "160"}, "base_high_slow": {"image_width": 224, "status": 1.0, "image_height": 224, "output_layer": "final_result"}, "object_detect": {"image_width": 224, "status": 1.0, "image_height": 224, "output_layer": "final_result"}, "base_low_fast": {"image_width": 224, "status": 100, "image_height": 224, "output_layer": "final_result"}}
Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-{"test_model_1": {"status": 0, "image_height": "128", "image_width": "128", "output_layer": "final_result"}, "mobilenet_v1_1_0_quant": {"status": 100, "image_height": 120, "output_layer": "final_result", "image_width": 160}, "v3-large_224_1.0_uint8": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}, "object_detection": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}}`
	`1`	`+{"test_model_1": {"image_width": "160", "output_layer": "final_result", "status": 1, "image_height": "160"}, "base_high_slow": {"image_width": 224, "status": 1.0, "image_height": 224, "output_layer": "final_result"}, "object_detect": {"image_width": 224, "status": 1.0, "image_height": 224, "output_layer": "final_result"}, "base_low_fast": {"image_width": 224, "status": 100, "image_height": 224, "output_layer": "final_result"}}`