Skip to content

Commit 253af59

Browse files
committed
object detection
1 parent 99d544d commit 253af59

File tree

7 files changed

+90
-11
lines changed

7 files changed

+90
-11
lines changed

Diff for: camera.py

+21
Original file line numberDiff line numberDiff line change
@@ -373,3 +373,24 @@ def cnn_classify(self, model_name=None, top_results=3):
373373
def find_class(self):
374374
return self.cnn_classify(top_results=1)[0][0]
375375

376+
def cnn_detect_objects(self, model_name=None, top_results=3):
    """Run object detection on the current camera frame.

    Args:
        model_name: name of a CNN model to load through CNNManager;
            when None, the default classifier is used.
        top_results: maximum number of detections to return.

    Returns:
        The list of detections produced by the classifier's
        detect_objects(), or [("None", 100)] when the classifier is
        unavailable or detection fails (best-effort, mirroring
        cnn_classify()).
    """
    if model_name:
        # Lazily load and cache named models so repeated calls reuse them.
        classifier = self._cnn_classifiers.get(model_name)
        if classifier is None:
            classifier = CNNManager.get_instance().load_model(model_name)
            self._cnn_classifiers[model_name] = classifier
    else:
        classifier = self._cnn_classifier_default

    t0 = time.time()
    try:
        img = self.get_image()
        classes = classifier.detect_objects(img.mat(), top_results=top_results)
    except Exception:
        # Best-effort fallback: the original code assigned this fallback
        # and then re-raised, which made the assignment dead code and
        # skipped the fps log/return. Swallow and report a dummy result
        # instead, like cnn_classify() does.
        logging.warning("classifier not available")
        classes = [("None", 100)]
    logging.info("fps: %f", 1.0 / (time.time() - t0))
    return classes

Diff for: cnn_classifier.py

+42-10
Original file line numberDiff line numberDiff line change
@@ -129,23 +129,55 @@ def classify_image(self,
129129
#else:
130130
input_image = self.read_tensor_from_image_mat(image_file_or_mat)
131131

132-
logger.info("classify.0")
133132
self._interpreter.set_tensor(self._input_details[0]['index'], input_image)
134133
self._interpreter.invoke()
135-
logger.info("classify.1")
136134
scores = self._interpreter.get_tensor(self._output_details[0]['index'])[0] # Bounding box coordinates of detected objects
137-
#logger.info("classify.2")
138-
#classes = self._interpreter.get_tensor(self._output_details[1]['index'])[0] # Class index of detected objects
139-
#logger.info("classify.3")
140-
#scores = self._interpreter.get_tensor(self._output_details[2]['index'])[0] # Confidence of detected objects
141-
#logger.info("classify.4")
142135

143-
#pairs = [(classes[i], scores[i], boxes[i]) for i in range(0, len(classes))]
144136
pairs = []
145137
for i in range(0, len(scores)):
146-
if scores[i] > 0.5:
138+
if scores[i] > 128:
147139
object_name = self._labels[i]
148-
pairs.append((object_name, scores[i]))
140+
pairs.append((object_name, int(100*scores[i]/256)))
149141

142+
pairs = sorted(pairs, key=lambda x: x[1], reverse=True)[:top_results]
143+
logger.info(str(pairs))
144+
return pairs
145+
146+
def detect_objects(self,
                   image_file_or_mat,
                   top_results=3,
                   min_conf_threshold=0.1,
                   img_height=100,
                   img_width=100):
    """Run the TFLite detection model on an image.

    Args:
        image_file_or_mat: image matrix fed to
            read_tensor_from_image_mat (the file-name branch is
            commented out upstream, as in classify_image).
        top_results: maximum number of detections to return.
        min_conf_threshold: minimum confidence in (0, 1] for a
            detection to be kept (was hard-coded to 0.1).
        img_height: height of the coordinate space the normalized
            boxes are scaled to (was hard-coded to 100).
        img_width: width of the coordinate space the normalized
            boxes are scaled to (was hard-coded to 100).

    Returns:
        Up to top_results tuples
        (label, score_percent, (xmin, ymin, xmax, ymax)),
        sorted by descending score.
    """
    input_image = self.read_tensor_from_image_mat(image_file_or_mat)

    self._interpreter.set_tensor(self._input_details[0]['index'], input_image)
    self._interpreter.invoke()

    # Retrieve detection results: the three output tensors hold,
    # respectively, the bounding boxes, class indices and confidences
    # of the detected objects.
    boxes = self._interpreter.get_tensor(self._output_details[0]['index'])[0]
    classes = self._interpreter.get_tensor(self._output_details[1]['index'])[0]
    scores = self._interpreter.get_tensor(self._output_details[2]['index'])[0]

    pairs = []
    for i in range(len(scores)):
        # Keep detections above the confidence threshold; scores > 1.0
        # are invalid and are discarded.
        if min_conf_threshold < scores[i] <= 1.0:
            # The interpreter can return coordinates outside the image;
            # clamp them into range (lower bound 1, as in the original).
            ymin = int(max(1, boxes[i][0] * img_height))
            xmin = int(max(1, boxes[i][1] * img_width))
            ymax = int(min(img_height, boxes[i][2] * img_height))
            xmax = int(min(img_width, boxes[i][3] * img_width))

            object_name = self._labels[int(classes[i])]
            pairs.append((object_name, int(100 * scores[i]), (xmin, ymin, xmax, ymax)))

    pairs = sorted(pairs, key=lambda x: x[1], reverse=True)[:top_results]
    logger.info(str(pairs))
    return pairs

Diff for: cnn_models/models.json

+1-1
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
{"test_model_1": {"status": 0, "image_height": "128", "image_width": "128", "output_layer": "final_result"}, "mobilenet_v1_1_0_quant": {"status": 100, "image_height": 120, "output_layer": "final_result", "image_width": 160}}
1+
{"test_model_1": {"status": 0, "image_height": "128", "image_width": "128", "output_layer": "final_result"}, "mobilenet_v1_1_0_quant": {"status": 100, "image_height": 120, "output_layer": "final_result", "image_width": 160}, "v3-large_224_1.0_uint8": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}, "object_detection": {"status": 1.0, "image_height": 224, "output_layer": "final_result", "image_width": 224}}

Diff for: static/js/blockly/blocks.js

+23
Original file line numberDiff line numberDiff line change
@@ -759,6 +759,29 @@ Blockly.Python['coderbot_adv_cnn_classify'] = function(block) {
759759
return [class_scores, Blockly.Python.ORDER_ATOMIC];
760760
};
761761

762+
Blockly.Blocks['coderbot_adv_cnn_detect_objects'] = {
  /**
   * Block for the cnn_detect_objects function: lets the user pick a CNN
   * model from a dropdown and outputs the detections as an Array.
   * (Original comment said "find_class" — copy-paste from the sibling block.)
   * @this Blockly.Block
   */
  init: function() {
    // NOTE(review): help URL and tooltip reuse the LOGIC_BOOLEAN messages,
    // apparently copy-pasted from another block definition — confirm intended.
    this.setHelpUrl(Blockly.Msg.LOGIC_BOOLEAN_HELPURL);
    this.setColour(250);
    this.appendDummyInput()
        .appendField(Blockly.Msg.CODERBOT_SENSOR_FINDOBJECT)
        .appendField(new Blockly.FieldDropdown(CODERBOT_CNN_MODEL_LIST), 'MODEL');
    this.setInputsInline(true);
    this.setOutput(true, ['Array']);
    this.setTooltip(Blockly.Msg.LOGIC_BOOLEAN_TOOLTIP);
  }
};

// Python code generator: emits a call to the camera's cnn_detect_objects()
// with the selected model name.
Blockly.Python['coderbot_adv_cnn_detect_objects'] = function(block) {
  var model = block.getFieldValue('MODEL');
  var class_scores = 'get_cam().cnn_detect_objects("'+ model +'")';
  return [class_scores, Blockly.Python.ORDER_ATOMIC];
};
784+
762785
Blockly.Blocks['coderbot_event_generator'] = {
763786
init: function() {
764787
this.appendDummyInput()

Diff for: static/js/blockly/bot_en.js

+1
Original file line numberDiff line numberDiff line change
@@ -52,6 +52,7 @@ Blockly.Msg.CODERBOT_SENSOR_FINDFACE_SIZE = "size";
5252
Blockly.Msg.CODERBOT_SENSOR_FINDFACE_ALL = "x, y, size (as list)";
5353
Blockly.Msg.CODERBOT_SENSOR_FINDLOGO = "find logo";
5454
Blockly.Msg.CODERBOT_SENSOR_FINDCLASS = "find class";
55+
Blockly.Msg.CODERBOT_SENSOR_FINDOBJECT = "detect objects";
5556
Blockly.Msg.CODERBOT_SENSOR_AVERAGE = "get image average";
5657
Blockly.Msg.CODERBOT_SENSOR_AVERAGE_HUE = "Hue";
5758
Blockly.Msg.CODERBOT_SENSOR_AVERAGE_SATURATION = "Saturation";

Diff for: static/js/blockly/bot_it.js

+1
Original file line numberDiff line numberDiff line change
@@ -52,6 +52,7 @@ Blockly.Msg.CODERBOT_SENSOR_FINDFACE_SIZE = "dimensione";
5252
Blockly.Msg.CODERBOT_SENSOR_FINDFACE_ALL = "x, y, dimensione (come lista)";
5353
Blockly.Msg.CODERBOT_SENSOR_FINDLOGO = "trova logo";
5454
Blockly.Msg.CODERBOT_SENSOR_FINDCLASS = "trova classe";
55+
Blockly.Msg.CODERBOT_SENSOR_FINDOBJECT = "trova oggetti";
5556
Blockly.Msg.CODERBOT_SENSOR_AVERAGE = "valore medio immagine";
5657
Blockly.Msg.CODERBOT_SENSOR_AVERAGE_HUE = "Tinta";
5758
Blockly.Msg.CODERBOT_SENSOR_AVERAGE_SATURATION = "Saturazione";

Diff for: templates/blocks_adv.xml

+1
Original file line numberDiff line numberDiff line change
@@ -303,6 +303,7 @@
303303
<block type="coderbot_adv_findARCode"></block>
304304
<block type="coderbot_adv_find_class"></block>
305305
<block type="coderbot_adv_cnn_classify"></block>
306+
<block type="coderbot_adv_cnn_detect_objects"></block>
306307
<block type="coderbot_sonar_get_distance"></block>
307308
</category>{%endif%}
308309
<category name="{% trans %}Sound{% endtrans %}" colour="220">

0 commit comments

Comments
 (0)