mirror of https://github.com/mit-han-lab/tinyengine.git (synced 2025-10-23 01:38:59 +08:00)
initial commit
code_generator/detection_utils.py (Normal file, 86 lines added)
@@ -0,0 +1,86 @@
# ----------------------------------------------------------------------
# Project: TinyEngine
# Title: detection_utils.py
#
# Reference papers:
#  - MCUNet: Tiny Deep Learning on IoT Devices, NeurIPS 2020
#  - MCUNetV2: Memory-Efficient Patch-based Inference for Tiny Deep Learning, NeurIPS 2021
#  - MCUNetV3: On-Device Training Under 256KB Memory, arXiv:2206.15472
# Contact authors:
#  - Wei-Ming Chen, wmchen@mit.edu
#  - Wei-Chen Wang, wweichen@mit.edu
#  - Ji Lin, jilin@mit.edu
#  - Ligeng Zhu, ligeng@mit.edu
#  - Song Han, songhan@mit.edu
#
# Target ISA: ARMv7E-M
# ----------------------------------------------------------------------

import json
import math


class detectionUtils:
    """Generate the C post-processing code for YOLOv3-style detection outputs."""

    def __init__(self, layers, det_config_path) -> None:
        # Load the detection head configuration (per-output anchors, class count, source layer).
        with open(det_config_path, "r") as f:
            self.det_conf = json.loads(f.read())
        self.layers = layers

    def genPostProcessing(self):
        """Return a C source string: the anchor table plus the det_post_procesing() entry point."""
        output_string = ""
        output_ch = None
        num_class = None

        # Generate the anchor table: three {w, h} pairs per detection output.
        assert len(self.det_conf) == 3, "Only support 3 detection outputs."
        output_string += """const int anchors[3][3][2] = {\n"""
        for key in self.det_conf:
            output_config = self.det_conf[key]
            num_class = output_config["num_class"]
            assert output_config["name"] == "Yolo3Output", "Only support Yolo3Output now."
            output_string += "{"
            for i in range(len(output_config["anchors"]) // 2):
                output_string += (
                    "{" + f"{output_config['anchors'][i * 2]},{output_config['anchors'][i * 2 + 1]}" + "},"
                )
            output_string += "},\n"
        output_string += "};\n"

        # Generate the post-processing entry point that the application calls.
        output_string += """void det_post_procesing(int* box_cnt, det_box** ret_box, float threshold){\n"""
        tensorstring = " int8_t *input_data" + f"[{str(len(self.det_conf))}]" + "={"
        zerostring = " int8_t y_zero" + f"[{str(len(self.det_conf))}]" + "={"
        scalestring = " float y_scale" + f"[{str(len(self.det_conf))}]" + "={"
        top_available_address = 0
        for key in self.det_conf:
            output_config = self.det_conf[key]
            # Find the layer that generates this detection output.
            target_id = output_config["input_id"]
            for layer in self.layers:
                if str(layer.params["output_idx"]) == str(target_id):
                    print(f"Processing the output {layer.params['output_idx']} as a detection feature map.")
                    tensorstring += (
                        f"{layer._getBufferstr(layer.params['output_buf_add'], layer.params['output_buf_add_offset'])},"
                    )
                    zerostring += f'{layer.params["output_zero_point"]},'
                    scalestring += f'{layer.params["output_scale"]},'
                    output_ch = layer.params["output_c"]
                    # Track the end of the last detection output buffer; post-processing
                    # scratch space starts right after it.
                    top_available_address = max(
                        top_available_address, layer.params["output_buf_add_offset"] + layer.output_tensors[0].len()
                    )

        # Align the scratch offset up to a multiple of 4.
        top_available_address = math.ceil(float(top_available_address) / 4) * 4

        assert output_ch is not None
        tensorstring += "};\n"
        zerostring += "};\n"
        scalestring += "};\n"
        output_string += tensorstring + zerostring + scalestring
        output_string += (
            f" postprocessing(input_data, y_zero, y_scale, &buffer[{top_available_address}],"
            + f" {self.layers[0].params['input_w']}, "
            + f'{self.layers[0].params["input_h"]}, {output_ch}, {num_class}, '
            + f"anchors, {len(self.det_conf)}, "
            + "0.45f, threshold, box_cnt, ret_box);\n}\n"
        )

        return output_string
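
genPostProcessing() reads four fields from each entry of the JSON file passed as det_config_path: "name" (must be "Yolo3Output"), "num_class", "anchors" (a flat [w0, h0, w1, h1, w2, h2] list), and "input_id" (the output_idx of the layer that produces the feature map). Below is a minimal sketch of such a config, written as Python that dumps the JSON; the top-level key names, class count, anchor values, and input_id values are illustrative assumptions, not values taken from the repository.

    # Hypothetical det_config.json for three Yolo3Output heads.
    # Field names mirror what genPostProcessing() reads; all values are illustrative.
    import json

    example_det_conf = {
        "output0": {
            "name": "Yolo3Output",                  # only Yolo3Output is supported
            "num_class": 80,                        # number of object classes (assumed)
            "anchors": [10, 13, 16, 30, 33, 23],    # flat [w0, h0, w1, h1, w2, h2]
            "input_id": 60,                         # output_idx of the producing layer (assumed)
        },
        "output1": {
            "name": "Yolo3Output",
            "num_class": 80,
            "anchors": [30, 61, 62, 45, 59, 119],
            "input_id": 66,
        },
        "output2": {
            "name": "Yolo3Output",
            "num_class": 80,
            "anchors": [116, 90, 156, 198, 373, 326],
            "input_id": 72,
        },
    }

    with open("det_config.json", "w") as f:
        json.dump(example_det_conf, f, indent=2)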
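
Beyond the config, detectionUtils touches only a few attributes of each layer object: the params entries output_idx, output_buf_add, output_buf_add_offset, output_zero_point, output_scale, output_c, input_w, and input_h, plus output_tensors[0].len() and _getBufferstr(). Below is a minimal sketch of driving the class outside the full code generator with stand-in layers; FakeLayer, FakeTensor, every parameter value, the buffer-string format, and the output file name are hypothetical, and the import assumes code_generator is importable as a package.

    # Minimal sketch: driving detectionUtils with stand-in layer objects.
    # FakeTensor/FakeLayer and all values below are hypothetical; they mirror only
    # the attributes genPostProcessing() actually reads.
    from code_generator.detection_utils import detectionUtils  # assumes repo root on PYTHONPATH


    class FakeTensor:
        def __init__(self, num_bytes):
            self.num_bytes = num_bytes

        def len(self):
            return self.num_bytes


    class FakeLayer:
        def __init__(self, output_idx, offset, size, channels):
            self.params = {
                "output_idx": output_idx,
                "output_buf_add": "front",       # placeholder buffer tag (assumed)
                "output_buf_add_offset": offset,
                "output_zero_point": -128,
                "output_scale": 0.0039,
                "output_c": channels,            # 3 * (num_class + 5) for YOLOv3 heads
                "input_w": 160,                  # network input resolution (assumed)
                "input_h": 160,
            }
            self.output_tensors = [FakeTensor(size)]

        def _getBufferstr(self, buf_add, offset):
            # The real code generator emits a pointer into its unified buffer;
            # this stand-in fabricates a readable placeholder instead.
            return f"&buffer[{offset}]"


    layers = [
        FakeLayer(60, 0, 4800, 255),
        FakeLayer(66, 4800, 1200, 255),
        FakeLayer(72, 6000, 300, 255),
    ]
    det = detectionUtils(layers, "det_config.json")  # config from the sketch above
    with open("detectionUtils.h", "w") as f:         # output file name is illustrative
        f.write(det.genPostProcessing())

The returned string holds the const int anchors[3][3][2] table followed by det_post_procesing(), which gathers the three quantized feature maps with their zero points and scales and hands them to postprocessing() together with a fixed 0.45f parameter and the caller-supplied threshold.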