From 8d720cf546200407ef852fbdb48b7479d0bc0018 Mon Sep 17 00:00:00 2001
From: Hanry <54668181+hanryxu@users.noreply.github.com>
Date: Wed, 2 Nov 2022 20:07:09 -0700
Subject: [PATCH 1/3] add specific car detector

model from HybridNets
---
 vqpy/detector/spec_car.py | 139 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 139 insertions(+)
 create mode 100644 vqpy/detector/spec_car.py

diff --git a/vqpy/detector/spec_car.py b/vqpy/detector/spec_car.py
new file mode 100644
index 0000000..6e99866
--- /dev/null
+++ b/vqpy/detector/spec_car.py
@@ -0,0 +1,139 @@
+# References:
+# https://github.com/ibaiGorordo/ONNX-HybridNets-Multitask-Road-Detection
+# https://github.com/PINTO0309/PINTO_model_zoo/tree/main/276_HybridNets
+# using 384x512 model and anchors
+
+from vqpy.detector.utils import onnx_inference
+from vqpy.base.detector import DetectorBase
+from vqpy.utils.classes import COCO_CLASSES
+import numpy as np
+from typing import Dict, List
+import cv2
+from vqpy.detector.logger import register
+import os
+
+
+input_width = 512
+input_height = 384  # use hybridnets_384x512.onnx, hard code size for now
+output_names = ["regression", "classification", "segmentation"]
+anchor_name = "SpecCar_anchors.npy"
+conf_thres = 0.5
+iou_thres = 0.5
+
+
+class SpecCarDetector(DetectorBase):
+    """The detector for car detection"""
+
+    cls_names = COCO_CLASSES
+    output_fields = ["tlbr", "score", "class_id"]
+
+    def inference(self, img: np.ndarray) -> List[Dict]:
+        # TODO: allow loading multiple files from "model_path"
+        anchor_path = os.path.join(os.path.dirname(self.model_path), anchor_name)
+        processed_img = preprocess(img)
+        detections = onnx_inference(processed_img, self.model_path)
+        outputs = postprocess(detections, img.shape, anchor_path)
+        return outputs
+
+
+def preprocess(image):
+    input_img = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+    # Resize input image
+    input_img = cv2.resize(input_img, (input_width, input_height))
+
+    # Scale pixel values to [0, 1], then standardize each channel (mean/std)
+    mean = [0.485, 0.456, 0.406]
+    std = [0.229, 0.224, 0.225]
+    input_img = (input_img / 255.0 - mean) / std
+    input_img = input_img.transpose(2, 0, 1)
+    input_tensor = input_img[np.newaxis, :, :, :].astype(np.float32)
+
+    return input_tensor
+
+
+def postprocess(detections, image_size, anchor_path):
+    boxes = np.squeeze(detections[0])
+    scores = np.squeeze(detections[1])
+
+    anchors = np.squeeze(np.load(anchor_path))
+    transformed_boxes = transform_boxes(boxes, anchors)
+    filtered_boxes = transformed_boxes[scores > conf_thres]
+    filtered_scores = scores[scores > conf_thres]
+
+    filtered_boxes[:, [0, 2]] *= image_size[1] / input_width
+    filtered_boxes[:, [1, 3]] *= image_size[0] / input_height
+
+    filtered_boxes, filtered_scores = nms_fast(
+        filtered_boxes, filtered_scores, iou_thres
+    )
+
+    rets = []
+    for (tlbr, score) in zip(filtered_boxes, filtered_scores):
+        # todo: convert dict to named tuple
+        rets.append({"tlbr": tlbr, "score": score, "class_id": 2})  # class_id for car
+    return rets
+
+
+def transform_boxes(boxes, anchors):
+    y_centers_a = (anchors[:, 0] + anchors[:, 2]) / 2
+    x_centers_a = (anchors[:, 1] + anchors[:, 3]) / 2
+    ha = anchors[:, 2] - anchors[:, 0]
+    wa = anchors[:, 3] - anchors[:, 1]
+
+    w = np.exp(boxes[:, 3]) * wa
+    h = np.exp(boxes[:, 2]) * ha
+
+    y_centers = boxes[:, 0] * ha + y_centers_a
+    x_centers = boxes[:, 1] * wa + x_centers_a
+
+    ymin = y_centers - h / 2.0
+    xmin = x_centers - w / 2.0
+    ymax = y_centers + h / 2.0
+    xmax = x_centers + w / 2.0
+
+    return np.vstack((xmin, ymin, xmax, ymax)).T
+
+
+# Ref: https://python-ai-learn.com/2021/02/14/nmsfast/
+def nms_fast(bboxes, scores, iou_threshold=0.5):
+    areas = (bboxes[:, 2] - bboxes[:, 0] + 1) * (bboxes[:, 3] - bboxes[:, 1] + 1)
+
+    sort_index = np.argsort(scores)
+
+    i = -1
+    while len(sort_index) >= 1 - i:
+
+        max_scr_ind = sort_index[i]
+        ind_list = sort_index[:i]
+
+        iou = iou_np(
+            bboxes[max_scr_ind], bboxes[ind_list], areas[max_scr_ind], areas[ind_list]
+        )
+
+        del_index = np.where(iou >= iou_threshold)
+        sort_index = np.delete(sort_index, del_index)
+        i -= 1
+
+    bboxes = bboxes[sort_index]
+    scores = scores[sort_index]
+
+    return bboxes, scores
+
+
+# Ref: https://python-ai-learn.com/2021/02/14/nmsfast/
+def iou_np(box, boxes, area, areas):
+    x_min = np.maximum(box[0], boxes[:, 0])
+    y_min = np.maximum(box[1], boxes[:, 1])
+    x_max = np.minimum(box[2], boxes[:, 2])
+    y_max = np.minimum(box[3], boxes[:, 3])
+
+    w = np.maximum(0, x_max - x_min + 1)
+    h = np.maximum(0, y_max - y_min + 1)
+    intersect = w * h
+
+    iou_np = intersect / (area + areas - intersect)
+    return iou_np
+
+
+register("spec_car", SpecCarDetector, "SpecCar.onnx")
\ No newline at end of file

From 3876d2c0d0ea69ce50762004ad569cd254e2b26d Mon Sep 17 00:00:00 2001
From: Hanry <54668181+hanryxu@users.noreply.github.com>
Date: Wed, 2 Nov 2022 20:09:10 -0700
Subject: [PATCH 2/3] Add instructions to download onnx model for specific car
 detector

---
 examples/list_red_moving_vehicle/README.md | 2 ++
 vqpy/detector/spec_car.py                  | 4 ++--
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/examples/list_red_moving_vehicle/README.md b/examples/list_red_moving_vehicle/README.md
index 1ddd703..4626aa0 100644
--- a/examples/list_red_moving_vehicle/README.md
+++ b/examples/list_red_moving_vehicle/README.md
@@ -13,6 +13,8 @@ pip3 install -v -e .
 wget https://github.com/Megvii-BaseDetection/YOLOX/releases/download/0.1.1rc0/yolox_x.pth
 ```
 
+A pretrained ONNX model for the specific car detector can be found [here](https://github.com/PINTO0309/PINTO_model_zoo/tree/main/276_HybridNets); this example uses the `hybridnets_384x512` model and its anchors.
+
 Besides, please use below command to install other dependencies for this example.
 ```
 pip install webcolors ColorDetect opencv-python
diff --git a/vqpy/detector/spec_car.py b/vqpy/detector/spec_car.py
index 6e99866..e1b4fcf 100644
--- a/vqpy/detector/spec_car.py
+++ b/vqpy/detector/spec_car.py
@@ -16,7 +16,7 @@
 input_width = 512
 input_height = 384  # use hybridnets_384x512.onnx, hard code size for now
 output_names = ["regression", "classification", "segmentation"]
-anchor_name = "SpecCar_anchors.npy"
+anchor_name = "anchors_384x512.npy"
 conf_thres = 0.5
 iou_thres = 0.5
 
@@ -136,4 +136,4 @@ def iou_np(box, boxes, area, areas):
     return iou_np
 
 
-register("spec_car", SpecCarDetector, "SpecCar.onnx")
\ No newline at end of file
+register("spec_car", SpecCarDetector, "hybridnets_384x512.onnx")
\ No newline at end of file

From 3b456e3b85081042dc3f2b417e286ced01f28401 Mon Sep 17 00:00:00 2001
From: Hanry <54668181+hanryxu@users.noreply.github.com>
Date: Wed, 2 Nov 2022 20:18:08 -0700
Subject: [PATCH 3/3] Fix lint

---
 vqpy/detector/spec_car.py | 15 ++++++++++-----
 1 file changed, 10 insertions(+), 5 deletions(-)

diff --git a/vqpy/detector/spec_car.py b/vqpy/detector/spec_car.py
index e1b4fcf..1d83bc4 100644
--- a/vqpy/detector/spec_car.py
+++ b/vqpy/detector/spec_car.py
@@ -29,7 +29,8 @@ class SpecCarDetector(DetectorBase):
 
     def inference(self, img: np.ndarray) -> List[Dict]:
         # TODO: allow loading multiple files from "model_path"
-        anchor_path = os.path.join(os.path.dirname(self.model_path), anchor_name)
+        anchor_path = os.path.join(os.path.dirname(self.model_path),
+                                   anchor_name)
         processed_img = preprocess(img)
         detections = onnx_inference(processed_img, self.model_path)
         outputs = postprocess(detections, img.shape, anchor_path)
@@ -71,7 +72,9 @@ def postprocess(detections, image_size, anchor_path):
     rets = []
     for (tlbr, score) in zip(filtered_boxes, filtered_scores):
         # todo: convert dict to named tuple
-        rets.append({"tlbr": tlbr, "score": score, "class_id": 2})  # class_id for car
+        rets.append(
+            {"tlbr": tlbr, "score": score, "class_id": 2}   # class_id for car
+        )
     return rets
 
 
@@ -97,7 +100,8 @@ def transform_boxes(boxes, anchors):
 
 # Ref: https://python-ai-learn.com/2021/02/14/nmsfast/
 def nms_fast(bboxes, scores, iou_threshold=0.5):
-    areas = (bboxes[:, 2] - bboxes[:, 0] + 1) * (bboxes[:, 3] - bboxes[:, 1] + 1)
+    areas = (bboxes[:, 2] - bboxes[:, 0] + 1) * \
+        (bboxes[:, 3] - bboxes[:, 1] + 1)
 
     sort_index = np.argsort(scores)
 
@@ -108,7 +112,8 @@ def nms_fast(bboxes, scores, iou_threshold=0.5):
         ind_list = sort_index[:i]
 
         iou = iou_np(
-            bboxes[max_scr_ind], bboxes[ind_list], areas[max_scr_ind], areas[ind_list]
+            bboxes[max_scr_ind], bboxes[ind_list],
+            areas[max_scr_ind], areas[ind_list]
         )
 
         del_index = np.where(iou >= iou_threshold)
@@ -136,4 +141,4 @@ def iou_np(box, boxes, area, areas):
     return iou_np
 
 
-register("spec_car", SpecCarDetector, "hybridnets_384x512.onnx")
\ No newline at end of file
+register("spec_car", SpecCarDetector, "hybridnets_384x512.onnx")