Spaces:

vk888
/

yolox-pedestrian-detection-all-weather-augmentation

Running

App Files Files Community

vk commited on Mar 12

Commit

3b86909

1 Parent(s): db5fd2f

square input handling

Browse files

Files changed (1) hide show

yolox_onnx.py +36 -2

yolox_onnx.py CHANGED Viewed

@@ -4,6 +4,7 @@ import numpy as np
 import onnxruntime
 class YOLOX_ONNX:
     def __init__(self, model_path):
@@ -13,12 +14,28 @@ class YOLOX_ONNX:
         # print(self.model.get_outputs()[0].name)
         # print(self.image_size)
         self.labels_map=['pedestrian']
     def __preprocess_image(self, img, swap=(2, 0, 1)):
         padded_img = np.ones((self.image_size[0], self.image_size[1], 3), dtype=np.uint8) * 114
         r = min(self.image_size[0] / img.shape[0], self.image_size[1] / img.shape[1])
         resized_img = cv2.resize(img, (int(img.shape[1] * r), int(img.shape[0] * r)), interpolation=cv2.INTER_LINEAR).astype(np.uint8)
@@ -102,6 +119,13 @@ class YOLOX_ONNX:
         #valid_boxes_xyxy, valid_scores, valid_classes = self.__remove_duplicates(valid_boxes_xyxy, valid_scores, valid_classes)
         return valid_boxes_xyxy, valid_scores, valid_classes
@@ -136,7 +160,8 @@ class YOLOX_ONNX:
             #             lineType=cv2.LINE_AA)
         return img
-    def predict(self, image, score_thresh=0.5, iou_thresh=0.4):
         h,w = image.shape[:2]
         origin_img=np.copy(image)
         model_input = np.copy(image)
@@ -155,3 +180,12 @@ class YOLOX_ONNX:
         return d_boxes, d_scores, d_classes

 import onnxruntime
 class YOLOX_ONNX:
     def __init__(self, model_path):
         # print(self.model.get_outputs()[0].name)
         # print(self.image_size)
         self.labels_map=['pedestrian']
+        self.pad_to_square_flag=False
+    def pad_to_square(self,image):
+        height, width = image.shape[:2]
+        size = max(height, width)
+        delta_w = size - width
+        delta_h = size - height
+        self.top, self.bottom = delta_h // 2, delta_h - (delta_h // 2)
+        self.left, self.right = delta_w // 2, delta_w - (delta_w // 2)
+        print(self.top, self.bottom,self.left, self.right)
+        color = [114,114,114]  # padding
+        padded_image = cv2.copyMakeBorder(image, self.top, self.bottom, self.left, self.right, cv2.BORDER_CONSTANT, value=color)
+        return padded_image
     def __preprocess_image(self, img, swap=(2, 0, 1)):
+        if (img.shape[1]/img.shape[0]) > 1.2:
+            self.pad_to_square_flag=True
+            img = self.pad_to_square(img)  # training aspect ratio is 1:1
         padded_img = np.ones((self.image_size[0], self.image_size[1], 3), dtype=np.uint8) * 114
         r = min(self.image_size[0] / img.shape[0], self.image_size[1] / img.shape[1])
         resized_img = cv2.resize(img, (int(img.shape[1] * r), int(img.shape[0] * r)), interpolation=cv2.INTER_LINEAR).astype(np.uint8)
         #valid_boxes_xyxy, valid_scores, valid_classes = self.__remove_duplicates(valid_boxes_xyxy, valid_scores, valid_classes)
+        if self.pad_to_square_flag:
+            for i,offset in enumerate([self.left,self.top,self.right,self.bottom]):
+                valid_boxes_xyxy[:, i] = valid_boxes_xyxy[:,i] - offset #remove pad offsets from boundingbox(xmin,ymin,xmax,ymax)
+            self.pad_to_square_flag=False
         return valid_boxes_xyxy, valid_scores, valid_classes
             #             lineType=cv2.LINE_AA)
         return img
+    def predict(self, image, score_thresh=0.4, iou_thresh=0.4):
         h,w = image.shape[:2]
         origin_img=np.copy(image)
         model_input = np.copy(image)
         return d_boxes, d_scores, d_classes
+# if __name__=="__main__":
+#     from matplotlib import pyplot as plt
+#     path='test-images/test1.jpg'
+#     yolox_nano_onnx=YOLOX_ONNX('models/pedestrian-detection-best95.onnx')
+#     yolox_nano_onnx.predict(cv2.imread(path))
+#     plt.title('Predicted')
+#     plt.imshow(cv2.cvtColor(yolox_nano_onnx.output_img,cv2.COLOR_BGR2RGB))
+#     plt.show()