Spaces:

sam749
/

YuNet-face-detection

Running

App Files Files Community

sam749 committed on Mar 28, 2024

Commit

58ae671

verified ·

1 Parent(s): b03e0d7

added window sliding (#1)

Browse files

- added window sliding (ec7bf1ecd046d97945a306471d5a72eab96a1b0d)

Files changed (2) hide show

app.py +3 -106
image_resizer.py +114 -0

app.py CHANGED Viewed

@@ -1,111 +1,8 @@
-import os
-import cv2
-import cv2 as cv
-import numpy as np
 import gradio as gr
-from yunet import YuNet
-# Valid combinations of backends and targets
-backend_target_pairs = [
-    [cv.dnn.DNN_BACKEND_OPENCV, cv.dnn.DNN_TARGET_CPU],
-    [cv.dnn.DNN_BACKEND_CUDA, cv.dnn.DNN_TARGET_CUDA],
-    [cv.dnn.DNN_BACKEND_CUDA, cv.dnn.DNN_TARGET_CUDA_FP16],
-    [cv.dnn.DNN_BACKEND_TIMVX, cv.dnn.DNN_TARGET_NPU],
-    [cv.dnn.DNN_BACKEND_CANN, cv.dnn.DNN_TARGET_NPU],
-]
-class ImageResizer:
-    def __init__(
-        self,
-        modelPath,
-        input_size=(320, 320),
-        conf_threshold=0.6,
-        nms_threshold=0.3,
-        top_k=5000,
-        backend_id=0,
-        target_id=0,
-    ):
-        self.model = YuNet(
-            modelPath=modelPath,
-            inputSize=input_size,
-            confThreshold=conf_threshold,
-            nmsThreshold=nms_threshold,
-            topK=top_k,
-            backendId=backend_id,
-            targetId=target_id,
-        )
-    def detect(self, image, num_faces=None):
-        # If input is an image
-        if image is not None:
-            h, w, _ = image.shape
-            # Inference
-            self.model.setInputSize([w, h])
-            results = self.model.infer(image)
-            faces = results[:num_faces] if num_faces else results
-            bboxs = []
-            for face in faces:
-                bbox = face[0:4].astype(np.int32)  # x,y,w,h
-                x, y, w, h = bbox
-                # draw
-                cv2.rectangle(image, (x, y), (x + w, y + h), (0, 0, 255), 2)
-                bboxs.append(bbox)
-            return image, bboxs
-    def resize(self, image, target_size=512, above_head_ratio=0.5):
-        height, width, _c = image.shape
-        ar = width / height
-        # downscale the image
-        if not target_size:
-            target_size = 512
-        if ar > 1:
-            # Landscape
-            new_height = target_size
-            new_width = int(target_size * ar)
-        elif ar < 1:
-            # Portrait
-            new_width = target_size
-            new_height = int(target_size / ar)
-        else:
-            # Square
-            new_width = target_size
-            new_height = target_size
-        resized = cv2.resize(
-            image, (new_width, new_height), interpolation=cv2.INTER_LINEAR
-        )
-        # Perform object detection on the resized image
-        dt_image, bboxes = self.detect(resized.copy())
-        # crop around face
-        if len(bboxes) >= 1:
-            x, y, w, h = bboxes[0]
-        else:
-            x, y, w, h = 0, 0, target_size, target_size
-        # 20% of image height
-        above_head_max = int(target_size * above_head_ratio)
-        x_center = int((x + (x + w)) / 2)
-        y_center = int((y + (y + h)) / 2)
-        # Calculate cropping box
-        left = int(max(0, x_center - target_size // 2))
-        top = int(max(0, y_center - above_head_max))
-        right = min(left + target_size, resized.shape[1])
-        bottom = min(top + target_size, resized.shape[0])
-        cropped_image = resized[top:bottom, left:right]
-        return dt_image, cropped_image
-model_path = "face_detection_yunet_2023mar.onnx"
-image_resizer = ImageResizer(modelPath=model_path)
 def face_detector(input_image, target_size=512):

 import gradio as gr
+from image_resizer import ImageResizer
+MODEL_PATH = "face_detection_yunet_2023mar.onnx"  # model file name handed to ImageResizer as modelPath
+image_resizer = ImageResizer(modelPath=MODEL_PATH)  # module-level instance, built when this module is imported
 def face_detector(input_image, target_size=512):

image_resizer.py ADDED Viewed

	@@ -0,0 +1,114 @@

+import cv2
+import cv2 as cv
+import numpy as np
+from yunet import YuNet
+# Valid combinations of cv.dnn backends and targets, one [backend, target] pair per entry; not referenced by the code shown here.
+backend_target_pairs = [
+    [cv.dnn.DNN_BACKEND_OPENCV, cv.dnn.DNN_TARGET_CPU],
+    [cv.dnn.DNN_BACKEND_CUDA, cv.dnn.DNN_TARGET_CUDA],
+    [cv.dnn.DNN_BACKEND_CUDA, cv.dnn.DNN_TARGET_CUDA_FP16],
+    [cv.dnn.DNN_BACKEND_TIMVX, cv.dnn.DNN_TARGET_NPU],
+    [cv.dnn.DNN_BACKEND_CANN, cv.dnn.DNN_TARGET_NPU],
+]
+class ImageResizer:
+    def __init__(
+        self,
+        modelPath,
+        input_size=(320, 320),
+        conf_threshold=0.6,
+        nms_threshold=0.3,
+        top_k=5000,
+        backend_id=0,
+        target_id=0,
+    ):
+        self.model = YuNet(
+            modelPath=modelPath,
+            inputSize=input_size,
+            confThreshold=conf_threshold,
+            nmsThreshold=nms_threshold,
+            topK=top_k,
+            backendId=backend_id,
+            targetId=target_id,
+        )
+    def detect(self, image, num_faces=None):
+        # If input is an image
+        if image is not None:
+            h, w, _ = image.shape
+            # Inference
+            self.model.setInputSize([w, h])
+            results = self.model.infer(image)
+            faces = results[:num_faces] if num_faces else results
+            bboxs = []
+            for face in faces:
+                bbox = face[0:4].astype(np.int32)  # x,y,w,h
+                x, y, w, h = bbox
+                # draw
+                cv2.rectangle(image, (x, y), (x + w, y + h), (0, 0, 255), 2)
+                bboxs.append(bbox)
+            return image, bboxs
+    def resize(self, image, target_size=512, above_head_ratio=0.5):
+        height, width, _c = image.shape
+        ar = width / height
+        # downscale the image
+        if not target_size:
+            target_size = 512
+        if ar > 1:
+            # Landscape
+            new_height = target_size
+            new_width = int(target_size * ar)
+        elif ar < 1:
+            # Portrait
+            new_width = target_size
+            new_height = int(target_size / ar)
+        else:
+            # Square
+            new_width = target_size
+            new_height = target_size
+        resized = cv2.resize(
+            image, (new_width, new_height), interpolation=cv2.INTER_AREA
+        )
+        # Perform object detection on the resized image
+        dt_image, bboxes = self.detect(resized.copy())
+        # crop around face
+        if len(bboxes) >= 1:
+            x, y, w, h = bboxes[0]
+        else:
+            x, y, w, h = 0, 0, target_size, target_size
+        # 20% of image height
+        above_head_max = int(target_size * above_head_ratio)
+        x_center = int((x + (x + w)) / 2)
+        y_center = int((y + (y + h)) / 2)
+        # Calculate cropping box
+        top = int(max(0, y_center - above_head_max))
+        bottom = int(min(top + target_size, resized.shape[0]))
+        left = int(max(0, x_center - target_size // 2))
+        right = int(min(x_center + target_size // 2, resized.shape[1]))
+        # adjust width if necessory
+        _w = right - left
+        if _w != target_size:
+            dx = (
+                target_size - _w
+            )  # difference between the target size and the current width
+            nl = max(0, left - dx)
+            dr = dx - nl  # remaining adjustment needed for the right coordinate
+            left = nl
+            right += dr
+        cropped_image = resized[top:bottom, left:right]
+        return dt_image, cropped_image