From f4d18a70c02e9592b1c6f9a1a872fb60732c9398 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 09:43:18 +0000
Subject: [PATCH 01/41] batched detection

---
 deepface/modules/detection.py | 309 ++++++++++++++++++----------------
 1 file changed, 163 insertions(+), 146 deletions(-)

diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index c31a0263..aefd3ec6 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -19,7 +19,7 @@
 
 
 def extract_faces(
-    img_path: Union[str, np.ndarray, IO[bytes]],
+    img_path: Union[List[Union[str, np.ndarray, IO[bytes]]], str, np.ndarray, IO[bytes]],
     detector_backend: str = "opencv",
     enforce_detection: bool = True,
     align: bool = True,
@@ -31,10 +31,10 @@ def extract_faces(
     max_faces: Optional[int] = None,
 ) -> List[Dict[str, Any]]:
     """
-    Extract faces from a given image
+    Extract faces from a given image or list of images
 
     Args:
-        img_path (str or np.ndarray or IO[bytes]): Path to the first image. Accepts exact image path
+        img_paths (List[str or np.ndarray or IO[bytes]] or str or np.ndarray or IO[bytes]): Path(s) to the image(s). Accepts exact image path
             as a string, numpy array (BGR), a file object that supports at least `.read` and is
             opened in binary mode, or base64 encoded images.
 
@@ -80,135 +80,140 @@ def extract_faces(
             just available in the result only if anti_spoofing is set to True in input arguments.
     """
 
-    resp_objs = []
+    if not isinstance(img_path, list):
+        img_path = [img_path]
 
-    # img might be path, base64 or numpy array. Convert it to numpy whatever it is.
-    img, img_name = image_utils.load_image(img_path)
+    all_images = []
+    img_names = []
 
-    if img is None:
-        raise ValueError(f"Exception while loading {img_name}")
+    for single_img_path in img_path:
+        # img might be path, base64 or numpy array. Convert it to numpy whatever it is.
+        img, img_name = image_utils.load_image(single_img_path)
 
-    height, width, _ = img.shape
+        if img is None:
+            raise ValueError(f"Exception while loading {img_name}")
 
-    base_region = FacialAreaRegion(x=0, y=0, w=width, h=height, confidence=0)
+        all_images.append(img)
+        img_names.append(img_name)
 
-    if detector_backend == "skip":
-        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
-    else:
-        face_objs = detect_faces(
-            detector_backend=detector_backend,
-            img=img,
-            align=align,
-            expand_percentage=expand_percentage,
-            max_faces=max_faces,
-        )
+    # Run detect_faces for all images at once
+    all_face_objs = detect_faces(
+        detector_backend=detector_backend,
+        img=all_images,
+        align=align,
+        expand_percentage=expand_percentage,
+        max_faces=max_faces,
+    )
 
-    # in case of no face found
-    if len(face_objs) == 0 and enforce_detection is True:
-        if img_name is not None:
-            raise ValueError(
-                f"Face could not be detected in {img_name}."
-                "Please confirm that the picture is a face photo "
-                "or consider to set enforce_detection param to False."
-            )
-        else:
-            raise ValueError(
-                "Face could not be detected. Please confirm that the picture is a face photo "
-                "or consider to set enforce_detection param to False."
-            )
+    if len(all_images) == 1:
+        all_face_objs = [all_face_objs]
 
-    if len(face_objs) == 0 and enforce_detection is False:
-        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
-
-    for face_obj in face_objs:
-        current_img = face_obj.img
-        current_region = face_obj.facial_area
-
-        if current_img.shape[0] == 0 or current_img.shape[1] == 0:
-            continue
-
-        if grayscale is True:
-            logger.warn("Parameter grayscale is deprecated. Use color_face instead.")
-            current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)
-        else:
-            if color_face == "rgb":
-                current_img = current_img[:, :, ::-1]
-            elif color_face == "bgr":
-                pass  # image is in BGR
-            elif color_face == "gray":
-                current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)
+    all_resp_objs = []
+
+    for img, img_name, face_objs in zip(all_images, img_names, all_face_objs):
+        height, width, _ = img.shape
+
+        if len(face_objs) == 0 and enforce_detection is True:
+            if img_name is not None:
+                raise ValueError(
+                    f"Face could not be detected in {img_name}."
+                    "Please confirm that the picture is a face photo "
+                    "or consider to set enforce_detection param to False."
+                )
             else:
-                raise ValueError(f"The color_face can be rgb, bgr or gray, but it is {color_face}.")
-
-        if normalize_face:
-            current_img = current_img / 255  # normalize input in [0, 1]
-
-        # cast to int for flask, and do final checks for borders
-        x = max(0, int(current_region.x))
-        y = max(0, int(current_region.y))
-        w = min(width - x - 1, int(current_region.w))
-        h = min(height - y - 1, int(current_region.h))
-
-        facial_area = {
-            "x": x,
-            "y": y,
-            "w": w,
-            "h": h,
-            "left_eye": current_region.left_eye,
-            "right_eye": current_region.right_eye,
-        }
-
-        # optional nose, mouth_left and mouth_right fields are coming just for retinaface
-        if current_region.nose is not None:
-            facial_area["nose"] = current_region.nose
-        if current_region.mouth_left is not None:
-            facial_area["mouth_left"] = current_region.mouth_left
-        if current_region.mouth_right is not None:
-            facial_area["mouth_right"] = current_region.mouth_right
-
-        resp_obj = {
-            "face": current_img,
-            "facial_area": facial_area,
-            "confidence": round(float(current_region.confidence or 0), 2),
-        }
-
-        if anti_spoofing is True:
-            antispoof_model = modeling.build_model(task="spoofing", model_name="Fasnet")
-            is_real, antispoof_score = antispoof_model.analyze(img=img, facial_area=(x, y, w, h))
-            resp_obj["is_real"] = is_real
-            resp_obj["antispoof_score"] = antispoof_score
-
-        resp_objs.append(resp_obj)
-
-    if len(resp_objs) == 0 and enforce_detection == True:
-        raise ValueError(
-            f"Exception while extracting faces from {img_name}."
-            "Consider to set enforce_detection arg to False."
-        )
+                raise ValueError(
+                    "Face could not be detected. Please confirm that the picture is a face photo "
+                    "or consider to set enforce_detection param to False."
+                )
+
+        if len(face_objs) == 0 and enforce_detection is False:
+            base_region = FacialAreaRegion(x=0, y=0, w=width, h=height, confidence=0)
+            face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
 
-    return resp_objs
+        for face_obj in face_objs:
+            current_img = face_obj.img
+            current_region = face_obj.facial_area
+
+            if current_img.shape[0] == 0 or current_img.shape[1] == 0:
+                continue
+
+            if grayscale is True:
+                logger.warn("Parameter grayscale is deprecated. Use color_face instead.")
+                current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)
+            else:
+                if color_face == "rgb":
+                    current_img = current_img[:, :, ::-1]
+                elif color_face == "bgr":
+                    pass  # image is in BGR
+                elif color_face == "gray":
+                    current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)
+                else:
+                    raise ValueError(f"The color_face can be rgb, bgr or gray, but it is {color_face}.")
+
+            if normalize_face:
+                current_img = current_img / 255  # normalize input in [0, 1]
+
+            # cast to int for flask, and do final checks for borders
+            x = max(0, int(current_region.x))
+            y = max(0, int(current_region.y))
+            w = min(width - x - 1, int(current_region.w))
+            h = min(height - y - 1, int(current_region.h))
+
+            facial_area = {
+                "x": x,
+                "y": y,
+                "w": w,
+                "h": h,
+                "left_eye": current_region.left_eye,
+                "right_eye": current_region.right_eye,
+            }
+
+            # optional nose, mouth_left and mouth_right fields are coming just for retinaface
+            if current_region.nose is not None:
+                facial_area["nose"] = current_region.nose
+            if current_region.mouth_left is not None:
+                facial_area["mouth_left"] = current_region.mouth_left
+            if current_region.mouth_right is not None:
+                facial_area["mouth_right"] = current_region.mouth_right
+
+            resp_obj = {
+                "face": current_img,
+                "facial_area": facial_area,
+                "confidence": round(float(current_region.confidence or 0), 2),
+            }
+
+            if anti_spoofing is True:
+                antispoof_model = modeling.build_model(task="spoofing", model_name="Fasnet")
+                is_real, antispoof_score = antispoof_model.analyze(img=img, facial_area=(x, y, w, h))
+                resp_obj["is_real"] = is_real
+                resp_obj["antispoof_score"] = antispoof_score
+
+            all_resp_objs.append(resp_obj)
+
+    return all_resp_objs
 
 
 def detect_faces(
     detector_backend: str,
-    img: np.ndarray,
+    img: Union[np.ndarray, List[np.ndarray]],
     align: bool = True,
     expand_percentage: int = 0,
     max_faces: Optional[int] = None,
-) -> List[DetectedFace]:
+) -> Union[List[List[DetectedFace]], List[DetectedFace]]:
     """
-    Detect face(s) from a given image
+    Detect face(s) from a given image or list of images
     Args:
         detector_backend (str): detector name
 
-        img (np.ndarray): pre-loaded image
+        img (np.ndarray or List[np.ndarray]): pre-loaded image or list of images
 
         align (bool): enable or disable alignment after detection
 
         expand_percentage (int): expand detected facial area with a percentage (default is 0).
 
     Returns:
-        results (List[DetectedFace]): A list of DetectedFace objects
+        results (Union[List[List[DetectedFace]], List[DetectedFace]]): 
+        A list of lists of DetectedFace objects or a list of DetectedFace objects
             where each object contains:
 
         - img (np.ndarray): The detected face as a NumPy array.
@@ -219,53 +224,65 @@ def detect_faces(
 
         - confidence (float): The confidence score associated with the detected face.
     """
-    height, width, _ = img.shape
+    if not isinstance(img, list):
+        img = [img]
+
     face_detector: Detector = modeling.build_model(
         task="face_detector", model_name=detector_backend
     )
+    all_detected_faces = []
 
-    # validate expand percentage score
-    if expand_percentage < 0:
-        logger.warn(
-            f"Expand percentage cannot be negative but you set it to {expand_percentage}."
-            "Overwritten it to 0."
-        )
-        expand_percentage = 0
-
-    # If faces are close to the upper boundary, alignment move them outside
-    # Add a black border around an image to avoid this.
-    height_border = int(0.5 * height)
-    width_border = int(0.5 * width)
-    if align is True:
-        img = cv2.copyMakeBorder(
-            img,
-            height_border,
-            height_border,
-            width_border,
-            width_border,
-            cv2.BORDER_CONSTANT,
-            value=[0, 0, 0],  # Color of the border (black)
-        )
+    for single_img in img:
+        height, width, _ = single_img.shape
 
-    # find facial areas of given image
-    facial_areas = face_detector.detect_faces(img)
+        # validate expand percentage score
+        if expand_percentage < 0:
+            logger.warn(
+                f"Expand percentage cannot be negative but you set it to {expand_percentage}."
+                "Overwritten it to 0."
+            )
+            expand_percentage = 0
+
+        # If faces are close to the upper boundary, alignment move them outside
+        # Add a black border around an image to avoid this.
+        height_border = int(0.5 * height)
+        width_border = int(0.5 * width)
+        if align is True:
+            single_img = cv2.copyMakeBorder(
+                single_img,
+                height_border,
+                height_border,
+                width_border,
+                width_border,
+                cv2.BORDER_CONSTANT,
+                value=[0, 0, 0],  # Color of the border (black)
+            )
 
-    if max_faces is not None and max_faces < len(facial_areas):
-        facial_areas = nlargest(
-            max_faces, facial_areas, key=lambda facial_area: facial_area.w * facial_area.h
-        )
+        # find facial areas of given image
+        facial_areas = face_detector.detect_faces(single_img)
 
-    return [
-        extract_face(
-            facial_area=facial_area,
-            img=img,
-            align=align,
-            expand_percentage=expand_percentage,
-            width_border=width_border,
-            height_border=height_border,
-        )
-        for facial_area in facial_areas
-    ]
+        if max_faces is not None and max_faces < len(facial_areas):
+            facial_areas = nlargest(
+                max_faces, facial_areas, key=lambda facial_area: facial_area.w * facial_area.h
+            )
+
+        detected_faces = [
+            extract_face(
+                facial_area=facial_area,
+                img=single_img,
+                align=align,
+                expand_percentage=expand_percentage,
+                width_border=width_border,
+                height_border=height_border,
+            )
+            for facial_area in facial_areas
+        ]
+
+        all_detected_faces.append(detected_faces)
+
+    if len(all_detected_faces) == 1:
+        return all_detected_faces[0]
+    return all_detected_faces
 
 
 def extract_face(

From 0ad7c57abf928411ad08d36c0ba7bc1f266cbb82 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 10:04:20 +0000
Subject: [PATCH 02/41] deepFace batch detection; typing

---
 deepface/DeepFace.py          | 12 ++++++------
 deepface/modules/detection.py |  4 ++--
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/deepface/DeepFace.py b/deepface/DeepFace.py
index 3abe6db9..eeacbe7a 100644
--- a/deepface/DeepFace.py
+++ b/deepface/DeepFace.py
@@ -2,7 +2,7 @@
 import os
 import warnings
 import logging
-from typing import Any, Dict, IO, List, Union, Optional
+from typing import Any, Dict, IO, List, Union, Optional, Sequence
 
 # this has to be set before importing tensorflow
 os.environ["TF_USE_LEGACY_KERAS"] = "1"
@@ -510,7 +510,7 @@ def stream(
 
 
 def extract_faces(
-    img_path: Union[str, np.ndarray, IO[bytes]],
+    img_path: Union[str, np.ndarray, IO[bytes], Sequence[Union[str, np.ndarray, IO[bytes]]]],
     detector_backend: str = "opencv",
     enforce_detection: bool = True,
     align: bool = True,
@@ -521,12 +521,12 @@ def extract_faces(
     anti_spoofing: bool = False,
 ) -> List[Dict[str, Any]]:
     """
-    Extract faces from a given image
+    Extract faces from a given image or sequence of images.
 
     Args:
-        img_path (str or np.ndarray or IO[bytes]): Path to the first image. Accepts exact image path
-            as a string, numpy array (BGR), a file object that supports at least `.read` and is
-            opened in binary mode, or base64 encoded images.
+        img_path (Union[str, np.ndarray, IO[bytes], Sequence[Union[str, np.ndarray, IO[bytes]]]]): 
+            Path(s) to the image(s). Accepts a string path, a numpy array (BGR), a file object 
+            that supports at least `.read` and is opened in binary mode, or base64 encoded images.
 
         detector_backend (string): face detector backend. Options: 'opencv', 'retinaface',
             'mtcnn', 'ssd', 'dlib', 'mediapipe', 'yolov8', 'yolov11n', 'yolov11s', 'yolov11m',
diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index aefd3ec6..21d09f56 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import Any, Dict, IO, List, Tuple, Union, Optional
+from typing import Any, Dict, IO, List, Tuple, Union, Optional, Sequence
 
 # 3rd part dependencies
 from heapq import nlargest
@@ -19,7 +19,7 @@
 
 
 def extract_faces(
-    img_path: Union[List[Union[str, np.ndarray, IO[bytes]]], str, np.ndarray, IO[bytes]],
+    img_path: Union[Sequence[Union[str, np.ndarray, IO[bytes]]], str, np.ndarray, IO[bytes]],
     detector_backend: str = "opencv",
     enforce_detection: bool = True,
     align: bool = True,

From b38e95c4078b67d2d669b5809889f5faa3c8ae8b Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 15:47:24 +0000
Subject: [PATCH 03/41] test batch extract faces

---
 tests/test_extract_faces.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 262d22d1..89f025d7 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -79,6 +79,20 @@ def test_different_detectors():
         logger.info(f"✅ extract_faces for {detector} backend test is done")
 
 
+@pytest.mark.parametrize("detector_backend", [
+    # "YOLO",
+    "opencv",
+])
+def test_batch_extract_faces(detector_backend):
+    img_paths = [
+        "dataset/img2.jpg",
+        "dataset/img3.jpg",
+        "dataset/img11.jpg",
+    ]
+    img_objs = DeepFace.extract_faces(img_path=img_paths, detector_backend=detector_backend)
+    assert len(img_objs) == 3
+
+
 def test_backends_for_enforced_detection_with_non_facial_inputs():
     black_img = np.zeros([224, 224, 3])
     for detector in detectors:

From 737ee793dcb7c204dc62c2a8e6de5cb7f20dc01d Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 15:47:39 +0000
Subject: [PATCH 04/41] chagne detector interface

---
 deepface/models/Detector.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/deepface/models/Detector.py b/deepface/models/Detector.py
index 004f0d37..70675cd1 100644
--- a/deepface/models/Detector.py
+++ b/deepface/models/Detector.py
@@ -1,4 +1,4 @@
-from typing import List, Tuple, Optional
+from typing import List, Tuple, Optional, Union
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
 import numpy as np
@@ -9,15 +9,19 @@
 # pylint: disable=unnecessary-pass, too-few-public-methods, too-many-instance-attributes
 class Detector(ABC):
     @abstractmethod
-    def detect_faces(self, img: np.ndarray) -> List["FacialAreaRegion"]:
+    def detect_faces(
+        self, 
+        imgs: Union[np.ndarray, List[np.ndarray]]
+    ) -> Union[List["FacialAreaRegion"], List[List["FacialAreaRegion"]]]:
         """
-        Interface for detect and align face
+        Interface for detect and align faces in a batch of images
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
+            A list or a list of lists of FacialAreaRegion objects
                 where each object contains:
 
             - facial_area (FacialAreaRegion): The facial area region represented

From b2d6178bedf1f9201b8a3de547af4f0edef4e448 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 15:49:35 +0000
Subject: [PATCH 05/41] opencv pseudo batching

---
 deepface/models/face_detection/OpenCv.py | 85 ++++++++++++------------
 1 file changed, 43 insertions(+), 42 deletions(-)

diff --git a/deepface/models/face_detection/OpenCv.py b/deepface/models/face_detection/OpenCv.py
index 4abb6daa..ac376b8d 100644
--- a/deepface/models/face_detection/OpenCv.py
+++ b/deepface/models/face_detection/OpenCv.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List
+from typing import Any, List, Union
 
 # 3rd party dependencies
 import cv2
@@ -29,55 +29,56 @@ def build_model(self):
         detector["eye_detector"] = self.__build_cascade("haarcascade_eye")
         return detector
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, imgs: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with opencv
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        resp = []
-
-        detected_face = None
-
-        faces = []
-        try:
-            # faces = detector["face_detector"].detectMultiScale(img, 1.3, 5)
-
-            # note that, by design, opencv's haarcascade scores are >0 but not capped at 1
-            faces, _, scores = self.model["face_detector"].detectMultiScale3(
-                img, 1.1, 10, outputRejectLevels=True
-            )
-        except:
-            pass
-
-        if len(faces) > 0:
-            for (x, y, w, h), confidence in zip(faces, scores):
-                detected_face = img[int(y) : int(y + h), int(x) : int(x + w)]
-                left_eye, right_eye = self.find_eyes(img=detected_face)
-
-                # eyes found in the detected face instead image itself
-                # detected face's coordinates should be added
-                if left_eye is not None:
-                    left_eye = (int(x + left_eye[0]), int(y + left_eye[1]))
-                if right_eye is not None:
-                    right_eye = (int(x + right_eye[0]), int(y + right_eye[1]))
-
-                facial_area = FacialAreaRegion(
-                    x=x,
-                    y=y,
-                    w=w,
-                    h=h,
-                    left_eye=left_eye,
-                    right_eye=right_eye,
-                    confidence=(100 - confidence) / 100,
+        if isinstance(imgs, np.ndarray):
+            imgs = [imgs]
+
+        batch_results = []
+
+        for img in imgs:
+            resp = []
+            detected_face = None
+            faces = []
+            try:
+                faces, _, scores = self.model["face_detector"].detectMultiScale3(
+                    img, 1.1, 10, outputRejectLevels=True
                 )
-                resp.append(facial_area)
-
-        return resp
+            except:
+                pass
+
+            if len(faces) > 0:
+                for (x, y, w, h), confidence in zip(faces, scores):
+                    detected_face = img[int(y):int(y + h), int(x):int(x + w)]
+                    left_eye, right_eye = self.find_eyes(img=detected_face)
+
+                    if left_eye is not None:
+                        left_eye = (int(x + left_eye[0]), int(y + left_eye[1]))
+                    if right_eye is not None:
+                        right_eye = (int(x + right_eye[0]), int(y + right_eye[1]))
+
+                    facial_area = FacialAreaRegion(
+                        x=x,
+                        y=y,
+                        w=w,
+                        h=h,
+                        left_eye=left_eye,
+                        right_eye=right_eye,
+                        confidence=(100 - confidence) / 100,
+                    )
+                    resp.append(facial_area)
+
+            batch_results.append(resp)
+
+        return batch_results if len(batch_results) > 1 else batch_results[0]
 
     def find_eyes(self, img: np.ndarray) -> tuple:
         """

From 1bd83356e7761875190c2d6856a8596c79a2c67c Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 15:59:13 +0000
Subject: [PATCH 06/41] yolo detect batched

---
 deepface/models/face_detection/Yolo.py | 111 ++++++++++++++-----------
 1 file changed, 62 insertions(+), 49 deletions(-)

diff --git a/deepface/models/face_detection/Yolo.py b/deepface/models/face_detection/Yolo.py
index 233f0885..34fdb017 100644
--- a/deepface/models/face_detection/Yolo.py
+++ b/deepface/models/face_detection/Yolo.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import List, Any
+from typing import List, Any, Union, Tuple
 from enum import Enum
 
 # 3rd party dependencies
@@ -62,64 +62,77 @@ def build_model(self, model: YoloModel) -> Any:
         # Return face_detector
         return YOLO(weight_file)
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, imgs: Union[np.ndarray, List[np.ndarray]]) -> Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]:
         """
-        Detect and align face with yolo
+        Detect and align faces in an image or a list of images with yolo
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
+                A list of lists of FacialAreaRegion objects for each image or a list of FacialAreaRegion objects
         """
-        resp = []
+        if not isinstance(imgs, list):
+            imgs = [imgs]
 
-        # Detect faces
-        results = self.model.predict(
-            img,
+        all_results = []
+
+        # Detect faces for all images
+        results_list = self.model.predict(
+            imgs,
             verbose=False,
             show=False,
             conf=float(os.getenv("YOLO_MIN_DETECTION_CONFIDENCE", "0.25")),
-        )[0]
-
-        # For each face, extract the bounding box, the landmarks and confidence
-        for result in results:
-
-            if result.boxes is None:
-                continue
-
-            # Extract the bounding box and the confidence
-            x, y, w, h = result.boxes.xywh.tolist()[0]
-            confidence = result.boxes.conf.tolist()[0]
-
-            right_eye = None
-            left_eye = None
-
-            # yolo-facev8 is detecting eyes through keypoints,
-            # while for v11 keypoints are always None
-            if result.keypoints is not None:
-                # right_eye_conf = result.keypoints.conf[0][0]
-                # left_eye_conf = result.keypoints.conf[0][1]
-                right_eye = result.keypoints.xy[0][0].tolist()
-                left_eye = result.keypoints.xy[0][1].tolist()
-
-                # eyes are list of float, need to cast them tuple of int
-                left_eye = tuple(int(i) for i in left_eye)
-                right_eye = tuple(int(i) for i in right_eye)
-
-            x, y, w, h = int(x - w / 2), int(y - h / 2), int(w), int(h)
-            facial_area = FacialAreaRegion(
-                x=x,
-                y=y,
-                w=w,
-                h=h,
-                left_eye=left_eye,
-                right_eye=right_eye,
-                confidence=confidence,
-            )
-            resp.append(facial_area)
-
-        return resp
+        )
+
+        # Iterate over each image's results
+        for results in results_list:
+            resp = []
+
+            # For each face, extract the bounding box, the landmarks and confidence
+            for result in results:
+
+                if result.boxes is None:
+                    continue
+
+                # Extract the bounding box and the confidence
+                x, y, w, h = result.boxes.xywh.tolist()[0]
+                confidence = result.boxes.conf.tolist()[0]
+
+                right_eye = None
+                left_eye = None
+
+                # yolo-facev8 is detecting eyes through keypoints,
+                # while for v11 keypoints are always None
+                if result.keypoints is not None:
+                    # right_eye_conf = result.keypoints.conf[0][0]
+                    # left_eye_conf = result.keypoints.conf[0][1]
+                    right_eye = result.keypoints.xy[0][0].tolist()
+                    left_eye = result.keypoints.xy[0][1].tolist()
+
+                    # eyes are list of float, need to cast them tuple of int
+                    # Ensure eyes are tuples of exactly two integers or None
+                    left_eye = tuple(map(int, left_eye[:2])) if left_eye and len(left_eye) == 2 else None
+                    right_eye = tuple(map(int, right_eye[:2])) if right_eye and len(right_eye) == 2 else None
+
+                x, y, w, h = int(x - w / 2), int(y - h / 2), int(w), int(h)
+                facial_area = FacialAreaRegion(
+                    x=x,
+                    y=y,
+                    w=w,
+                    h=h,
+                    left_eye=left_eye,
+                    right_eye=right_eye,
+                    confidence=confidence,
+                )
+                resp.append(facial_area)
+
+            all_results.append(resp)
+
+        if len(all_results) == 1:
+            return all_results[0]
+        return all_results
 
 
 class YoloDetectorClientV8n(YoloDetectorClient):

From bbf6a55037cc8243bbff0d637320dbb3475186a7 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 16:05:16 +0000
Subject: [PATCH 07/41] enhance batched detector test

---
 tests/test_extract_faces.py | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 89f025d7..e78576a7 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -80,7 +80,7 @@ def test_different_detectors():
 
 
 @pytest.mark.parametrize("detector_backend", [
-    # "YOLO",
+    "yolov11n",
     "opencv",
 ])
 def test_batch_extract_faces(detector_backend):
@@ -89,8 +89,19 @@ def test_batch_extract_faces(detector_backend):
         "dataset/img3.jpg",
         "dataset/img11.jpg",
     ]
-    img_objs = DeepFace.extract_faces(img_path=img_paths, detector_backend=detector_backend)
-    assert len(img_objs) == 3
+    
+    # Extract faces one by one
+    img_objs_individual = [DeepFace.extract_faces(img_path=img_path, detector_backend=detector_backend)[0] for img_path in img_paths]
+    
+    # Extract faces in batch
+    img_objs_batch = DeepFace.extract_faces(img_path=img_paths, detector_backend=detector_backend)
+    
+    assert len(img_objs_batch) == len(img_objs_individual)
+    
+    for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):
+        assert np.array_equal(img_obj_individual["face"], img_obj_batch["face"])
+        assert img_obj_individual["facial_area"] == img_obj_batch["facial_area"]
+        assert img_obj_individual["confidence"] == img_obj_batch["confidence"]
 
 
 def test_backends_for_enforced_detection_with_non_facial_inputs():

From ba2ff90ac4e11d32ae5b90d0401e31e8a868ddad Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Wed, 12 Feb 2025 16:35:16 +0000
Subject: [PATCH 08/41] mtcnn batching

---
 deepface/models/face_detection/MtCnn.py | 62 +++++++++++++++----------
 1 file changed, 38 insertions(+), 24 deletions(-)

diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index 014e4a53..8f4c6247 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List
+from typing import List, Union
 
 # 3rd party dependencies
 import numpy as np
@@ -17,44 +17,58 @@ class MtCnnClient(Detector):
     def __init__(self):
         self.model = MTCNN()
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(
+        self, 
+        img: Union[np.ndarray, 
+        List[np.ndarray]]
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
-        Detect and align face with mtcnn
+        Detect and align faces with mtcnn for a list of images
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            imgs (Union[np.ndarray, List[np.ndarray]]): 
+                pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+                A list of FacialAreaRegion objects for a single image or a list of lists of FacialAreaRegion objects for each image
         """
 
+        if not isinstance(img, list):
+            img = [img]
+
         resp = []
 
         # mtcnn expects RGB but OpenCV read BGR
         # img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
-        img_rgb = img[:, :, ::-1]
+        img_rgb = [img[:, :, ::-1] for img in img]
         detections = self.model.detect_faces(img_rgb)
 
-        if detections is not None and len(detections) > 0:
+        for image_detections in detections:
+            image_resp = []
+            if image_detections is not None and len(image_detections) > 0:
+                for current_detection in image_detections:
+                    x, y, w, h = current_detection["box"]
+                    confidence = current_detection["confidence"]
+                    # mtcnn detector assigns left eye with respect to the observer
+                    # but we are setting it with respect to the person itself
+                    left_eye = current_detection["keypoints"]["right_eye"]
+                    right_eye = current_detection["keypoints"]["left_eye"]
 
-            for current_detection in detections:
-                x, y, w, h = current_detection["box"]
-                confidence = current_detection["confidence"]
-                # mtcnn detector assigns left eye with respect to the observer
-                # but we are setting it with respect to the person itself
-                left_eye = current_detection["keypoints"]["right_eye"]
-                right_eye = current_detection["keypoints"]["left_eye"]
+                    facial_area = FacialAreaRegion(
+                        x=x,
+                        y=y,
+                        w=w,
+                        h=h,
+                        left_eye=left_eye,
+                        right_eye=right_eye,
+                        confidence=confidence,
+                    )
 
-                facial_area = FacialAreaRegion(
-                    x=x,
-                    y=y,
-                    w=w,
-                    h=h,
-                    left_eye=left_eye,
-                    right_eye=right_eye,
-                    confidence=confidence,
-                )
+                    image_resp.append(facial_area)
 
-                resp.append(facial_area)
+            resp.append(image_resp)
 
+        if len(resp) == 1:
+            return resp[0]
         return resp

From ad0172472625787c48e027a864748b2ca1125982 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Thu, 13 Feb 2025 12:43:32 +0000
Subject: [PATCH 09/41] soft test

---
 tests/test_extract_faces.py | 37 +++++++++++++++++++++++++++++--------
 1 file changed, 29 insertions(+), 8 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index e78576a7..3bb67e5e 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -80,8 +80,10 @@ def test_different_detectors():
 
 
 @pytest.mark.parametrize("detector_backend", [
-    "yolov11n",
-    "opencv",
+    # "yolov11n",
+    # "yolov8",
+    "yolov11s",
+    # "opencv",
 ])
 def test_batch_extract_faces(detector_backend):
     img_paths = [
@@ -91,18 +93,37 @@ def test_batch_extract_faces(detector_backend):
     ]
     
     # Extract faces one by one
-    img_objs_individual = [DeepFace.extract_faces(img_path=img_path, detector_backend=detector_backend)[0] for img_path in img_paths]
+    img_objs_individual = [
+        DeepFace.extract_faces(
+            img_path=img_path,
+            detector_backend=detector_backend,
+            align=True,
+        )[0] for img_path in img_paths
+    ]
     
     # Extract faces in batch
-    img_objs_batch = DeepFace.extract_faces(img_path=img_paths, detector_backend=detector_backend)
+    img_objs_batch = DeepFace.extract_faces(
+        img_path=img_paths,
+        detector_backend=detector_backend,
+        align=True,
+    )
     
     assert len(img_objs_batch) == len(img_objs_individual)
     
     for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):
-        assert np.array_equal(img_obj_individual["face"], img_obj_batch["face"])
-        assert img_obj_individual["facial_area"] == img_obj_batch["facial_area"]
-        assert img_obj_individual["confidence"] == img_obj_batch["confidence"]
-
+        # assert np.array_equal(img_obj_individual["face"], img_obj_batch["face"])
+        for key in img_obj_individual["facial_area"]:
+            if key == "left_eye" or key == "right_eye":
+                continue
+            assert abs(
+                img_obj_individual["facial_area"][key] - 
+                img_obj_batch["facial_area"][key]
+            ) <= 0.03 * img_obj_individual["facial_area"][key]
+        assert abs(
+            img_obj_individual["confidence"] - 
+            img_obj_batch["confidence"]
+        ) <= 0.03 * img_obj_individual["confidence"]
+    
 
 def test_backends_for_enforced_detection_with_non_facial_inputs():
     black_img = np.zeros([224, 224, 3])

From 799f83cd7bb4696ed5d208d8000656aab06f0d67 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Thu, 13 Feb 2025 12:43:54 +0000
Subject: [PATCH 10/41] true batching on detect_faces

---
 deepface/modules/detection.py | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 21d09f56..9fa2c830 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -230,8 +230,10 @@ def detect_faces(
     face_detector: Detector = modeling.build_model(
         task="face_detector", model_name=detector_backend
     )
-    all_detected_faces = []
 
+    preprocessed_images = []
+    width_borders = []
+    height_borders = []
     for single_img in img:
         height, width, _ = single_img.shape
 
@@ -258,8 +260,20 @@ def detect_faces(
                 value=[0, 0, 0],  # Color of the border (black)
             )
 
-        # find facial areas of given image
-        facial_areas = face_detector.detect_faces(single_img)
+        preprocessed_images.append(single_img)
+        width_borders.append(width_border)
+        height_borders.append(height_border)
+
+    # Detect faces in all preprocessed images
+    all_facial_areas = face_detector.detect_faces(preprocessed_images)
+
+    if len(preprocessed_images) == 1:
+        all_facial_areas = [all_facial_areas]
+
+    all_detected_faces = []
+    for single_img, facial_areas, width_border, height_border in zip(preprocessed_images, all_facial_areas, width_borders, height_borders):
+        if not isinstance(facial_areas, list):
+            facial_areas = [facial_areas]
 
         if max_faces is not None and max_faces < len(facial_areas):
             facial_areas = nlargest(
@@ -275,7 +289,7 @@ def detect_faces(
                 width_border=width_border,
                 height_border=height_border,
             )
-            for facial_area in facial_areas
+            for facial_area in facial_areas if isinstance(facial_area, FacialAreaRegion)
         ]
 
         all_detected_faces.append(detected_faces)

From 619930cd1e0b3f6192492c18e910bb3cad93015f Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 16 Feb 2025 13:22:01 +0000
Subject: [PATCH 11/41] detection skip

---
 deepface/modules/detection.py | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 9fa2c830..88cd63ea 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -226,6 +226,15 @@ def detect_faces(
     """
     if not isinstance(img, list):
         img = [img]
+    
+    if detector_backend == "skip":
+        all_face_objs = [
+            [DetectedFace(img=single_img, facial_area=FacialAreaRegion(x=0, y=0, w=single_img.shape[1], h=single_img.shape[0]), confidence=0)]
+            for single_img in img
+        ]
+        if len(img) == 1:
+            all_face_objs = all_face_objs[0]
+        return all_face_objs
 
     face_detector: Detector = modeling.build_model(
         task="face_detector", model_name=detector_backend

From b544a2d866a7a439d5c7087427afab248870094e Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 16 Feb 2025 13:54:28 +0000
Subject: [PATCH 12/41] pseudo batched retinaface

---
 deepface/models/face_detection/RetinaFace.py | 115 ++++++++++---------
 1 file changed, 59 insertions(+), 56 deletions(-)

diff --git a/deepface/models/face_detection/RetinaFace.py b/deepface/models/face_detection/RetinaFace.py
index c687322e..ca98a549 100644
--- a/deepface/models/face_detection/RetinaFace.py
+++ b/deepface/models/face_detection/RetinaFace.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List
+from typing import List, Union
 
 # 3rd party dependencies
 import numpy as np
@@ -13,64 +13,67 @@ class RetinaFaceClient(Detector):
     def __init__(self):
         self.model = rf.build_model()
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
-        Detect and align face with retinaface
+        Detect and align faces with retinaface in an image or a list of images
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        resp = []
-
-        obj = rf.detect_faces(img, model=self.model, threshold=0.9)
-
-        if not isinstance(obj, dict):
-            return resp
-
-        for face_idx in obj.keys():
-            identity = obj[face_idx]
-            detection = identity["facial_area"]
-
-            y = detection[1]
-            h = detection[3] - y
-            x = detection[0]
-            w = detection[2] - x
-
-            # retinaface sets left and right eyes with respect to the person
-            left_eye = identity["landmarks"]["left_eye"]
-            right_eye = identity["landmarks"]["right_eye"]
-            nose = identity["landmarks"].get("nose")
-            mouth_right = identity["landmarks"].get("mouth_right")
-            mouth_left = identity["landmarks"].get("mouth_left")
-
-            # eyes are list of float, need to cast them tuple of int
-            left_eye = tuple(int(i) for i in left_eye)
-            right_eye = tuple(int(i) for i in right_eye)
-            if nose is not None:
-                nose = tuple(int(i) for i in nose)
-            if mouth_right is not None:
-                mouth_right = tuple(int(i) for i in mouth_right)
-            if mouth_left is not None:
-                mouth_left = tuple(int(i) for i in mouth_left)
-
-            confidence = identity["score"]
-
-            facial_area = FacialAreaRegion(
-                x=x,
-                y=y,
-                w=w,
-                h=h,
-                left_eye=left_eye,
-                right_eye=right_eye,
-                confidence=confidence,
-                nose=nose,
-                mouth_left=mouth_left,
-                mouth_right=mouth_right,
-            )
-
-            resp.append(facial_area)
-
-        return resp
+        if isinstance(img, np.ndarray):
+            imgs = [img]
+        else:
+            imgs = img
+
+        batch_results = []
+
+        for img in imgs:
+            resp = []
+            obj = rf.detect_faces(img, model=self.model, threshold=0.9)
+
+            if isinstance(obj, dict):
+                for face_idx in obj.keys():
+                    identity = obj[face_idx]
+                    detection = identity["facial_area"]
+
+                    y = detection[1]
+                    h = detection[3] - y
+                    x = detection[0]
+                    w = detection[2] - x
+
+                    left_eye = tuple(int(i) for i in identity["landmarks"]["left_eye"])
+                    right_eye = tuple(int(i) for i in identity["landmarks"]["right_eye"])
+                    nose = identity["landmarks"].get("nose")
+                    mouth_right = identity["landmarks"].get("mouth_right")
+                    mouth_left = identity["landmarks"].get("mouth_left")
+
+                    if nose is not None:
+                        nose = tuple(int(i) for i in nose)
+                    if mouth_right is not None:
+                        mouth_right = tuple(int(i) for i in mouth_right)
+                    if mouth_left is not None:
+                        mouth_left = tuple(int(i) for i in mouth_left)
+
+                    confidence = identity["score"]
+
+                    facial_area = FacialAreaRegion(
+                        x=x,
+                        y=y,
+                        w=w,
+                        h=h,
+                        left_eye=left_eye,
+                        right_eye=right_eye,
+                        confidence=confidence,
+                        nose=nose,
+                        mouth_left=mouth_left,
+                        mouth_right=mouth_right,
+                    )
+
+                    resp.append(facial_area)
+
+            batch_results.append(resp)
+
+        return batch_results if len(batch_results) > 1 else batch_results[0]

From 8bfdcf139a9cd9b1ba9e3b5c668ffb13d56a5903 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 16 Feb 2025 14:05:56 +0000
Subject: [PATCH 13/41] test diff detetors

---
 tests/test_extract_faces.py | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 3bb67e5e..24f404e1 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -80,10 +80,8 @@ def test_different_detectors():
 
 
 @pytest.mark.parametrize("detector_backend", [
-    # "yolov11n",
-    # "yolov8",
-    "yolov11s",
-    # "opencv",
+    "opencv",
+    "ssd"
 ])
 def test_batch_extract_faces(detector_backend):
     img_paths = [

From 7e59cdf05d2b47ffeb1c6118e5edf476b22b4a5c Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 16 Feb 2025 14:09:05 +0000
Subject: [PATCH 14/41] lint

---
 deepface/models/Detector.py                  |   7 +-
 deepface/models/face_detection/MtCnn.py      |   8 +-
 deepface/models/face_detection/OpenCv.py     |  23 ++-
 deepface/models/face_detection/RetinaFace.py |  17 +-
 deepface/models/face_detection/Ssd.py        | 161 ++++++++++---------
 deepface/models/face_detection/Yolo.py       |  34 ++--
 deepface/modules/detection.py                |  39 ++++-
 7 files changed, 176 insertions(+), 113 deletions(-)

diff --git a/deepface/models/Detector.py b/deepface/models/Detector.py
index 70675cd1..6db5e7be 100644
--- a/deepface/models/Detector.py
+++ b/deepface/models/Detector.py
@@ -10,14 +10,15 @@
 class Detector(ABC):
     @abstractmethod
     def detect_faces(
-        self, 
-        imgs: Union[np.ndarray, List[np.ndarray]]
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
     ) -> Union[List["FacialAreaRegion"], List[List["FacialAreaRegion"]]]:
         """
         Interface for detect and align faces in a batch of images
 
         Args:
-            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            Pre-loaded image as numpy array or a list of those
 
         Returns:
             results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index 8f4c6247..de43b968 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -18,9 +18,8 @@ def __init__(self):
         self.model = MTCNN()
 
     def detect_faces(
-        self, 
-        img: Union[np.ndarray, 
-        List[np.ndarray]]
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
     ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align faces with mtcnn for a list of images
@@ -31,7 +30,8 @@ def detect_faces(
 
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-                A list of FacialAreaRegion objects for a single image or a list of lists of FacialAreaRegion objects for each image
+                A list of FacialAreaRegion objects for a single image 
+                or a list of lists of FacialAreaRegion objects for each image
         """
 
         if not isinstance(img, list):
diff --git a/deepface/models/face_detection/OpenCv.py b/deepface/models/face_detection/OpenCv.py
index ac376b8d..f97f6586 100644
--- a/deepface/models/face_detection/OpenCv.py
+++ b/deepface/models/face_detection/OpenCv.py
@@ -29,35 +29,42 @@ def build_model(self):
         detector["eye_detector"] = self.__build_cascade("haarcascade_eye")
         return detector
 
-    def detect_faces(self, imgs: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with opencv
 
         Args:
-            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]):
+            Pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(imgs, np.ndarray):
-            imgs = [imgs]
+        if isinstance(img, np.ndarray):
+            imgs = [img]
+        else:
+            imgs = img
 
         batch_results = []
 
-        for img in imgs:
+        for single_img in imgs:
             resp = []
             detected_face = None
             faces = []
             try:
                 faces, _, scores = self.model["face_detector"].detectMultiScale3(
-                    img, 1.1, 10, outputRejectLevels=True
+                    single_img, 1.1, 10, outputRejectLevels=True
                 )
             except:
                 pass
 
             if len(faces) > 0:
                 for (x, y, w, h), confidence in zip(faces, scores):
-                    detected_face = img[int(y):int(y + h), int(x):int(x + w)]
+                    detected_face = single_img[int(y):int(y + h), int(x):int(x + w)]
                     left_eye, right_eye = self.find_eyes(img=detected_face)
 
                     if left_eye is not None:
diff --git a/deepface/models/face_detection/RetinaFace.py b/deepface/models/face_detection/RetinaFace.py
index ca98a549..b0d1c949 100644
--- a/deepface/models/face_detection/RetinaFace.py
+++ b/deepface/models/face_detection/RetinaFace.py
@@ -13,15 +13,20 @@ class RetinaFaceClient(Detector):
     def __init__(self):
         self.model = rf.build_model()
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
-        Detect and align faces with retinaface in an image or a list of images
+        Detect and align faces with retinaface in a batch of images
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            Pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
         if isinstance(img, np.ndarray):
             imgs = [img]
@@ -30,9 +35,9 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
 
         batch_results = []
 
-        for img in imgs:
+        for single_img in imgs:
             resp = []
-            obj = rf.detect_faces(img, model=self.model, threshold=0.9)
+            obj = rf.detect_faces(single_img, model=self.model, threshold=0.9)
 
             if isinstance(obj, dict):
                 for face_idx in obj.keys():
diff --git a/deepface/models/face_detection/Ssd.py b/deepface/models/face_detection/Ssd.py
index 449144f0..c0ae2cbf 100644
--- a/deepface/models/face_detection/Ssd.py
+++ b/deepface/models/face_detection/Ssd.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List
+from typing import List, Union
 from enum import IntEnum
 
 # 3rd party dependencies
@@ -54,83 +54,96 @@ def build_model(self) -> dict:
 
         return {"face_detector": face_detector, "opencv_module": OpenCv.OpenCvClient()}
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
-        Detect and align face with ssd
+        Detect and align faces with ssd in a batch of images
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            Pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
-
-        # Because cv2.dnn.blobFromImage expects CV_8U (8-bit unsigned integer) values
-        if img.dtype != np.uint8:
-            img = img.astype(np.uint8)
-
-        opencv_module: OpenCv.OpenCvClient = self.model["opencv_module"]
-
-        target_size = (300, 300)
-
-        original_size = img.shape
-
-        current_img = cv2.resize(img, target_size)
-
-        aspect_ratio_x = original_size[1] / target_size[1]
-        aspect_ratio_y = original_size[0] / target_size[0]
-
-        imageBlob = cv2.dnn.blobFromImage(image=current_img)
-
-        face_detector = self.model["face_detector"]
-        face_detector.setInput(imageBlob)
-        detections = face_detector.forward()
-
-        class ssd_labels(IntEnum):
-            img_id = 0
-            is_face = 1
-            confidence = 2
-            left = 3
-            top = 4
-            right = 5
-            bottom = 6
-
-        faces = detections[0][0]
-        faces = faces[
-            (faces[:, ssd_labels.is_face] == 1) & (faces[:, ssd_labels.confidence] >= 0.90)
-        ]
-        margins = [ssd_labels.left, ssd_labels.top, ssd_labels.right, ssd_labels.bottom]
-        faces[:, margins] = np.int32(faces[:, margins] * 300)
-        faces[:, margins] = np.int32(
-            faces[:, margins] * [aspect_ratio_x, aspect_ratio_y, aspect_ratio_x, aspect_ratio_y]
-        )
-        faces[:, [ssd_labels.right, ssd_labels.bottom]] -= faces[
-            :, [ssd_labels.left, ssd_labels.top]
-        ]
-
-        resp = []
-        for face in faces:
-            confidence = float(face[ssd_labels.confidence])
-            x, y, w, h = map(int, face[margins])
-            detected_face = img[y : y + h, x : x + w]
-
-            left_eye, right_eye = opencv_module.find_eyes(detected_face)
-
-            # eyes found in the detected face instead image itself
-            # detected face's coordinates should be added
-            if left_eye is not None:
-                left_eye = x + int(left_eye[0]), y + int(left_eye[1])
-            if right_eye is not None:
-                right_eye = x + int(right_eye[0]), y + int(right_eye[1])
-
-            facial_area = FacialAreaRegion(
-                x=x,
-                y=y,
-                w=w,
-                h=h,
-                left_eye=left_eye,
-                right_eye=right_eye,
-                confidence=confidence,
+        if isinstance(img, np.ndarray):
+            imgs = [img]
+        else:
+            imgs = img
+
+        batch_results = []
+
+        for single_img in imgs:
+            # Because cv2.dnn.blobFromImage expects CV_8U (8-bit unsigned integer) values
+            if single_img.dtype != np.uint8:
+                single_img = single_img.astype(np.uint8)
+
+            opencv_module: OpenCv.OpenCvClient = self.model["opencv_module"]
+
+            target_size = (300, 300)
+            original_size = single_img.shape
+            current_img = cv2.resize(single_img, target_size)
+
+            aspect_ratio_x = original_size[1] / target_size[1]
+            aspect_ratio_y = original_size[0] / target_size[0]
+
+            imageBlob = cv2.dnn.blobFromImage(image=current_img)
+
+            face_detector = self.model["face_detector"]
+            face_detector.setInput(imageBlob)
+            detections = face_detector.forward()
+
+            class ssd_labels(IntEnum):
+                img_id = 0
+                is_face = 1
+                confidence = 2
+                left = 3
+                top = 4
+                right = 5
+                bottom = 6
+
+            faces = detections[0][0]
+            faces = faces[
+                (faces[:, ssd_labels.is_face] == 1) & (faces[:, ssd_labels.confidence] >= 0.90)
+            ]
+            margins = [ssd_labels.left, ssd_labels.top, ssd_labels.right, ssd_labels.bottom]
+            faces[:, margins] = np.int32(faces[:, margins] * 300)
+            faces[:, margins] = np.int32(
+                faces[:, margins] * [aspect_ratio_x, aspect_ratio_y, aspect_ratio_x, aspect_ratio_y]
             )
-            resp.append(facial_area)
-        return resp
+            faces[:, [ssd_labels.right, ssd_labels.bottom]] -= faces[
+                :, [ssd_labels.left, ssd_labels.top]
+            ]
+
+            resp = []
+            for face in faces:
+                confidence = float(face[ssd_labels.confidence])
+                x, y, w, h = map(int, face[margins])
+                detected_face = single_img[y : y + h, x : x + w]
+
+                left_eye, right_eye = opencv_module.find_eyes(detected_face)
+
+                # eyes found in the detected face instead image itself
+                # detected face's coordinates should be added
+                if left_eye is not None:
+                    left_eye = x + int(left_eye[0]), y + int(left_eye[1])
+                if right_eye is not None:
+                    right_eye = x + int(right_eye[0]), y + int(right_eye[1])
+
+                facial_area = FacialAreaRegion(
+                    x=x,
+                    y=y,
+                    w=w,
+                    h=h,
+                    left_eye=left_eye,
+                    right_eye=right_eye,
+                    confidence=confidence,
+                )
+                resp.append(facial_area)
+
+            batch_results.append(resp)
+
+        return batch_results if len(batch_results) > 1 else batch_results[0]
diff --git a/deepface/models/face_detection/Yolo.py b/deepface/models/face_detection/Yolo.py
index 34fdb017..cbb88799 100644
--- a/deepface/models/face_detection/Yolo.py
+++ b/deepface/models/face_detection/Yolo.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import List, Any, Union, Tuple
+from typing import List, Any, Union
 from enum import Enum
 
 # 3rd party dependencies
@@ -62,25 +62,30 @@ def build_model(self, model: YoloModel) -> Any:
         # Return face_detector
         return YOLO(weight_file)
 
-    def detect_faces(self, imgs: Union[np.ndarray, List[np.ndarray]]) -> Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]]
+    ) -> Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]:
         """
-        Detect and align faces in an image or a list of images with yolo
+        Detect and align faces in a batch of images with yolo
 
         Args:
-            imgs (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            Pre-loaded image as numpy array or a list of those
 
         Returns:
             results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
-                A list of lists of FacialAreaRegion objects for each image or a list of FacialAreaRegion objects
+            A list of lists of FacialAreaRegion objects 
+            for each image or a list of FacialAreaRegion objects
         """
-        if not isinstance(imgs, list):
-            imgs = [imgs]
+        if not isinstance(img, list):
+            img = [img]
 
         all_results = []
 
         # Detect faces for all images
         results_list = self.model.predict(
-            imgs,
+            img,
             verbose=False,
             show=False,
             conf=float(os.getenv("YOLO_MIN_DETECTION_CONFIDENCE", "0.25")),
@@ -113,9 +118,16 @@ def detect_faces(self, imgs: Union[np.ndarray, List[np.ndarray]]) -> Union[List[
 
                     # eyes are list of float, need to cast them tuple of int
                     # Ensure eyes are tuples of exactly two integers or None
-                    left_eye = tuple(map(int, left_eye[:2])) if left_eye and len(left_eye) == 2 else None
-                    right_eye = tuple(map(int, right_eye[:2])) if right_eye and len(right_eye) == 2 else None
-
+                    left_eye = (
+                        tuple(map(int, left_eye[:2]))
+                        if left_eye and len(left_eye) == 2
+                        else None
+                    )
+                    right_eye = (
+                        tuple(map(int, right_eye[:2]))
+                        if right_eye and len(right_eye) == 2
+                        else None
+                    )
                 x, y, w, h = int(x - w / 2), int(y - h / 2), int(w), int(h)
                 facial_area = FacialAreaRegion(
                     x=x,
diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 88cd63ea..5d974dfc 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -34,8 +34,9 @@ def extract_faces(
     Extract faces from a given image or list of images
 
     Args:
-        img_paths (List[str or np.ndarray or IO[bytes]] or str or np.ndarray or IO[bytes]): Path(s) to the image(s). Accepts exact image path
-            as a string, numpy array (BGR), a file object that supports at least `.read` and is
+        img_paths (List[str or np.ndarray or IO[bytes]] or str or np.ndarray or IO[bytes]): 
+            Path(s) to the image(s) as a string, 
+            numpy array (BGR), a file object that supports at least `.read` and is
             opened in binary mode, or base64 encoded images.
 
         detector_backend (string): face detector backend. Options: 'opencv', 'retinaface',
@@ -148,7 +149,10 @@ def extract_faces(
                 elif color_face == "gray":
                     current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)
                 else:
-                    raise ValueError(f"The color_face can be rgb, bgr or gray, but it is {color_face}.")
+                    raise ValueError(
+                        f"The color_face can be rgb, bgr or gray, "
+                        f"but it is {color_face}."
+                    )
 
             if normalize_face:
                 current_img = current_img / 255  # normalize input in [0, 1]
@@ -184,7 +188,10 @@ def extract_faces(
 
             if anti_spoofing is True:
                 antispoof_model = modeling.build_model(task="spoofing", model_name="Fasnet")
-                is_real, antispoof_score = antispoof_model.analyze(img=img, facial_area=(x, y, w, h))
+                is_real, antispoof_score = antispoof_model.analyze(
+                    img=img,
+                    facial_area=(x, y, w, h)
+                )
                 resp_obj["is_real"] = is_real
                 resp_obj["antispoof_score"] = antispoof_score
 
@@ -226,10 +233,18 @@ def detect_faces(
     """
     if not isinstance(img, list):
         img = [img]
-    
+
     if detector_backend == "skip":
         all_face_objs = [
-            [DetectedFace(img=single_img, facial_area=FacialAreaRegion(x=0, y=0, w=single_img.shape[1], h=single_img.shape[0]), confidence=0)]
+            [
+                DetectedFace(
+                    img=single_img,
+                    facial_area=FacialAreaRegion(
+                        x=0, y=0, w=single_img.shape[1], h=single_img.shape[0]
+                    ),
+                    confidence=0,
+                )
+            ]
             for single_img in img
         ]
         if len(img) == 1:
@@ -280,7 +295,17 @@ def detect_faces(
         all_facial_areas = [all_facial_areas]
 
     all_detected_faces = []
-    for single_img, facial_areas, width_border, height_border in zip(preprocessed_images, all_facial_areas, width_borders, height_borders):
+    for (
+        single_img,
+        facial_areas,
+        width_border,
+        height_border
+    ) in zip(
+        preprocessed_images,
+        all_facial_areas,
+        width_borders,
+        height_borders
+    ):
         if not isinstance(facial_areas, list):
             facial_areas = [facial_areas]
 

From 0f67ddaf9f82f6b576842aa345657ca13f4a3382 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Mon, 17 Feb 2025 12:08:32 +0000
Subject: [PATCH 15/41] optional MtCnn batching (does not work in python3.8)

---
 deepface/models/face_detection/MtCnn.py | 27 ++++++++++++++++++++++++-
 1 file changed, 26 insertions(+), 1 deletion(-)

diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index de43b968..b3bb306a 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -1,4 +1,5 @@
 # built-in dependencies
+import logging
 from typing import List, Union
 
 # 3rd party dependencies
@@ -8,6 +9,8 @@
 # project dependencies
 from deepface.models.Detector import Detector, FacialAreaRegion
 
+logger = logging.getLogger(__name__)
+
 # pylint: disable=too-few-public-methods
 class MtCnnClient(Detector):
     """
@@ -16,6 +19,7 @@ class MtCnnClient(Detector):
 
     def __init__(self):
         self.model = MTCNN()
+        self.supports_batch_detection = self._supports_batch_detection()
 
     def detect_faces(
         self,
@@ -42,7 +46,10 @@ def detect_faces(
         # mtcnn expects RGB but OpenCV read BGR
         # img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
         img_rgb = [img[:, :, ::-1] for img in img]
-        detections = self.model.detect_faces(img_rgb)
+        if self.supports_batch_detection:
+            detections = self.model.detect_faces(img_rgb)
+        else:
+            detections = [self.model.detect_faces(single_img) for single_img in img_rgb]
 
         for image_detections in detections:
             image_resp = []
@@ -72,3 +79,21 @@ def detect_faces(
         if len(resp) == 1:
             return resp[0]
         return resp
+    
+    def _supports_batch_detection(self) -> bool:
+        import mtcnn
+        try:
+            mtcnn_version = mtcnn.__version__
+        except AttributeError:
+            try:
+                import mtcnn.metadata
+                mtcnn_version = mtcnn.metadata.__version__
+            except AttributeError:
+                logger.warning("Failed to determine mtcnn version")
+                logger.warning("Fallback to single image detection")
+                return False
+        supports_batch_detection = mtcnn_version >= "1.0.0"
+        if not supports_batch_detection:
+            logger.warning("MtCnn version is less than 1.0.0, batch detection is not supported")
+            logger.warning("Fallback to single image detection")
+        return supports_batch_detection

From c4b4b4a7366d72b79840966097a6aa74c3b904ae Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Mon, 17 Feb 2025 12:28:44 +0000
Subject: [PATCH 16/41] lint

---
 deepface/models/face_detection/MtCnn.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index b3bb306a..be3a51fa 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -79,7 +79,7 @@ def detect_faces(
         if len(resp) == 1:
             return resp[0]
         return resp
-    
+
     def _supports_batch_detection(self) -> bool:
         import mtcnn
         try:

From 60bee4e1a98a40829f8637a998a0d324c4b46650 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Thu, 13 Feb 2025 13:59:16 +0000
Subject: [PATCH 17/41] detect faces return list of lists on batched inputs

---
 deepface/DeepFace.py          |  5 +++--
 deepface/modules/detection.py | 12 +++++++++---
 tests/test_extract_faces.py   |  6 ++++++
 3 files changed, 18 insertions(+), 5 deletions(-)

diff --git a/deepface/DeepFace.py b/deepface/DeepFace.py
index eeacbe7a..f4253c4e 100644
--- a/deepface/DeepFace.py
+++ b/deepface/DeepFace.py
@@ -519,7 +519,7 @@ def extract_faces(
     color_face: str = "rgb",
     normalize_face: bool = True,
     anti_spoofing: bool = False,
-) -> List[Dict[str, Any]]:
+) -> Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]:
     """
     Extract faces from a given image or sequence of images.
 
@@ -551,7 +551,8 @@ def extract_faces(
         anti_spoofing (boolean): Flag to enable anti spoofing (default is False).
 
     Returns:
-        results (List[Dict[str, Any]]): A list of dictionaries, where each dictionary contains:
+        results (Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]): 
+        A list or a list of lists of dictionaries, where each dictionary contains:
 
         - "face" (np.ndarray): The detected face as a NumPy array.
 
diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 5d974dfc..e3b679d0 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -29,7 +29,7 @@ def extract_faces(
     normalize_face: bool = True,
     anti_spoofing: bool = False,
     max_faces: Optional[int] = None,
-) -> List[Dict[str, Any]]:
+) -> Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]:
     """
     Extract faces from a given image or list of images
 
@@ -62,7 +62,8 @@ def extract_faces(
         anti_spoofing (boolean): Flag to enable anti spoofing (default is False).
 
     Returns:
-        results (List[Dict[str, Any]]): A list of dictionaries, where each dictionary contains:
+        results (Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]): 
+        A list or list of lists of dictionaries, where each dictionary contains:
 
         - "face" (np.ndarray): The detected face as a NumPy array in RGB format.
 
@@ -131,6 +132,7 @@ def extract_faces(
             base_region = FacialAreaRegion(x=0, y=0, w=width, h=height, confidence=0)
             face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
 
+        img_resp_objs = []
         for face_obj in face_objs:
             current_img = face_obj.img
             current_region = face_obj.facial_area
@@ -195,8 +197,12 @@ def extract_faces(
                 resp_obj["is_real"] = is_real
                 resp_obj["antispoof_score"] = antispoof_score
 
-            all_resp_objs.append(resp_obj)
+            img_resp_objs.append(resp_obj)
 
+        all_resp_objs.append(img_resp_objs)
+
+    if len(all_resp_objs) == 1:
+        return all_resp_objs[0]
     return all_resp_objs
 
 
diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 24f404e1..2c34d94b 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -106,6 +106,12 @@ def test_batch_extract_faces(detector_backend):
         align=True,
     )
     
+    assert (
+        len(img_objs_batch) == 3 and 
+        all(isinstance(obj, list) and len(obj) == 1 for obj in img_objs_batch)
+    )
+    img_objs_batch = [obj for sublist in img_objs_batch for obj in sublist]
+    
     assert len(img_objs_batch) == len(img_objs_individual)
     
     for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):

From f3d05ef2d5f081d14db0f67f63a7877f6a065702 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:03:17 +0000
Subject: [PATCH 18/41] add a couple to test batch extract faces

---
 tests/test_extract_faces.py | 48 +++++++++++++++++++++----------------
 1 file changed, 27 insertions(+), 21 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 2c34d94b..50a268b7 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -88,45 +88,51 @@ def test_batch_extract_faces(detector_backend):
         "dataset/img2.jpg",
         "dataset/img3.jpg",
         "dataset/img11.jpg",
+        "dataset/couple.jpg"
     ]
     
     # Extract faces one by one
-    img_objs_individual = [
+    imgs_objs_individual = [
         DeepFace.extract_faces(
             img_path=img_path,
             detector_backend=detector_backend,
             align=True,
-        )[0] for img_path in img_paths
+        ) for img_path in img_paths
     ]
     
     # Extract faces in batch
-    img_objs_batch = DeepFace.extract_faces(
+    imgs_objs_batch = DeepFace.extract_faces(
         img_path=img_paths,
         detector_backend=detector_backend,
         align=True,
     )
     
     assert (
-        len(img_objs_batch) == 3 and 
-        all(isinstance(obj, list) and len(obj) == 1 for obj in img_objs_batch)
+        len(imgs_objs_batch) == 4 and 
+        all(isinstance(obj, list) for obj in imgs_objs_batch)
     )
-    img_objs_batch = [obj for sublist in img_objs_batch for obj in sublist]
-    
-    assert len(img_objs_batch) == len(img_objs_individual)
-    
-    for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):
-        # assert np.array_equal(img_obj_individual["face"], img_obj_batch["face"])
-        for key in img_obj_individual["facial_area"]:
-            if key == "left_eye" or key == "right_eye":
-                continue
+    assert all(
+        len(imgs_objs_batch[i]) == 1 
+        for i in range(len(imgs_objs_batch[:-1]))
+    )
+    assert len(imgs_objs_batch[-1]) == 2
+
+    for img_objs_individual, img_objs_batch in zip(imgs_objs_individual, imgs_objs_batch):
+        assert len(img_objs_batch) == len(img_objs_individual), (
+            "Batch and individual extraction results should have the same number of detected faces"
+        )
+        for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):
+            for key in img_obj_individual["facial_area"]:
+                if key == "left_eye" or key == "right_eye":
+                    continue
+                assert abs(
+                    img_obj_individual["facial_area"][key] - 
+                    img_obj_batch["facial_area"][key]
+                ) <= 0.03 * img_obj_individual["facial_area"][key]
             assert abs(
-                img_obj_individual["facial_area"][key] - 
-                img_obj_batch["facial_area"][key]
-            ) <= 0.03 * img_obj_individual["facial_area"][key]
-        assert abs(
-            img_obj_individual["confidence"] - 
-            img_obj_batch["confidence"]
-        ) <= 0.03 * img_obj_individual["confidence"]
+                img_obj_individual["confidence"] - 
+                img_obj_batch["confidence"]
+            ) <= 0.03 * img_obj_individual["confidence"]
     
 
 def test_backends_for_enforced_detection_with_non_facial_inputs():

From 1c825e88034a78438e66b74a7792ec84d94ca034 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:18:33 +0000
Subject: [PATCH 19/41] add more models and detector-specific rtol

---
 tests/test_extract_faces.py | 33 +++++++++++++++++++++++++--------
 1 file changed, 25 insertions(+), 8 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 50a268b7..3ac1dcba 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -81,9 +81,18 @@ def test_different_detectors():
 
 @pytest.mark.parametrize("detector_backend", [
     "opencv",
-    "ssd"
+    "ssd",
+    "mtcnn",
+    "retinaface",
 ])
 def test_batch_extract_faces(detector_backend):
+    detector_backend_to_rtol = {
+        "opencv": 0.1,
+        "ssd": 0.01,
+        "mtcnn": 0.2,
+        "retinaface": 0.01,
+    }
+    rtol = detector_backend_to_rtol[detector_backend]
     img_paths = [
         "dataset/img2.jpg",
         "dataset/img3.jpg",
@@ -123,16 +132,24 @@ def test_batch_extract_faces(detector_backend):
         )
         for img_obj_individual, img_obj_batch in zip(img_objs_individual, img_objs_batch):
             for key in img_obj_individual["facial_area"]:
-                if key == "left_eye" or key == "right_eye":
-                    continue
-                assert abs(
-                    img_obj_individual["facial_area"][key] - 
-                    img_obj_batch["facial_area"][key]
-                ) <= 0.03 * img_obj_individual["facial_area"][key]
+                if isinstance(img_obj_individual["facial_area"][key], tuple):
+                    for ind_val, batch_val in zip(
+                        img_obj_individual["facial_area"][key], 
+                        img_obj_batch["facial_area"][key]
+                    ):
+                        assert abs(ind_val - batch_val) <= rtol * ind_val
+                elif (
+                    isinstance(img_obj_individual["facial_area"][key], int) or 
+                    isinstance(img_obj_individual["facial_area"][key], float)
+                ):
+                    assert abs(
+                        img_obj_individual["facial_area"][key] - 
+                        img_obj_batch["facial_area"][key]
+                    ) <= rtol * img_obj_individual["facial_area"][key]
             assert abs(
                 img_obj_individual["confidence"] - 
                 img_obj_batch["confidence"]
-            ) <= 0.03 * img_obj_individual["confidence"]
+            ) <= rtol * img_obj_individual["confidence"]
     
 
 def test_backends_for_enforced_detection_with_non_facial_inputs():

From 1d358aa15a3ce6d3fd3be5cd1121cfb66b7cfadc Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:44:59 +0000
Subject: [PATCH 20/41] pseudo-batching dlib

---
 deepface/models/face_detection/Dlib.py | 21 +++++++++++++++++++--
 1 file changed, 19 insertions(+), 2 deletions(-)

diff --git a/deepface/models/face_detection/Dlib.py b/deepface/models/face_detection/Dlib.py
index 26bce84c..2ff9c864 100644
--- a/deepface/models/face_detection/Dlib.py
+++ b/deepface/models/face_detection/Dlib.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List
+from typing import List, Union
 
 # 3rd party dependencies
 import numpy as np
@@ -47,10 +47,27 @@ def build_model(self) -> dict:
         detector["sp"] = sp
         return detector
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with dlib
 
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+        """
+        if isinstance(img, np.ndarray):
+            return self._detect_faces_in_single_image(img)
+        elif isinstance(img, list):
+            return [self._detect_faces_in_single_image(single_img) for single_img in img]
+        else:
+            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+
+    def _detect_faces_in_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
         Args:
             img (np.ndarray): pre-loaded image as numpy array
 

From f5188c802c0fbd5640043bd1d1e90957fc374948 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:47:06 +0000
Subject: [PATCH 21/41] pseudo-batching centerface

---
 deepface/models/face_detection/CenterFace.py | 25 ++++++++++++++++----
 1 file changed, 21 insertions(+), 4 deletions(-)

diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index b8fdf6b3..7e7d72ea 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import List
+from typing import List, Union
 
 # 3rd party dependencies
 import numpy as np
@@ -34,12 +34,29 @@ def build_model(self):
 
         return CenterFace(weight_path=weights_path)
 
-    def detect_faces(self, img: np.ndarray) -> List["FacialAreaRegion"]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with CenterFace
 
         Args:
-            img (np.ndarray): pre-loaded image as numpy array
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+        """
+        if isinstance(img, np.ndarray):
+            return self._process_single_image(img)
+        elif isinstance(img, list):
+            return [self._process_single_image(single_img) for single_img in img]
+        else:
+            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+
+    def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
+        Args:
+            single_img (np.ndarray): pre-loaded image as numpy array
 
         Returns:
             results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
@@ -53,7 +70,7 @@ def detect_faces(self, img: np.ndarray) -> List["FacialAreaRegion"]:
         #     img, img.shape[0], img.shape[1], threshold=threshold
         # )
         detections, landmarks = self.build_model().forward(
-            img, img.shape[0], img.shape[1], threshold=threshold
+            single_img, single_img.shape[0], single_img.shape[1], threshold=threshold
         )
 
         for i, detection in enumerate(detections):

From 26e537d2a56ec601a5baca29ae62b6f85ff810d9 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:48:01 +0000
Subject: [PATCH 22/41] psedu-batching fastmtcnn

---
 deepface/models/face_detection/FastMtCnn.py | 19 ++++++++++++++++++-
 1 file changed, 18 insertions(+), 1 deletion(-)

diff --git a/deepface/models/face_detection/FastMtCnn.py b/deepface/models/face_detection/FastMtCnn.py
index 52590366..8315b6d5 100644
--- a/deepface/models/face_detection/FastMtCnn.py
+++ b/deepface/models/face_detection/FastMtCnn.py
@@ -17,10 +17,27 @@ class FastMtCnnClient(Detector):
     def __init__(self):
         self.model = self.build_model()
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with mtcnn
 
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+        """
+        if isinstance(img, np.ndarray):
+            return self._process_single_image(img)
+        elif isinstance(img, list):
+            return [self._process_single_image(single_img) for single_img in img]
+        else:
+            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
         Args:
             img (np.ndarray): pre-loaded image as numpy array
 

From 7f04e6b2987a18ee134c5821b88595587f2a08fc Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:49:25 +0000
Subject: [PATCH 23/41] mediapipe pseudo bathcing

---
 deepface/models/face_detection/MediaPipe.py | 21 +++++++++++++++++++--
 1 file changed, 19 insertions(+), 2 deletions(-)

diff --git a/deepface/models/face_detection/MediaPipe.py b/deepface/models/face_detection/MediaPipe.py
index 48bc2f8d..86311bcb 100644
--- a/deepface/models/face_detection/MediaPipe.py
+++ b/deepface/models/face_detection/MediaPipe.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List
+from typing import Any, List, Union
 
 # 3rd party dependencies
 import numpy as np
@@ -43,10 +43,27 @@ def build_model(self) -> Any:
         )
         return face_detection
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with mediapipe
 
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+        """
+        if isinstance(img, np.ndarray):
+            return self._process_single_image(img)
+        elif isinstance(img, list):
+            return [self._process_single_image(single_img) for single_img in img]
+        else:
+            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
         Args:
             img (np.ndarray): pre-loaded image as numpy array
 

From 991566ffb11f24bf8daa555623299e9dc6e778d0 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 09:51:40 +0000
Subject: [PATCH 24/41] yunet pseudobatching

---
 deepface/models/face_detection/YuNet.py | 21 +++++++++++++++++++--
 1 file changed, 19 insertions(+), 2 deletions(-)

diff --git a/deepface/models/face_detection/YuNet.py b/deepface/models/face_detection/YuNet.py
index 90759275..e3d310f9 100644
--- a/deepface/models/face_detection/YuNet.py
+++ b/deepface/models/face_detection/YuNet.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List
+from typing import Any, List, Union
 
 # 3rd party dependencies
 import cv2
@@ -57,10 +57,27 @@ def build_model(self) -> Any:
             ) from err
         return face_detector
 
-    def detect_faces(self, img: np.ndarray) -> List[FacialAreaRegion]:
+    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with yunet
 
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+        """
+        if isinstance(img, np.ndarray):
+            return self._process_single_image(img)
+        elif isinstance(img, list):
+            return [self._process_single_image(single_img) for single_img in img]
+        else:
+            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
         Args:
             img (np.ndarray): pre-loaded image as numpy array
 

From 70b61a7f4fd7b9a8c0d17702462b096a2841f96c Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:03:27 +0000
Subject: [PATCH 25/41] change interface in a special case

---
 deepface/models/face_detection/CenterFace.py | 12 ++++++------
 deepface/models/face_detection/Dlib.py       | 16 ++++++++--------
 deepface/models/face_detection/FastMtCnn.py  | 12 ++++++------
 deepface/models/face_detection/MediaPipe.py  | 12 ++++++------
 deepface/models/face_detection/YuNet.py      | 12 ++++++------
 5 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index 7e7d72ea..03faa973 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -44,12 +44,12 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            return self._process_single_image(img)
-        elif isinstance(img, list):
-            return [self._process_single_image(single_img) for single_img in img]
-        else:
-            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+        if not isinstance(img, list):
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if len(results) == 1:
+            return results[0]
+        return results
 
     def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion]:
         """
diff --git a/deepface/models/face_detection/Dlib.py b/deepface/models/face_detection/Dlib.py
index 2ff9c864..7500fff6 100644
--- a/deepface/models/face_detection/Dlib.py
+++ b/deepface/models/face_detection/Dlib.py
@@ -57,14 +57,14 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            return self._detect_faces_in_single_image(img)
-        elif isinstance(img, list):
-            return [self._detect_faces_in_single_image(single_img) for single_img in img]
-        else:
-            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
-
-    def _detect_faces_in_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
+        if not isinstance(img, list):
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if len(results) == 1:
+            return results[0]
+        return results
+
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
 
diff --git a/deepface/models/face_detection/FastMtCnn.py b/deepface/models/face_detection/FastMtCnn.py
index 8315b6d5..22282200 100644
--- a/deepface/models/face_detection/FastMtCnn.py
+++ b/deepface/models/face_detection/FastMtCnn.py
@@ -27,12 +27,12 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            return self._process_single_image(img)
-        elif isinstance(img, list):
-            return [self._process_single_image(single_img) for single_img in img]
-        else:
-            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+        if not isinstance(img, list):
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if len(results) == 1:
+            return results[0]
+        return results
 
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
diff --git a/deepface/models/face_detection/MediaPipe.py b/deepface/models/face_detection/MediaPipe.py
index 86311bcb..9e20c8dc 100644
--- a/deepface/models/face_detection/MediaPipe.py
+++ b/deepface/models/face_detection/MediaPipe.py
@@ -53,12 +53,12 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            return self._process_single_image(img)
-        elif isinstance(img, list):
-            return [self._process_single_image(single_img) for single_img in img]
-        else:
-            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+        if not isinstance(img, list):
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if len(results) == 1:
+            return results[0]
+        return results
 
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
diff --git a/deepface/models/face_detection/YuNet.py b/deepface/models/face_detection/YuNet.py
index e3d310f9..4086f17e 100644
--- a/deepface/models/face_detection/YuNet.py
+++ b/deepface/models/face_detection/YuNet.py
@@ -67,12 +67,12 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            return self._process_single_image(img)
-        elif isinstance(img, list):
-            return [self._process_single_image(single_img) for single_img in img]
-        else:
-            raise ValueError("Input must be a numpy array or a list of numpy arrays.")
+        if not isinstance(img, list):
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if len(results) == 1:
+            return results[0]
+        return results
 
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """

From 27dea80248be128942420bd860c6f964ad91e38c Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:13:03 +0000
Subject: [PATCH 26/41] batch test add other detector models

---
 tests/test_extract_faces.py | 11 ++++++++---
 1 file changed, 8 insertions(+), 3 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 3ac1dcba..11c37fa6 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -84,15 +84,20 @@ def test_different_detectors():
     "ssd",
     "mtcnn",
     "retinaface",
+    "yunet",
+    "centerface",
+    # optional
+    # "yolov11s",
+    # "mediapipe",
+    # "dlib",
 ])
 def test_batch_extract_faces(detector_backend):
     detector_backend_to_rtol = {
         "opencv": 0.1,
-        "ssd": 0.01,
         "mtcnn": 0.2,
-        "retinaface": 0.01,
+        "yolov11s": 0.03,
     }
-    rtol = detector_backend_to_rtol[detector_backend]
+    rtol = detector_backend_to_rtol.get(detector_backend, 0.01)
     img_paths = [
         "dataset/img2.jpg",
         "dataset/img3.jpg",

From 526ab1baf7f4e74a75cd06ecfb1a0ccaf63b67fb Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:26:52 +0000
Subject: [PATCH 27/41] test numpy array batched input

---
 tests/test_extract_faces.py | 50 +++++++++++++++++++++++++++++++++++++
 1 file changed, 50 insertions(+)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 11c37fa6..7ed228c2 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -157,6 +157,56 @@ def test_batch_extract_faces(detector_backend):
             ) <= rtol * img_obj_individual["confidence"]
     
 
+@pytest.mark.parametrize("detector_backend", [
+    "opencv",
+    "ssd",
+    "mtcnn",
+    "retinaface",
+    "yunet",
+    "centerface",
+    # optional
+    # "yolov11s",
+    # "mediapipe",
+    # "dlib",
+])
+def test_batch_extract_faces_with_nparray(detector_backend):
+    img_paths = [
+        "dataset/img2.jpg",
+        "dataset/img3.jpg",
+        "dataset/img11.jpg",
+        "dataset/couple.jpg"
+    ]
+    imgs = [
+        cv2.resize(image_utils.load_image(img_path)[0], (1920, 1080))
+        for img_path in img_paths
+    ]
+
+    # load images as numpy arrays
+    imgs_batch = np.stack(imgs, axis=0)
+
+    # extract faces in batch of numpy arrays
+    imgs_objs_batch = DeepFace.extract_faces(
+        img_path=imgs_batch,
+        detector_backend=detector_backend,
+        align=True,
+        enforce_detection=False,
+    )
+
+    # extract faces in batch of paths
+    imgs_objs_batch_paths = DeepFace.extract_faces(
+        img_path=imgs,
+        detector_backend=detector_backend,
+        align=True,
+        enforce_detection=False,
+    )
+
+    # compare results
+    for img_objs_batch, img_objs_batch_paths in zip(imgs_objs_batch, imgs_objs_batch_paths):
+        assert len(img_objs_batch) == len(img_objs_batch_paths), (
+            "Batch and individual extraction results should have the same number of detected faces"
+        )
+
+
 def test_backends_for_enforced_detection_with_non_facial_inputs():
     black_img = np.zeros([224, 224, 3])
     for detector in detectors:

From 988afa6a70f894d2ad455ec48049d9900370d4e0 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:27:23 +0000
Subject: [PATCH 28/41] fix batched numpy array input

---
 deepface/modules/detection.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index e3b679d0..2b14a7c8 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -82,6 +82,8 @@ def extract_faces(
             just available in the result only if anti_spoofing is set to True in input arguments.
     """
 
+    if isinstance(img_path, np.ndarray) and img_path.ndim == 4:
+        img_path = [img_path[i] for i in range(img_path.shape[0])]
     if not isinstance(img_path, list):
         img_path = [img_path]
 

From 3e34675aab33ed4878e9129a08625404266eaa61 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:31:48 +0000
Subject: [PATCH 29/41] lint

---
 deepface/models/face_detection/CenterFace.py | 11 ++++++++---
 deepface/models/face_detection/Dlib.py       | 11 ++++++++---
 deepface/models/face_detection/FastMtCnn.py  | 11 ++++++++---
 deepface/models/face_detection/MediaPipe.py  | 11 ++++++++---
 4 files changed, 32 insertions(+), 12 deletions(-)

diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index 03faa973..66fc6cc2 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -34,15 +34,20 @@ def build_model(self):
 
         return CenterFace(weight_path=weights_path)
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self, 
+        img: Union[np.ndarray, List[np.ndarray]],
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with CenterFace
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
         if not isinstance(img, list):
             img = [img]
diff --git a/deepface/models/face_detection/Dlib.py b/deepface/models/face_detection/Dlib.py
index 7500fff6..208b0442 100644
--- a/deepface/models/face_detection/Dlib.py
+++ b/deepface/models/face_detection/Dlib.py
@@ -47,15 +47,20 @@ def build_model(self) -> dict:
         detector["sp"] = sp
         return detector
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]],
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with dlib
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
         if not isinstance(img, list):
             img = [img]
diff --git a/deepface/models/face_detection/FastMtCnn.py b/deepface/models/face_detection/FastMtCnn.py
index 22282200..ea2431e5 100644
--- a/deepface/models/face_detection/FastMtCnn.py
+++ b/deepface/models/face_detection/FastMtCnn.py
@@ -17,15 +17,20 @@ class FastMtCnnClient(Detector):
     def __init__(self):
         self.model = self.build_model()
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]],
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with mtcnn
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
         if not isinstance(img, list):
             img = [img]
diff --git a/deepface/models/face_detection/MediaPipe.py b/deepface/models/face_detection/MediaPipe.py
index 9e20c8dc..4716e7c5 100644
--- a/deepface/models/face_detection/MediaPipe.py
+++ b/deepface/models/face_detection/MediaPipe.py
@@ -43,15 +43,20 @@ def build_model(self) -> Any:
         )
         return face_detection
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]],
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """
         Detect and align face with mediapipe
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            pre-loaded image as numpy array or a list of those
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
         """
         if not isinstance(img, list):
             img = [img]

From 2eb5cac37b9429d79ed08e245b6efe62f1281c6c Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:40:57 +0000
Subject: [PATCH 30/41] batch extract faces on single image special case

---
 tests/test_extract_faces.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 7ed228c2..2d3fc78f 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -207,6 +207,16 @@ def test_batch_extract_faces_with_nparray(detector_backend):
         )
 
 
+def test_batch_extract_faces_single_image():
+    img_path = "dataset/couple.jpg"
+    imgs_objs_batch = DeepFace.extract_faces(
+        img_path=[img_path],
+        align=True,
+    )
+    assert len(imgs_objs_batch) == 2
+    assert [isinstance(obj, dict) for obj in imgs_objs_batch]
+
+
 def test_backends_for_enforced_detection_with_non_facial_inputs():
     black_img = np.zeros([224, 224, 3])
     for detector in detectors:

From c30f55c3804b5c219194d3fcb23e81da7e32d991 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Tue, 18 Feb 2025 10:55:02 +0000
Subject: [PATCH 31/41] lint

---
 deepface/models/face_detection/CenterFace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index 66fc6cc2..a947900b 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -35,7 +35,7 @@ def build_model(self):
         return CenterFace(weight_path=weights_path)
 
     def detect_faces(
-        self, 
+        self,
         img: Union[np.ndarray, List[np.ndarray]],
     ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
         """

From dc6cb81ec535177b79fc02c680fef13526c1d3ce Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Fri, 21 Feb 2025 17:34:10 +0000
Subject: [PATCH 32/41] batch test assert shape

---
 tests/test_extract_faces.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 2d3fc78f..68939f3b 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -180,6 +180,7 @@ def test_batch_extract_faces_with_nparray(detector_backend):
         cv2.resize(image_utils.load_image(img_path)[0], (1920, 1080))
         for img_path in img_paths
     ]
+    expected_num_faces = [1, 1, 1, 2]
 
     # load images as numpy arrays
     imgs_batch = np.stack(imgs, axis=0)
@@ -191,6 +192,9 @@ def test_batch_extract_faces_with_nparray(detector_backend):
         align=True,
         enforce_detection=False,
     )
+    assert len(imgs_objs_batch) == 4
+    for img_objs_batch, expected_num_faces in zip(imgs_objs_batch, expected_num_faces):
+        assert len(img_objs_batch) == expected_num_faces
 
     # extract faces in batch of paths
     imgs_objs_batch_paths = DeepFace.extract_faces(

From 6143ed9bb4a9773a32cbe7c7d8d740ec3a9c7a9f Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Fri, 21 Feb 2025 17:35:25 +0000
Subject: [PATCH 33/41] clearify test batch extract

---
 tests/test_extract_faces.py | 16 +++++++---------
 1 file changed, 7 insertions(+), 9 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 68939f3b..c61f1b54 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -104,6 +104,7 @@ def test_batch_extract_faces(detector_backend):
         "dataset/img11.jpg",
         "dataset/couple.jpg"
     ]
+    expected_num_faces = [1, 1, 1, 2]
     
     # Extract faces one by one
     imgs_objs_individual = [
@@ -121,15 +122,12 @@ def test_batch_extract_faces(detector_backend):
         align=True,
     )
     
-    assert (
-        len(imgs_objs_batch) == 4 and 
-        all(isinstance(obj, list) for obj in imgs_objs_batch)
-    )
-    assert all(
-        len(imgs_objs_batch[i]) == 1 
-        for i in range(len(imgs_objs_batch[:-1]))
-    )
-    assert len(imgs_objs_batch[-1]) == 2
+    # Check that the batch extraction returned the expected number of face lists
+    assert len(imgs_objs_batch) == len(img_paths)
+    
+    # Check that each face list has the expected number of faces
+    for i, expected_faces in enumerate(expected_num_faces):
+        assert len(imgs_objs_batch[i]) == expected_faces
 
     for img_objs_individual, img_objs_batch in zip(imgs_objs_individual, imgs_objs_batch):
         assert len(img_objs_batch) == len(img_objs_individual), (

From c46d886a673d3d5d01935a3a069af514f58de820 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Fri, 21 Feb 2025 17:40:28 +0000
Subject: [PATCH 34/41] more shape checks

---
 tests/test_extract_faces.py | 26 ++++++++++++++++++++++++++
 1 file changed, 26 insertions(+)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index c61f1b54..3b8d3de1 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -23,6 +23,10 @@ def test_different_detectors():
 
     for detector in detectors:
         img_objs = DeepFace.extract_faces(img_path=img_path, detector_backend=detector)
+
+        # Check return type for non-batch input
+        assert isinstance(img_objs, list) and all(isinstance(obj, dict) for obj in img_objs)
+
         for img_obj in img_objs:
             assert "face" in img_obj.keys()
             assert "facial_area" in img_obj.keys()
@@ -114,6 +118,15 @@ def test_batch_extract_faces(detector_backend):
             align=True,
         ) for img_path in img_paths
     ]
+
+    # Check that individual extraction returns a list of faces
+    for img_objs_individual in imgs_objs_individual:
+        assert isinstance(img_objs_individual, list)
+        assert all(isinstance(face, dict) for face in img_objs_individual)
+
+    # Check that the individual extraction results match the expected number of faces
+    for img_objs_individual, expected_faces in zip(imgs_objs_individual, expected_num_faces):
+        assert len(img_objs_individual) == expected_faces
     
     # Extract faces in batch
     imgs_objs_batch = DeepFace.extract_faces(
@@ -129,6 +142,7 @@ def test_batch_extract_faces(detector_backend):
     for i, expected_faces in enumerate(expected_num_faces):
         assert len(imgs_objs_batch[i]) == expected_faces
 
+    # Check that the individual extraction results match the batch extraction results
     for img_objs_individual, img_objs_batch in zip(imgs_objs_individual, imgs_objs_batch):
         assert len(img_objs_batch) == len(img_objs_individual), (
             "Batch and individual extraction results should have the same number of detected faces"
@@ -190,6 +204,18 @@ def test_batch_extract_faces_with_nparray(detector_backend):
         align=True,
         enforce_detection=False,
     )
+
+    # Check return type for batch input
+    assert (
+        isinstance(imgs_objs_batch, list) and 
+        all(
+            isinstance(obj, list) and 
+            all(isinstance(face, dict) for face in obj) 
+            for obj in imgs_objs_batch
+        )
+    )
+
+    # Check that the batch extraction returned the expected number of face lists
     assert len(imgs_objs_batch) == 4
     for img_objs_batch, expected_num_faces in zip(imgs_objs_batch, expected_num_faces):
         assert len(img_objs_batch) == expected_num_faces

From add4c7394472a6495b27dc30bbf74d223954b758 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Fri, 21 Feb 2025 17:49:34 +0000
Subject: [PATCH 35/41] disable mtcnn batching by default due to unexpected
 behaviour

---
 deepface/models/face_detection/MtCnn.py | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index be3a51fa..8c420757 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -82,8 +82,21 @@ def detect_faces(
 
     def _supports_batch_detection(self) -> bool:
         import mtcnn
+        import os
+        supports_batch_detection = os.getenv(
+            "ENABLE_MTCNN_BATCH_DETECTION", "false"
+        ).lower() == "true"
+        if not supports_batch_detection:
+            logger.warning(
+                "Batch detection is disabled for mtcnn by default "
+                "since the results are not consistent with single image detection. "
+                "You can force enable it by setting the environment variable "
+                "ENABLE_MTCNN_BATCH_DETECTION to true."
+            )
+            return False
         try:
             mtcnn_version = mtcnn.__version__
+            supports_batch_detection = mtcnn_version >= "1.0.0"
         except AttributeError:
             try:
                 import mtcnn.metadata

From 93b8af100b09bb5111ce1407996cb38bc283cdde Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 23 Feb 2025 12:17:12 +0000
Subject: [PATCH 36/41] comments

---
 tests/test_extract_faces.py | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 3b8d3de1..18ef34fc 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -96,12 +96,8 @@ def test_different_detectors():
     # "dlib",
 ])
 def test_batch_extract_faces(detector_backend):
-    detector_backend_to_rtol = {
-        "opencv": 0.1,
-        "mtcnn": 0.2,
-        "yolov11s": 0.03,
-    }
-    rtol = detector_backend_to_rtol.get(detector_backend, 0.01)
+    # Relative tolerance for comparing floating-point values
+    rtol = 0.03
     img_paths = [
         "dataset/img2.jpg",
         "dataset/img3.jpg",
@@ -154,15 +150,20 @@ def test_batch_extract_faces(detector_backend):
                         img_obj_individual["facial_area"][key], 
                         img_obj_batch["facial_area"][key]
                     ):
+                        # Ensure the difference between individual and batch values 
+                        # is within rtol% of the individual value
                         assert abs(ind_val - batch_val) <= rtol * ind_val
                 elif (
                     isinstance(img_obj_individual["facial_area"][key], int) or 
                     isinstance(img_obj_individual["facial_area"][key], float)
                 ):
+                    # Ensure the difference between individual and batch values 
+                    # is within rtol% of the individual value
                     assert abs(
                         img_obj_individual["facial_area"][key] - 
                         img_obj_batch["facial_area"][key]
                     ) <= rtol * img_obj_individual["facial_area"][key]
+            # Ensure the confidence difference is within rtol% of the individual confidence
             assert abs(
                 img_obj_individual["confidence"] - 
                 img_obj_batch["confidence"]
@@ -175,7 +176,7 @@ def test_batch_extract_faces(detector_backend):
     "mtcnn",
     "retinaface",
     "yunet",
-    "centerface",
+    # "centerface",
     # optional
     # "yolov11s",
     # "mediapipe",
@@ -217,8 +218,8 @@ def test_batch_extract_faces_with_nparray(detector_backend):
 
     # Check that the batch extraction returned the expected number of face lists
     assert len(imgs_objs_batch) == 4
-    for img_objs_batch, expected_num_faces in zip(imgs_objs_batch, expected_num_faces):
-        assert len(img_objs_batch) == expected_num_faces
+    for img_objs_batch, img_expected_num_faces in zip(imgs_objs_batch, expected_num_faces):
+        assert len(img_objs_batch) == img_expected_num_faces
 
     # extract faces in batch of paths
     imgs_objs_batch_paths = DeepFace.extract_faces(

From 8b1b465d220677113e1d5f9f275ddb218226d739 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 23 Feb 2025 13:27:18 +0000
Subject: [PATCH 37/41] change behaviour in special case batched single image

---
 deepface/models/face_detection/CenterFace.py |   5 +-
 deepface/models/face_detection/Dlib.py       |   5 +-
 deepface/models/face_detection/FastMtCnn.py  |   5 +-
 deepface/models/face_detection/MediaPipe.py  |   5 +-
 deepface/models/face_detection/MtCnn.py      |   5 +-
 deepface/models/face_detection/OpenCv.py     |  20 ++-
 deepface/models/face_detection/RetinaFace.py |   7 +-
 deepface/models/face_detection/Ssd.py        | 162 ++++++++++---------
 deepface/models/face_detection/YuNet.py      |   5 +-
 deepface/modules/detection.py                |  48 +++---
 tests/test_extract_faces.py                  |   4 +-
 11 files changed, 159 insertions(+), 112 deletions(-)

diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index a947900b..523f2bfd 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -49,10 +49,11 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
         results = [self._process_single_image(single_img) for single_img in img]
-        if len(results) == 1:
+        if not is_batched_input:
             return results[0]
         return results
 
diff --git a/deepface/models/face_detection/Dlib.py b/deepface/models/face_detection/Dlib.py
index 208b0442..254a32be 100644
--- a/deepface/models/face_detection/Dlib.py
+++ b/deepface/models/face_detection/Dlib.py
@@ -62,10 +62,11 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
         results = [self._process_single_image(single_img) for single_img in img]
-        if len(results) == 1:
+        if not is_batched_input:
             return results[0]
         return results
 
diff --git a/deepface/models/face_detection/FastMtCnn.py b/deepface/models/face_detection/FastMtCnn.py
index ea2431e5..7d5ccf58 100644
--- a/deepface/models/face_detection/FastMtCnn.py
+++ b/deepface/models/face_detection/FastMtCnn.py
@@ -32,10 +32,11 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
         results = [self._process_single_image(single_img) for single_img in img]
-        if len(results) == 1:
+        if not is_batched_input:
             return results[0]
         return results
 
diff --git a/deepface/models/face_detection/MediaPipe.py b/deepface/models/face_detection/MediaPipe.py
index 4716e7c5..9fcdbbc7 100644
--- a/deepface/models/face_detection/MediaPipe.py
+++ b/deepface/models/face_detection/MediaPipe.py
@@ -58,10 +58,11 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
         results = [self._process_single_image(single_img) for single_img in img]
-        if len(results) == 1:
+        if not is_batched_input:
             return results[0]
         return results
 
diff --git a/deepface/models/face_detection/MtCnn.py b/deepface/models/face_detection/MtCnn.py
index 8c420757..23826700 100644
--- a/deepface/models/face_detection/MtCnn.py
+++ b/deepface/models/face_detection/MtCnn.py
@@ -38,7 +38,8 @@ def detect_faces(
                 or a list of lists of FacialAreaRegion objects for each image
         """
 
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
 
         resp = []
@@ -76,7 +77,7 @@ def detect_faces(
 
             resp.append(image_resp)
 
-        if len(resp) == 1:
+        if not is_batched_input:
             return resp[0]
         return resp
 
diff --git a/deepface/models/face_detection/OpenCv.py b/deepface/models/face_detection/OpenCv.py
index f97f6586..a6d39c93 100644
--- a/deepface/models/face_detection/OpenCv.py
+++ b/deepface/models/face_detection/OpenCv.py
@@ -1,6 +1,7 @@
 # built-in dependencies
 import os
 from typing import Any, List, Union
+import logging
 
 # 3rd party dependencies
 import cv2
@@ -9,6 +10,7 @@
 #project dependencies
 from deepface.models.Detector import Detector, FacialAreaRegion
 
+logger = logging.getLogger(__name__)
 
 class OpenCvClient(Detector):
     """
@@ -17,6 +19,7 @@ class OpenCvClient(Detector):
 
     def __init__(self):
         self.model = self.build_model()
+        self.supports_batch_detection = self._supports_batch_detection()
 
     def build_model(self):
         """
@@ -28,6 +31,19 @@ def build_model(self):
         detector["face_detector"] = self.__build_cascade("haarcascade")
         detector["eye_detector"] = self.__build_cascade("haarcascade_eye")
         return detector
+    
+    def _supports_batch_detection(self) -> bool:
+        supports_batch_detection = os.getenv(
+            "ENABLE_OPENCV_BATCH_DETECTION", "false"
+        ).lower() == "true"
+        if not supports_batch_detection:
+            logger.warning(
+                "Batch detection is disabled for opencv by default "
+                "since the results are not consistent with single image detection. "
+                "You can force enable it by setting the environment variable "
+                "ENABLE_OPENCV_BATCH_DETECTION to true."
+            )
+        return supports_batch_detection
 
     def detect_faces(
         self,
@@ -46,8 +62,10 @@ def detect_faces(
         """
         if isinstance(img, np.ndarray):
             imgs = [img]
-        else:
+        elif self.supports_batch_detection:
             imgs = img
+        else:
+            return [self.detect_faces(single_img) for single_img in img]
 
         batch_results = []
 
diff --git a/deepface/models/face_detection/RetinaFace.py b/deepface/models/face_detection/RetinaFace.py
index b0d1c949..2722e011 100644
--- a/deepface/models/face_detection/RetinaFace.py
+++ b/deepface/models/face_detection/RetinaFace.py
@@ -28,7 +28,8 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             imgs = [img]
         else:
             imgs = img
@@ -81,4 +82,6 @@ def detect_faces(
 
             batch_results.append(resp)
 
-        return batch_results if len(batch_results) > 1 else batch_results[0]
+        if not is_batched_input:
+            return batch_results[0]
+        return batch_results
diff --git a/deepface/models/face_detection/Ssd.py b/deepface/models/face_detection/Ssd.py
index c0ae2cbf..a620f96c 100644
--- a/deepface/models/face_detection/Ssd.py
+++ b/deepface/models/face_detection/Ssd.py
@@ -69,81 +69,89 @@ def detect_faces(
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
             A list or a list of lists of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            imgs = [img]
-        else:
-            imgs = img
-
-        batch_results = []
-
-        for single_img in imgs:
-            # Because cv2.dnn.blobFromImage expects CV_8U (8-bit unsigned integer) values
-            if single_img.dtype != np.uint8:
-                single_img = single_img.astype(np.uint8)
-
-            opencv_module: OpenCv.OpenCvClient = self.model["opencv_module"]
-
-            target_size = (300, 300)
-            original_size = single_img.shape
-            current_img = cv2.resize(single_img, target_size)
-
-            aspect_ratio_x = original_size[1] / target_size[1]
-            aspect_ratio_y = original_size[0] / target_size[0]
-
-            imageBlob = cv2.dnn.blobFromImage(image=current_img)
-
-            face_detector = self.model["face_detector"]
-            face_detector.setInput(imageBlob)
-            detections = face_detector.forward()
-
-            class ssd_labels(IntEnum):
-                img_id = 0
-                is_face = 1
-                confidence = 2
-                left = 3
-                top = 4
-                right = 5
-                bottom = 6
-
-            faces = detections[0][0]
-            faces = faces[
-                (faces[:, ssd_labels.is_face] == 1) & (faces[:, ssd_labels.confidence] >= 0.90)
-            ]
-            margins = [ssd_labels.left, ssd_labels.top, ssd_labels.right, ssd_labels.bottom]
-            faces[:, margins] = np.int32(faces[:, margins] * 300)
-            faces[:, margins] = np.int32(
-                faces[:, margins] * [aspect_ratio_x, aspect_ratio_y, aspect_ratio_x, aspect_ratio_y]
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if not is_batched_input:
+            return results[0]
+        return results
+
+    def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion]:
+        """
+        Helper function to detect faces in a single image.
+
+        Args:
+            single_img (np.ndarray): Pre-loaded image as numpy array
+
+        Returns:
+            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
+        """
+        # Because cv2.dnn.blobFromImage expects CV_8U (8-bit unsigned integer) values
+        if single_img.dtype != np.uint8:
+            single_img = single_img.astype(np.uint8)
+
+        opencv_module: OpenCv.OpenCvClient = self.model["opencv_module"]
+
+        target_size = (300, 300)
+        original_size = single_img.shape
+        current_img = cv2.resize(single_img, target_size)
+
+        aspect_ratio_x = original_size[1] / target_size[1]
+        aspect_ratio_y = original_size[0] / target_size[0]
+
+        imageBlob = cv2.dnn.blobFromImage(image=current_img)
+
+        face_detector = self.model["face_detector"]
+        face_detector.setInput(imageBlob)
+        detections = face_detector.forward()
+
+        class ssd_labels(IntEnum):
+            img_id = 0
+            is_face = 1
+            confidence = 2
+            left = 3
+            top = 4
+            right = 5
+            bottom = 6
+
+        faces = detections[0][0]
+        faces = faces[
+            (faces[:, ssd_labels.is_face] == 1) & (faces[:, ssd_labels.confidence] >= 0.90)
+        ]
+        margins = [ssd_labels.left, ssd_labels.top, ssd_labels.right, ssd_labels.bottom]
+        faces[:, margins] = np.int32(faces[:, margins] * 300)
+        faces[:, margins] = np.int32(
+            faces[:, margins] * [aspect_ratio_x, aspect_ratio_y, aspect_ratio_x, aspect_ratio_y]
+        )
+        faces[:, [ssd_labels.right, ssd_labels.bottom]] -= faces[
+            :, [ssd_labels.left, ssd_labels.top]
+        ]
+
+        resp = []
+        for face in faces:
+            confidence = float(face[ssd_labels.confidence])
+            x, y, w, h = map(int, face[margins])
+            detected_face = single_img[y : y + h, x : x + w]
+
+            left_eye, right_eye = opencv_module.find_eyes(detected_face)
+
+            # eyes found in the detected face instead image itself
+            # detected face's coordinates should be added
+            if left_eye is not None:
+                left_eye = x + int(left_eye[0]), y + int(left_eye[1])
+            if right_eye is not None:
+                right_eye = x + int(right_eye[0]), y + int(right_eye[1])
+
+            facial_area = FacialAreaRegion(
+                x=x,
+                y=y,
+                w=w,
+                h=h,
+                left_eye=left_eye,
+                right_eye=right_eye,
+                confidence=confidence,
             )
-            faces[:, [ssd_labels.right, ssd_labels.bottom]] -= faces[
-                :, [ssd_labels.left, ssd_labels.top]
-            ]
-
-            resp = []
-            for face in faces:
-                confidence = float(face[ssd_labels.confidence])
-                x, y, w, h = map(int, face[margins])
-                detected_face = single_img[y : y + h, x : x + w]
-
-                left_eye, right_eye = opencv_module.find_eyes(detected_face)
-
-                # eyes found in the detected face instead image itself
-                # detected face's coordinates should be added
-                if left_eye is not None:
-                    left_eye = x + int(left_eye[0]), y + int(left_eye[1])
-                if right_eye is not None:
-                    right_eye = x + int(right_eye[0]), y + int(right_eye[1])
-
-                facial_area = FacialAreaRegion(
-                    x=x,
-                    y=y,
-                    w=w,
-                    h=h,
-                    left_eye=left_eye,
-                    right_eye=right_eye,
-                    confidence=confidence,
-                )
-                resp.append(facial_area)
-
-            batch_results.append(resp)
-
-        return batch_results if len(batch_results) > 1 else batch_results[0]
+            resp.append(facial_area)
+
+        return resp
diff --git a/deepface/models/face_detection/YuNet.py b/deepface/models/face_detection/YuNet.py
index 4086f17e..93e65a8d 100644
--- a/deepface/models/face_detection/YuNet.py
+++ b/deepface/models/face_detection/YuNet.py
@@ -67,10 +67,11 @@ def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[F
         Returns:
             results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
         results = [self._process_single_image(single_img) for single_img in img]
-        if len(results) == 1:
+        if not is_batched_input:
             return results[0]
         return results
 
diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 2b14a7c8..9977ea3e 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -82,15 +82,23 @@ def extract_faces(
             just available in the result only if anti_spoofing is set to True in input arguments.
     """
 
-    if isinstance(img_path, np.ndarray) and img_path.ndim == 4:
-        img_path = [img_path[i] for i in range(img_path.shape[0])]
-    if not isinstance(img_path, list):
-        img_path = [img_path]
+    batched_input = (
+        (
+            isinstance(img_path, np.ndarray) and 
+            img_path.ndim == 4
+        ) or isinstance(img_path, list)
+    )
+    if not batched_input:
+        imgs_path = [img_path]
+    elif isinstance(img_path, np.ndarray):
+        imgs_path = [img_path[i] for i in range(img_path.shape[0])]
+    else:
+        imgs_path = img_path
 
     all_images = []
     img_names = []
 
-    for single_img_path in img_path:
+    for single_img_path in imgs_path:
         # img might be path, base64 or numpy array. Convert it to numpy whatever it is.
         img, img_name = image_utils.load_image(single_img_path)
 
@@ -109,9 +117,6 @@ def extract_faces(
         max_faces=max_faces,
     )
 
-    if len(all_images) == 1:
-        all_face_objs = [all_face_objs]
-
     all_resp_objs = []
 
     for img, img_name, face_objs in zip(all_images, img_names, all_face_objs):
@@ -203,7 +208,7 @@ def extract_faces(
 
         all_resp_objs.append(img_resp_objs)
 
-    if len(all_resp_objs) == 1:
+    if not batched_input:
         return all_resp_objs[0]
     return all_resp_objs
 
@@ -239,8 +244,18 @@ def detect_faces(
 
         - confidence (float): The confidence score associated with the detected face.
     """
-    if not isinstance(img, list):
-        img = [img]
+    batched_input = (
+        (
+            isinstance(img, np.ndarray) and 
+            img.ndim == 4
+        ) or isinstance(img, list)
+    )
+    if not batched_input:
+        imgs = [img]
+    elif isinstance(img, np.ndarray):
+        imgs = [img[i] for i in range(img.shape[0])]
+    else:
+        imgs = img
 
     if detector_backend == "skip":
         all_face_objs = [
@@ -253,9 +268,9 @@ def detect_faces(
                     confidence=0,
                 )
             ]
-            for single_img in img
+            for single_img in imgs
         ]
-        if len(img) == 1:
+        if not batched_input:
             all_face_objs = all_face_objs[0]
         return all_face_objs
 
@@ -266,7 +281,7 @@ def detect_faces(
     preprocessed_images = []
     width_borders = []
     height_borders = []
-    for single_img in img:
+    for single_img in imgs:
         height, width, _ = single_img.shape
 
         # validate expand percentage score
@@ -299,9 +314,6 @@ def detect_faces(
     # Detect faces in all preprocessed images
     all_facial_areas = face_detector.detect_faces(preprocessed_images)
 
-    if len(preprocessed_images) == 1:
-        all_facial_areas = [all_facial_areas]
-
     all_detected_faces = []
     for (
         single_img,
@@ -336,7 +348,7 @@ def detect_faces(
 
         all_detected_faces.append(detected_faces)
 
-    if len(all_detected_faces) == 1:
+    if not batched_input:
         return all_detected_faces[0]
     return all_detected_faces
 
diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 18ef34fc..2814c548 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -242,8 +242,8 @@ def test_batch_extract_faces_single_image():
         img_path=[img_path],
         align=True,
     )
-    assert len(imgs_objs_batch) == 2
-    assert [isinstance(obj, dict) for obj in imgs_objs_batch]
+    assert len(imgs_objs_batch) == 1 and isinstance(imgs_objs_batch[0], list)
+    assert [isinstance(obj, dict) for obj in imgs_objs_batch[0]]
 
 
 def test_backends_for_enforced_detection_with_non_facial_inputs():

From aae3af0d05c59f23060b995824e3e40f004b2b6a Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 23 Feb 2025 13:33:17 +0000
Subject: [PATCH 38/41] rm opencv from batch test since it still occasionally
 fails

---
 deepface/models/face_detection/OpenCv.py | 2 +-
 deepface/modules/detection.py            | 4 ++--
 tests/test_extract_faces.py              | 2 +-
 3 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/deepface/models/face_detection/OpenCv.py b/deepface/models/face_detection/OpenCv.py
index a6d39c93..c86f2da5 100644
--- a/deepface/models/face_detection/OpenCv.py
+++ b/deepface/models/face_detection/OpenCv.py
@@ -31,7 +31,7 @@ def build_model(self):
         detector["face_detector"] = self.__build_cascade("haarcascade")
         detector["eye_detector"] = self.__build_cascade("haarcascade_eye")
         return detector
-    
+
     def _supports_batch_detection(self) -> bool:
         supports_batch_detection = os.getenv(
             "ENABLE_OPENCV_BATCH_DETECTION", "false"
diff --git a/deepface/modules/detection.py b/deepface/modules/detection.py
index 9977ea3e..202d2ac7 100644
--- a/deepface/modules/detection.py
+++ b/deepface/modules/detection.py
@@ -84,7 +84,7 @@ def extract_faces(
 
     batched_input = (
         (
-            isinstance(img_path, np.ndarray) and 
+            isinstance(img_path, np.ndarray) and
             img_path.ndim == 4
         ) or isinstance(img_path, list)
     )
@@ -246,7 +246,7 @@ def detect_faces(
     """
     batched_input = (
         (
-            isinstance(img, np.ndarray) and 
+            isinstance(img, np.ndarray) and
             img.ndim == 4
         ) or isinstance(img, list)
     )
diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 2814c548..3d36397b 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -84,7 +84,7 @@ def test_different_detectors():
 
 
 @pytest.mark.parametrize("detector_backend", [
-    "opencv",
+    # "opencv",
     "ssd",
     "mtcnn",
     "retinaface",

From 8c7c2cb9b7505bd17beed69e3bbf16a8b4c8940d Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 23 Feb 2025 14:07:37 +0000
Subject: [PATCH 39/41] refactor detectors to have default detect_faces method
 that is based on process_single_image method

---
 deepface/models/Detector.py                  | 85 ++++++++++++-------
 deepface/models/face_detection/CenterFace.py | 31 +------
 deepface/models/face_detection/Dlib.py       | 25 +-----
 deepface/models/face_detection/FastMtCnn.py  | 23 -----
 deepface/models/face_detection/MediaPipe.py  | 25 +-----
 deepface/models/face_detection/OpenCv.py     | 89 ++++++++------------
 deepface/models/face_detection/Ssd.py        | 39 ++-------
 deepface/models/face_detection/Yolo.py       |  5 +-
 deepface/models/face_detection/YuNet.py      | 20 +----
 9 files changed, 109 insertions(+), 233 deletions(-)

diff --git a/deepface/models/Detector.py b/deepface/models/Detector.py
index 6db5e7be..e369c9d8 100644
--- a/deepface/models/Detector.py
+++ b/deepface/models/Detector.py
@@ -1,37 +1,8 @@
 from typing import List, Tuple, Optional, Union
-from abc import ABC, abstractmethod
+from abc import ABC
 from dataclasses import dataclass
 import numpy as np
 
-# Notice that all facial detector models must be inherited from this class
-
-
-# pylint: disable=unnecessary-pass, too-few-public-methods, too-many-instance-attributes
-class Detector(ABC):
-    @abstractmethod
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]]
-    ) -> Union[List["FacialAreaRegion"], List[List["FacialAreaRegion"]]]:
-        """
-        Interface for detect and align faces in a batch of images
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            Pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
-            A list or a list of lists of FacialAreaRegion objects
-                where each object contains:
-
-            - facial_area (FacialAreaRegion): The facial area region represented
-                as x, y, w, h, left_eye and right_eye. left eye and right eye are
-                eyes on the left and right respectively with respect to the person
-                instead of observer.
-        """
-        pass
-
 
 @dataclass
 class FacialAreaRegion:
@@ -77,3 +48,57 @@ class DetectedFace:
     img: np.ndarray
     facial_area: FacialAreaRegion
     confidence: float
+
+
+# Notice that all facial detector models must be inherited from this class
+
+# pylint: disable=unnecessary-pass, too-few-public-methods, too-many-instance-attributes
+class Detector(ABC):
+
+    def detect_faces(
+        self,
+        img: Union[np.ndarray, List[np.ndarray]],
+    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+        """
+        Detect and align faces in an image or a list of images
+
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
+            A list or a list of lists of FacialAreaRegion objects
+        """
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
+            img = [img]
+        results = [self._process_single_image(single_img) for single_img in img]
+        if not is_batched_input:
+            return results[0]
+        return results
+
+    def _process_single_image(
+        self,
+        img: np.ndarray
+    ) -> List[FacialAreaRegion]:
+        """
+        Interface for detect and align faces in a single image
+
+        Args:
+            img (Union[np.ndarray, List[np.ndarray]]): 
+            Pre-loaded image as numpy array or a list of those
+
+        Returns:
+            results (Union[List[List[FacialAreaRegion]], List[FacialAreaRegion]]): 
+            A list or a list of lists of FacialAreaRegion objects
+                where each object contains:
+
+            - facial_area (FacialAreaRegion): The facial area region represented
+                as x, y, w, h, left_eye and right_eye. left eye and right eye are
+                eyes on the left and right respectively with respect to the person
+                instead of observer.
+        """
+        raise NotImplementedError(
+            "Subclasses that do not implement batch detection must implement this method"
+        )
diff --git a/deepface/models/face_detection/CenterFace.py b/deepface/models/face_detection/CenterFace.py
index 523f2bfd..e5ef2be6 100644
--- a/deepface/models/face_detection/CenterFace.py
+++ b/deepface/models/face_detection/CenterFace.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import List, Union
+from typing import List
 
 # 3rd party dependencies
 import numpy as np
@@ -34,35 +34,12 @@ def build_model(self):
 
         return CenterFace(weight_path=weights_path)
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]],
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align face with CenterFace
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
-    def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion]:
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
 
         Args:
-            single_img (np.ndarray): pre-loaded image as numpy array
+            img (np.ndarray): pre-loaded image as numpy array
 
         Returns:
             results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
@@ -76,7 +53,7 @@ def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion
         #     img, img.shape[0], img.shape[1], threshold=threshold
         # )
         detections, landmarks = self.build_model().forward(
-            single_img, single_img.shape[0], single_img.shape[1], threshold=threshold
+            img, img.shape[0], img.shape[1], threshold=threshold
         )
 
         for i, detection in enumerate(detections):
diff --git a/deepface/models/face_detection/Dlib.py b/deepface/models/face_detection/Dlib.py
index 254a32be..e8afce25 100644
--- a/deepface/models/face_detection/Dlib.py
+++ b/deepface/models/face_detection/Dlib.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List, Union
+from typing import List
 
 # 3rd party dependencies
 import numpy as np
@@ -47,29 +47,6 @@ def build_model(self) -> dict:
         detector["sp"] = sp
         return detector
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]],
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align face with dlib
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
diff --git a/deepface/models/face_detection/FastMtCnn.py b/deepface/models/face_detection/FastMtCnn.py
index 7d5ccf58..2499dc76 100644
--- a/deepface/models/face_detection/FastMtCnn.py
+++ b/deepface/models/face_detection/FastMtCnn.py
@@ -17,29 +17,6 @@ class FastMtCnnClient(Detector):
     def __init__(self):
         self.model = self.build_model()
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]],
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align face with mtcnn
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
diff --git a/deepface/models/face_detection/MediaPipe.py b/deepface/models/face_detection/MediaPipe.py
index 9fcdbbc7..61bb0b5e 100644
--- a/deepface/models/face_detection/MediaPipe.py
+++ b/deepface/models/face_detection/MediaPipe.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List, Union
+from typing import Any, List
 
 # 3rd party dependencies
 import numpy as np
@@ -43,29 +43,6 @@ def build_model(self) -> Any:
         )
         return face_detection
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]],
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align face with mediapipe
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
diff --git a/deepface/models/face_detection/OpenCv.py b/deepface/models/face_detection/OpenCv.py
index c86f2da5..801ff114 100644
--- a/deepface/models/face_detection/OpenCv.py
+++ b/deepface/models/face_detection/OpenCv.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List, Union
+from typing import Any, List
 import logging
 
 # 3rd party dependencies
@@ -45,65 +45,48 @@ def _supports_batch_detection(self) -> bool:
             )
         return supports_batch_detection
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]]
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
-        Detect and align face with opencv
+        Helper function to detect faces in a single image.
 
         Args:
-            img (Union[np.ndarray, List[np.ndarray]]):
-            Pre-loaded image as numpy array or a list of those
+            img (np.ndarray): pre-loaded image as numpy array
 
         Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
+            results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
         """
-        if isinstance(img, np.ndarray):
-            imgs = [img]
-        elif self.supports_batch_detection:
-            imgs = img
-        else:
-            return [self.detect_faces(single_img) for single_img in img]
-
-        batch_results = []
-
-        for single_img in imgs:
-            resp = []
-            detected_face = None
-            faces = []
-            try:
-                faces, _, scores = self.model["face_detector"].detectMultiScale3(
-                    single_img, 1.1, 10, outputRejectLevels=True
+        resp = []
+        detected_face = None
+        faces = []
+        try:
+            faces, _, scores = self.model["face_detector"].detectMultiScale3(
+                img, 1.1, 10, outputRejectLevels=True
+            )
+        except:
+            pass
+
+        if len(faces) > 0:
+            for (x, y, w, h), confidence in zip(faces, scores):
+                detected_face = img[int(y):int(y + h), int(x):int(x + w)]
+                left_eye, right_eye = self.find_eyes(img=detected_face)
+
+                if left_eye is not None:
+                    left_eye = (int(x + left_eye[0]), int(y + left_eye[1]))
+                if right_eye is not None:
+                    right_eye = (int(x + right_eye[0]), int(y + right_eye[1]))
+
+                facial_area = FacialAreaRegion(
+                    x=x,
+                    y=y,
+                    w=w,
+                    h=h,
+                    left_eye=left_eye,
+                    right_eye=right_eye,
+                    confidence=(100 - confidence) / 100,
                 )
-            except:
-                pass
-
-            if len(faces) > 0:
-                for (x, y, w, h), confidence in zip(faces, scores):
-                    detected_face = single_img[int(y):int(y + h), int(x):int(x + w)]
-                    left_eye, right_eye = self.find_eyes(img=detected_face)
-
-                    if left_eye is not None:
-                        left_eye = (int(x + left_eye[0]), int(y + left_eye[1]))
-                    if right_eye is not None:
-                        right_eye = (int(x + right_eye[0]), int(y + right_eye[1]))
-
-                    facial_area = FacialAreaRegion(
-                        x=x,
-                        y=y,
-                        w=w,
-                        h=h,
-                        left_eye=left_eye,
-                        right_eye=right_eye,
-                        confidence=(100 - confidence) / 100,
-                    )
-                    resp.append(facial_area)
-
-            batch_results.append(resp)
-
-        return batch_results if len(batch_results) > 1 else batch_results[0]
+                resp.append(facial_area)
+
+        return resp
 
     def find_eyes(self, img: np.ndarray) -> tuple:
         """
diff --git a/deepface/models/face_detection/Ssd.py b/deepface/models/face_detection/Ssd.py
index a620f96c..381d664f 100644
--- a/deepface/models/face_detection/Ssd.py
+++ b/deepface/models/face_detection/Ssd.py
@@ -1,5 +1,5 @@
 # built-in dependencies
-from typing import List, Union
+from typing import List
 from enum import IntEnum
 
 # 3rd party dependencies
@@ -54,48 +54,25 @@ def build_model(self) -> dict:
 
         return {"face_detector": face_detector, "opencv_module": OpenCv.OpenCvClient()}
 
-    def detect_faces(
-        self,
-        img: Union[np.ndarray, List[np.ndarray]]
-    ) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align faces with ssd in a batch of images
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): 
-            Pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): 
-            A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
-    def _process_single_image(self, single_img: np.ndarray) -> List[FacialAreaRegion]:
+    def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.
 
         Args:
-            single_img (np.ndarray): Pre-loaded image as numpy array
+            img (np.ndarray): Pre-loaded image as numpy array
 
         Returns:
             results (List[FacialAreaRegion]): A list of FacialAreaRegion objects
         """
         # Because cv2.dnn.blobFromImage expects CV_8U (8-bit unsigned integer) values
-        if single_img.dtype != np.uint8:
-            single_img = single_img.astype(np.uint8)
+        if img.dtype != np.uint8:
+            img = img.astype(np.uint8)
 
         opencv_module: OpenCv.OpenCvClient = self.model["opencv_module"]
 
         target_size = (300, 300)
-        original_size = single_img.shape
-        current_img = cv2.resize(single_img, target_size)
+        original_size = img.shape
+        current_img = cv2.resize(img, target_size)
 
         aspect_ratio_x = original_size[1] / target_size[1]
         aspect_ratio_y = original_size[0] / target_size[0]
@@ -132,7 +109,7 @@ class ssd_labels(IntEnum):
         for face in faces:
             confidence = float(face[ssd_labels.confidence])
             x, y, w, h = map(int, face[margins])
-            detected_face = single_img[y : y + h, x : x + w]
+            detected_face = img[y : y + h, x : x + w]
 
             left_eye, right_eye = opencv_module.find_eyes(detected_face)
 
diff --git a/deepface/models/face_detection/Yolo.py b/deepface/models/face_detection/Yolo.py
index cbb88799..300bc457 100644
--- a/deepface/models/face_detection/Yolo.py
+++ b/deepface/models/face_detection/Yolo.py
@@ -78,7 +78,8 @@ def detect_faces(
             A list of lists of FacialAreaRegion objects 
             for each image or a list of FacialAreaRegion objects
         """
-        if not isinstance(img, list):
+        is_batched_input = isinstance(img, list)
+        if not is_batched_input:
             img = [img]
 
         all_results = []
@@ -142,7 +143,7 @@ def detect_faces(
 
             all_results.append(resp)
 
-        if len(all_results) == 1:
+        if not is_batched_input:
             return all_results[0]
         return all_results
 
diff --git a/deepface/models/face_detection/YuNet.py b/deepface/models/face_detection/YuNet.py
index 93e65a8d..4b4b9392 100644
--- a/deepface/models/face_detection/YuNet.py
+++ b/deepface/models/face_detection/YuNet.py
@@ -1,6 +1,6 @@
 # built-in dependencies
 import os
-from typing import Any, List, Union
+from typing import Any, List
 
 # 3rd party dependencies
 import cv2
@@ -57,24 +57,6 @@ def build_model(self) -> Any:
             ) from err
         return face_detector
 
-    def detect_faces(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]:
-        """
-        Detect and align face with yunet
-
-        Args:
-            img (Union[np.ndarray, List[np.ndarray]]): pre-loaded image as numpy array or a list of those
-
-        Returns:
-            results (Union[List[FacialAreaRegion], List[List[FacialAreaRegion]]]): A list or a list of lists of FacialAreaRegion objects
-        """
-        is_batched_input = isinstance(img, list)
-        if not is_batched_input:
-            img = [img]
-        results = [self._process_single_image(single_img) for single_img in img]
-        if not is_batched_input:
-            return results[0]
-        return results
-
     def _process_single_image(self, img: np.ndarray) -> List[FacialAreaRegion]:
         """
         Helper function to detect faces in a single image.

From c5ba4a73963176231999d4ef3f5e26d6a50356ba Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Sun, 23 Feb 2025 14:29:31 +0000
Subject: [PATCH 40/41] lint

---
 deepface/models/Detector.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deepface/models/Detector.py b/deepface/models/Detector.py
index e369c9d8..2fe93fc2 100644
--- a/deepface/models/Detector.py
+++ b/deepface/models/Detector.py
@@ -4,6 +4,7 @@
 import numpy as np
 
 
+# pylint: disable=unnecessary-pass, too-few-public-methods, too-many-instance-attributes
 @dataclass
 class FacialAreaRegion:
     """
@@ -52,7 +53,6 @@ class DetectedFace:
 
 # Notice that all facial detector models must be inherited from this class
 
-# pylint: disable=unnecessary-pass, too-few-public-methods, too-many-instance-attributes
 class Detector(ABC):
 
     def detect_faces(

From 6a3d14cde75903b39ecd5504947314f57f57e312 Mon Sep 17 00:00:00 2001
From: galthran-wq <levmorozov900@gmail.com>
Date: Mon, 24 Feb 2025 14:41:48 +0300
Subject: [PATCH 41/41] Update test_extract_faces.py

---
 tests/test_extract_faces.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/test_extract_faces.py b/tests/test_extract_faces.py
index 3d36397b..1ecaafa9 100644
--- a/tests/test_extract_faces.py
+++ b/tests/test_extract_faces.py
@@ -217,7 +217,7 @@ def test_batch_extract_faces_with_nparray(detector_backend):
     )
 
     # Check that the batch extraction returned the expected number of face lists
-    assert len(imgs_objs_batch) == 4
+    assert len(imgs_objs_batch) == len(img_paths)
     for img_objs_batch, img_expected_num_faces in zip(imgs_objs_batch, expected_num_faces):
         assert len(img_objs_batch) == img_expected_num_faces