Mirror of https://github.com/serengil/deepface.git (synced 2025-06-07 03:55:21 +00:00)

Commit 95c55c0401 (parent 9fbb229b97): moving logics under modules

- all extract_faces logic moved to detection module
- load image related logics moved to preprocessing module
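In practice, call sites change as shown throughout the diff below: the old deepface.commons.functions.extract_faces helper returned (face, region, confidence) tuples, while the relocated deepface.modules.detection.extract_faces returns a list of dictionaries. A minimal before/after sketch ("img.jpg" is a placeholder path):

# old call sites (deepface.commons.functions)
# img_objs = functions.extract_faces(img="img.jpg", target_size=(224, 224))
# for face, region, confidence in img_objs:
#     ...

# new call sites (deepface.modules.detection)
from deepface.modules import detection

img_objs = detection.extract_faces(img_path="img.jpg", target_size=(224, 224))
for img_obj in img_objs:
    face = img_obj["face"]            # 4D BGR tensor unless human_readable=True
    region = img_obj["facial_area"]   # {"x": ..., "y": ..., "w": ..., "h": ...}
    confidence = img_obj["confidence"]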
@@ -449,6 +449,7 @@ def extract_faces(
        enforce_detection=enforce_detection,
        align=align,
        grayscale=grayscale,
        human_readable=True,
    )
@@ -1,42 +1,19 @@
import os
from typing import Union, Tuple, List
import base64
from pathlib import Path

# 3rd party dependencies
from PIL import Image
import requests
import numpy as np
import cv2
import tensorflow as tf

# package dependencies
from deepface.detectors import DetectorWrapper
from deepface.models.Detector import DetectedFace, FacialAreaRegion
from deepface.commons.logger import Logger

logger = Logger(module="commons.functions")

# pylint: disable=no-else-raise

# --------------------------------------------------
# configurations of dependencies


def get_tf_major_version() -> int:
    return int(tf.__version__.split(".", maxsplit=1)[0])


tf_major_version = get_tf_major_version()

if tf_major_version == 1:
    from keras.preprocessing import image
elif tf_major_version == 2:
    from tensorflow.keras.preprocessing import image

# --------------------------------------------------


def initialize_folder() -> None:
    """Initialize the folder for storing weights and models.
@@ -65,266 +42,6 @@ def get_deepface_home() -> str:
    return str(os.getenv("DEEPFACE_HOME", default=str(Path.home())))


# --------------------------------------------------


def loadBase64Img(uri: str) -> np.ndarray:
    """Load image from base64 string.

    Args:
        uri: a base64 string.

    Returns:
        numpy array: the loaded image.
    """
    encoded_data = uri.split(",")[1]
    nparr = np.fromstring(base64.b64decode(encoded_data), np.uint8)
    img_bgr = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
    # img_rgb = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)
    return img_bgr


def load_image(img: Union[str, np.ndarray]) -> Tuple[np.ndarray, str]:
    """
    Load image from path, url, base64 or numpy array.
    Args:
        img: a path, url, base64 or numpy array.
    Returns:
        image (numpy array): the loaded image in BGR format
        image name (str): image name itself
    """

    # The image is already a numpy array
    if isinstance(img, np.ndarray):
        return img, "numpy array"

    if isinstance(img, Path):
        img = str(img)

    if not isinstance(img, str):
        raise ValueError(f"img must be numpy array or str but it is {type(img)}")

    # The image is a base64 string
    if img.startswith("data:image/"):
        return loadBase64Img(img), "base64 encoded string"

    # The image is a url
    if img.startswith("http"):
        return (
            np.array(Image.open(requests.get(img, stream=True, timeout=60).raw).convert("BGR")),
            # return url as image name
            img,
        )

    # The image is a path
    if os.path.isfile(img) is not True:
        raise ValueError(f"Confirm that {img} exists")

    # image must be a file on the system then

    # image name must have english characters
    if img.isascii() is False:
        raise ValueError(f"Input image must not have non-english characters - {img}")

    img_obj_bgr = cv2.imread(img)
    # img_obj_rgb = cv2.cvtColor(img_obj_bgr, cv2.COLOR_BGR2RGB)
    return img_obj_bgr, img


# --------------------------------------------------
def extract_faces(
    img: Union[str, np.ndarray],
    target_size: tuple = (224, 224),
    detector_backend: str = "opencv",
    grayscale: bool = False,
    enforce_detection: bool = True,
    align: bool = True,
) -> List[Tuple[np.ndarray, dict, float]]:
    """
    Extract faces from an image.
    Args:
        img: a path, url, base64 or numpy array.
        target_size (tuple, optional): the target size of the extracted faces.
            Defaults to (224, 224).
        detector_backend (str, optional): the face detector backend. Defaults to "opencv".
        grayscale (bool, optional): whether to convert the extracted faces to grayscale.
            Defaults to False.
        enforce_detection (bool, optional): whether to enforce face detection. Defaults to True.
        align (bool, optional): whether to align the extracted faces. Defaults to True.

    Raises:
        ValueError: if face could not be detected and enforce_detection is True.

    Returns:
        results (List[Tuple[np.ndarray, dict, float]]): A list of tuples
            where each tuple contains:
            - detected_face (np.ndarray): The detected face as a NumPy array.
            - face_region (dict): The image region represented as
                {"x": x, "y": y, "w": w, "h": h}
            - confidence (float): The confidence score associated with the detected face.
    """

    # this is going to store a list of img itself (numpy), it region and confidence
    extracted_faces = []

    # img might be path, base64 or numpy array. Convert it to numpy whatever it is.
    img, img_name = load_image(img)

    base_region = FacialAreaRegion(x=0, y=0, w=img.shape[1], h=img.shape[0])

    if detector_backend == "skip":
        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
    else:
        face_objs = DetectorWrapper.detect_faces(detector_backend, img, align)

    # in case of no face found
    if len(face_objs) == 0 and enforce_detection is True:
        if img_name is not None:
            raise ValueError(
                f"Face could not be detected in {img_name}."
                "Please confirm that the picture is a face photo "
                "or consider to set enforce_detection param to False."
            )
        else:
            raise ValueError(
                "Face could not be detected. Please confirm that the picture is a face photo "
                "or consider to set enforce_detection param to False."
            )

    if len(face_objs) == 0 and enforce_detection is False:
        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]

    for face_obj in face_objs:
        current_img = face_obj.img
        current_region = face_obj.facial_area
        confidence = face_obj.confidence
        if current_img.shape[0] > 0 and current_img.shape[1] > 0:
            if grayscale is True:
                current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)

            # resize and padding
            factor_0 = target_size[0] / current_img.shape[0]
            factor_1 = target_size[1] / current_img.shape[1]
            factor = min(factor_0, factor_1)

            dsize = (
                int(current_img.shape[1] * factor),
                int(current_img.shape[0] * factor),
            )
            current_img = cv2.resize(current_img, dsize)

            diff_0 = target_size[0] - current_img.shape[0]
            diff_1 = target_size[1] - current_img.shape[1]
            if grayscale is False:
                # Put the base image in the middle of the padded image
                current_img = np.pad(
                    current_img,
                    (
                        (diff_0 // 2, diff_0 - diff_0 // 2),
                        (diff_1 // 2, diff_1 - diff_1 // 2),
                        (0, 0),
                    ),
                    "constant",
                )
            else:
                current_img = np.pad(
                    current_img,
                    (
                        (diff_0 // 2, diff_0 - diff_0 // 2),
                        (diff_1 // 2, diff_1 - diff_1 // 2),
                    ),
                    "constant",
                )

            # double check: if target image is not still the same size with target.
            if current_img.shape[0:2] != target_size:
                current_img = cv2.resize(current_img, target_size)

            # normalizing the image pixels
            # what this line doing? must?
            img_pixels = image.img_to_array(current_img)
            img_pixels = np.expand_dims(img_pixels, axis=0)
            img_pixels /= 255  # normalize input in [0, 1]

            # int cast is for the exception - object of type 'float32' is not JSON serializable
            region_obj = {
                "x": current_region.x,
                "y": current_region.y,
                "w": current_region.w,
                "h": current_region.h,
            }

            extracted_face = (img_pixels, region_obj, confidence)
            extracted_faces.append(extracted_face)

    if len(extracted_faces) == 0 and enforce_detection == True:
        raise ValueError(
            f"Detected face shape is {img.shape}. Consider to set enforce_detection arg to False."
        )

    return extracted_faces
def normalize_input(img: np.ndarray, normalization: str = "base") -> np.ndarray:
    """Normalize input image.

    Args:
        img (numpy array): the input image.
        normalization (str, optional): the normalization technique. Defaults to "base",
        for no normalization.

    Returns:
        numpy array: the normalized image.
    """

    # issue 131 declares that some normalization techniques improves the accuracy

    if normalization == "base":
        return img

    # @trevorgribble and @davedgd contributed this feature
    # restore input in scale of [0, 255] because it was normalized in scale of
    # [0, 1] in preprocess_face
    img *= 255

    if normalization == "raw":
        pass  # return just restored pixels

    elif normalization == "Facenet":
        mean, std = img.mean(), img.std()
        img = (img - mean) / std

    elif normalization == "Facenet2018":
        # simply / 127.5 - 1 (similar to facenet 2018 model preprocessing step as @iamrishab posted)
        img /= 127.5
        img -= 1

    elif normalization == "VGGFace":
        # mean subtraction based on VGGFace1 training data
        img[..., 0] -= 93.5940
        img[..., 1] -= 104.7624
        img[..., 2] -= 129.1863

    elif normalization == "VGGFace2":
        # mean subtraction based on VGGFace2 training data
        img[..., 0] -= 91.4953
        img[..., 1] -= 103.8827
        img[..., 2] -= 131.0912

    elif normalization == "ArcFace":
        # Reference study: The faces are cropped and resized to 112×112,
        # and each pixel (ranged between [0, 255]) in RGB images is normalised
        # by subtracting 127.5 then divided by 128.
        img -= 127.5
        img /= 128
    else:
        raise ValueError(f"unimplemented normalization type - {normalization}")

    return img


def find_target_size(model_name: str) -> tuple:
    """Find the target size of the model.
@@ -6,8 +6,7 @@ import numpy as np
from tqdm import tqdm

# project dependencies
from deepface.modules import modeling
from deepface.commons import functions
from deepface.modules import modeling, detection
from deepface.extendedmodels import Gender, Race, Emotion
@@ -114,8 +113,8 @@ def analyze(
    # ---------------------------------
    resp_objects = []

    img_objs = functions.extract_faces(
        img=img_path,
    img_objs = detection.extract_faces(
        img_path=img_path,
        target_size=(224, 224),
        detector_backend=detector_backend,
        grayscale=False,
@@ -123,7 +122,10 @@ def analyze(
        align=align,
    )

    for img_content, img_region, img_confidence in img_objs:
    for img_obj in img_objs:
        img_content = img_obj["face"]
        img_region = img_obj["facial_area"]
        img_confidence = img_obj["confidence"]
        if img_content.shape[0] > 0 and img_content.shape[1] > 0:
            obj = {}
            # facial attribute analysis
@@ -3,10 +3,26 @@ from typing import Any, Dict, List, Tuple, Union

# 3rd part dependencies
import numpy as np
import cv2
from PIL import Image

# project dependencies
from deepface.modules import preprocessing
from deepface.models.Detector import DetectedFace, FacialAreaRegion
from deepface.detectors import DetectorWrapper
from deepface.commons import functions
from deepface.commons.logger import Logger

logger = Logger(module="deepface/modules/detection.py")

# pylint: disable=no-else-raise


tf_major_version = functions.get_tf_major_version()
if tf_major_version == 1:
    from keras.preprocessing import image
elif tf_major_version == 2:
    from tensorflow.keras.preprocessing import image


def extract_faces(
@@ -16,6 +32,7 @@ def extract_faces(
    enforce_detection: bool = True,
    align: bool = True,
    grayscale: bool = False,
    human_readable=False,
) -> List[Dict[str, Any]]:
    """
    Extract faces from a given image
@@ -38,6 +55,8 @@ def extract_faces(
        grayscale (boolean): Flag to convert the image to grayscale before
            processing (default is False).

        human_readable (bool): Flag to make the image human readable. 3D RGB for human readable
            or 4D BGR for ML models (default is False).

    Returns:
        results (List[Dict[str, Any]]): A list of dictionaries, where each dictionary contains:
@@ -48,27 +67,108 @@ def extract_faces(

    resp_objs = []

    img_objs = functions.extract_faces(
        img=img_path,
        target_size=target_size,
        detector_backend=detector_backend,
        grayscale=grayscale,
        enforce_detection=enforce_detection,
        align=align,
    # img might be path, base64 or numpy array. Convert it to numpy whatever it is.
    img, img_name = preprocessing.load_image(img_path)

    base_region = FacialAreaRegion(x=0, y=0, w=img.shape[1], h=img.shape[0])

    if detector_backend == "skip":
        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]
    else:
        face_objs = DetectorWrapper.detect_faces(detector_backend, img, align)

    # in case of no face found
    if len(face_objs) == 0 and enforce_detection is True:
        if img_name is not None:
            raise ValueError(
                f"Face could not be detected in {img_name}."
                "Please confirm that the picture is a face photo "
                "or consider to set enforce_detection param to False."
            )
        else:
            raise ValueError(
                "Face could not be detected. Please confirm that the picture is a face photo "
                "or consider to set enforce_detection param to False."
            )

    for img, region, confidence in img_objs:
        resp_obj = {}
    if len(face_objs) == 0 and enforce_detection is False:
        face_objs = [DetectedFace(img=img, facial_area=base_region, confidence=0)]

    for face_obj in face_objs:
        current_img = face_obj.img
        current_region = face_obj.facial_area
        confidence = face_obj.confidence

        if current_img.shape[0] == 0 or current_img.shape[1] == 0:
            continue

        if grayscale is True:
            current_img = cv2.cvtColor(current_img, cv2.COLOR_BGR2GRAY)

        # resize and padding
        factor_0 = target_size[0] / current_img.shape[0]
        factor_1 = target_size[1] / current_img.shape[1]
        factor = min(factor_0, factor_1)

        dsize = (
            int(current_img.shape[1] * factor),
            int(current_img.shape[0] * factor),
        )
        current_img = cv2.resize(current_img, dsize)

        diff_0 = target_size[0] - current_img.shape[0]
        diff_1 = target_size[1] - current_img.shape[1]
        if grayscale is False:
            # Put the base image in the middle of the padded image
            current_img = np.pad(
                current_img,
                (
                    (diff_0 // 2, diff_0 - diff_0 // 2),
                    (diff_1 // 2, diff_1 - diff_1 // 2),
                    (0, 0),
                ),
                "constant",
            )
        else:
            current_img = np.pad(
                current_img,
                (
                    (diff_0 // 2, diff_0 - diff_0 // 2),
                    (diff_1 // 2, diff_1 - diff_1 // 2),
                ),
                "constant",
            )

        # double check: if target image is not still the same size with target.
        if current_img.shape[0:2] != target_size:
            current_img = cv2.resize(current_img, target_size)

        # normalizing the image pixels
        # what this line doing? must?
        img_pixels = image.img_to_array(current_img)
        img_pixels = np.expand_dims(img_pixels, axis=0)
        img_pixels /= 255  # normalize input in [0, 1]
        # discard expanded dimension
        if len(img.shape) == 4:
            img = img[0]
        if human_readable is True and len(img_pixels.shape) == 4:
            img_pixels = img_pixels[0]

        # bgr to rgb
        resp_obj["face"] = img[:, :, ::-1]
        resp_obj["facial_area"] = region
        resp_obj["confidence"] = confidence
        resp_objs.append(resp_obj)
        resp_objs.append(
            {
                "face": img_pixels[:, :, ::-1] if human_readable is True else img_pixels,
                "facial_area": {
                    "x": current_region.x,
                    "y": current_region.y,
                    "w": current_region.w,
                    "h": current_region.h,
                },
                "confidence": confidence,
            }
        )

    if len(resp_objs) == 0 and enforce_detection == True:
        raise ValueError(
            f"Detected face shape is {img.shape}. Consider to set enforce_detection arg to False."
        )

    return resp_objs
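The resize-and-pad step above preserves the aspect ratio and then centers the face inside the target canvas. A minimal numeric sketch of the same arithmetic, with made-up dimensions:

# a 300x500 (rows x cols) face crop with target_size=(224, 224)
target_size = (224, 224)
h, w = 300, 500
factor = min(target_size[0] / h, target_size[1] / w)  # min(0.746..., 0.448) -> 0.448
dsize = (int(w * factor), int(h * factor))             # (224, 134); cv2.resize expects (w, h)
diff_0 = target_size[0] - int(h * factor)              # 90 rows of padding
diff_1 = target_size[1] - int(w * factor)              # 0 columns of padding
padding = ((diff_0 // 2, diff_0 - diff_0 // 2), (diff_1 // 2, diff_1 - diff_1 // 2), (0, 0))
# -> ((45, 45), (0, 0), (0, 0)): the resized face is centered inside the 224x224 canvas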
deepface/modules/preprocessing.py (new file, 131 lines)
@@ -0,0 +1,131 @@
import os
from typing import Union, Tuple
import base64
from pathlib import Path

# 3rd party
import numpy as np
import cv2
from PIL import Image
import requests


def load_image(img: Union[str, np.ndarray]) -> Tuple[np.ndarray, str]:
    """
    Load image from path, url, base64 or numpy array.
    Args:
        img: a path, url, base64 or numpy array.
    Returns:
        image (numpy array): the loaded image in BGR format
        image name (str): image name itself
    """

    # The image is already a numpy array
    if isinstance(img, np.ndarray):
        return img, "numpy array"

    if isinstance(img, Path):
        img = str(img)

    if not isinstance(img, str):
        raise ValueError(f"img must be numpy array or str but it is {type(img)}")

    # The image is a base64 string
    if img.startswith("data:image/"):
        return load_base64(img), "base64 encoded string"

    # The image is a url
    if img.startswith("http"):
        return (
            np.array(Image.open(requests.get(img, stream=True, timeout=60).raw).convert("BGR")),
            # return url as image name
            img,
        )

    # The image is a path
    if os.path.isfile(img) is not True:
        raise ValueError(f"Confirm that {img} exists")

    # image must be a file on the system then

    # image name must have english characters
    if img.isascii() is False:
        raise ValueError(f"Input image must not have non-english characters - {img}")

    img_obj_bgr = cv2.imread(img)
    # img_obj_rgb = cv2.cvtColor(img_obj_bgr, cv2.COLOR_BGR2RGB)
    return img_obj_bgr, img


def load_base64(uri: str) -> np.ndarray:
    """Load image from base64 string.

    Args:
        uri: a base64 string.

    Returns:
        numpy array: the loaded image.
    """
    encoded_data = uri.split(",")[1]
    nparr = np.fromstring(base64.b64decode(encoded_data), np.uint8)
    img_bgr = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
    # img_rgb = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)
    return img_bgr


def normalize_input(img: np.ndarray, normalization: str = "base") -> np.ndarray:
    """Normalize input image.

    Args:
        img (numpy array): the input image.
        normalization (str, optional): the normalization technique. Defaults to "base",
        for no normalization.

    Returns:
        numpy array: the normalized image.
    """

    # issue 131 declares that some normalization techniques improves the accuracy

    if normalization == "base":
        return img

    # @trevorgribble and @davedgd contributed this feature
    # restore input in scale of [0, 255] because it was normalized in scale of
    # [0, 1] in preprocess_face
    img *= 255

    if normalization == "raw":
        pass  # return just restored pixels

    elif normalization == "Facenet":
        mean, std = img.mean(), img.std()
        img = (img - mean) / std

    elif normalization == "Facenet2018":
        # simply / 127.5 - 1 (similar to facenet 2018 model preprocessing step as @iamrishab posted)
        img /= 127.5
        img -= 1

    elif normalization == "VGGFace":
        # mean subtraction based on VGGFace1 training data
        img[..., 0] -= 93.5940
        img[..., 1] -= 104.7624
        img[..., 2] -= 129.1863

    elif normalization == "VGGFace2":
        # mean subtraction based on VGGFace2 training data
        img[..., 0] -= 91.4953
        img[..., 1] -= 103.8827
        img[..., 2] -= 131.0912

    elif normalization == "ArcFace":
        # Reference study: The faces are cropped and resized to 112×112,
        # and each pixel (ranged between [0, 255]) in RGB images is normalised
        # by subtracting 127.5 then divided by 128.
        img -= 127.5
        img /= 128
    else:
        raise ValueError(f"unimplemented normalization type - {normalization}")

    return img
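A quick usage sketch of the new preprocessing helpers (the image path is a placeholder taken from the test dataset; output shapes depend on the input):

from deepface.modules import preprocessing

# load_image accepts a file path, URL, base64 string or numpy array and returns BGR pixels
img, name = preprocessing.load_image("dataset/img11.jpg")

# normalize_input expects pixels already scaled to [0, 1] (as produced by extract_faces)
# and applies the model-specific scheme, e.g. Facenet-style standardization
normalized = preprocessing.normalize_input(
    img=img.astype("float32") / 255.0, normalization="Facenet"
)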
@@ -12,7 +12,7 @@ from tqdm import tqdm

# project dependencies
from deepface.commons import functions, distance as dst
from deepface.commons.logger import Logger
from deepface.modules import representation
from deepface.modules import representation, detection

logger = Logger(module="deepface/modules/recognition.py")
@@ -202,8 +202,8 @@ def find(
    )

    # img path might have more than once face
    source_objs = functions.extract_faces(
        img=img_path,
    source_objs = detection.extract_faces(
        img_path=img_path,
        target_size=target_size,
        detector_backend=detector_backend,
        grayscale=False,
@@ -213,7 +213,9 @@ def find(

    resp_obj = []

    for source_img, source_region, _ in source_objs:
    for source_obj in source_objs:
        source_img = source_obj["face"]
        source_region = source_obj["facial_area"]
        target_embedding_obj = representation.represent(
            img_path=source_img,
            model_name=model_name,
@@ -333,8 +335,8 @@ def __find_bulk_embeddings(
        desc="Finding representations",
        disable=silent,
    ):
        img_objs = functions.extract_faces(
            img=employee,
        img_objs = detection.extract_faces(
            img_path=employee,
            target_size=target_size,
            detector_backend=detector_backend,
            grayscale=False,
@@ -342,7 +344,9 @@ def __find_bulk_embeddings(
            align=align,
        )

        for img_content, img_region, _ in img_objs:
        for img_obj in img_objs:
            img_content = img_obj["face"]
            img_region = img_obj["facial_area"]
            embedding_obj = representation.represent(
                img_path=img_content,
                model_name=model_name,
@@ -6,7 +6,7 @@ import numpy as np
import cv2

# project dependencies
from deepface.modules import modeling
from deepface.modules import modeling, detection, preprocessing
from deepface.commons import functions
from deepface.models.FacialRecognition import FacialRecognition
@@ -63,8 +63,8 @@ def represent(
    # we have run pre-process in verification. so, this can be skipped if it is coming from verify.
    target_size = functions.find_target_size(model_name=model_name)
    if detector_backend != "skip":
        img_objs = functions.extract_faces(
            img=img_path,
        img_objs = detection.extract_faces(
            img_path=img_path,
            target_size=(target_size[1], target_size[0]),
            detector_backend=detector_backend,
            grayscale=False,
@@ -73,7 +73,7 @@ def represent(
        )
    else:  # skip
        # Try load. If load error, will raise exception internal
        img, _ = functions.load_image(img_path)
        img, _ = preprocessing.load_image(img_path)
        # --------------------------------
        if len(img.shape) == 4:
            img = img[0]  # e.g. (1, 224, 224, 3) to (224, 224, 3)
@@ -85,13 +85,21 @@ def represent(
                img = (img.astype(np.float32) / 255.0).astype(np.float32)
        # --------------------------------
        # make dummy region and confidence to keep compatibility with `extract_faces`
        img_region = {"x": 0, "y": 0, "w": img.shape[1], "h": img.shape[2]}
        img_objs = [(img, img_region, 0)]
        img_objs = [
            {
                "face": img,
                "facial_area": {"x": 0, "y": 0, "w": img.shape[1], "h": img.shape[2]},
                "confidence": 0,
            }
        ]
    # ---------------------------------

    for img, region, confidence in img_objs:
    for img_obj in img_objs:
        img = img_obj["face"]
        region = img_obj["facial_area"]
        confidence = img_obj["confidence"]
        # custom normalization
        img = functions.normalize_input(img=img, normalization=normalization)
        img = preprocessing.normalize_input(img=img, normalization=normalization)

        embedding = model.find_embeddings(img)
@@ -7,7 +7,7 @@ import numpy as np

# project dependencies
from deepface.commons import functions, distance as dst
from deepface.modules import representation
from deepface.modules import representation, detection


def verify(
@@ -82,8 +82,8 @@ def verify(
    target_size = functions.find_target_size(model_name=model_name)

    # img pairs might have many faces
    img1_objs = functions.extract_faces(
        img=img1_path,
    img1_objs = detection.extract_faces(
        img_path=img1_path,
        target_size=target_size,
        detector_backend=detector_backend,
        grayscale=False,
@@ -91,8 +91,8 @@ def verify(
        align=align,
    )

    img2_objs = functions.extract_faces(
        img=img2_path,
    img2_objs = detection.extract_faces(
        img_path=img2_path,
        target_size=target_size,
        detector_backend=detector_backend,
        grayscale=False,
@@ -103,8 +103,12 @@ def verify(
    distances = []
    regions = []
    # now we will find the face pair with minimum distance
    for img1_content, img1_region, _ in img1_objs:
        for img2_content, img2_region, _ in img2_objs:
    for img1_obj in img1_objs:
        img1_content = img1_obj["face"]
        img1_region = img1_obj["facial_area"]
        for img2_obj in img2_objs:
            img2_content = img2_obj["face"]
            img2_region = img2_obj["facial_area"]
            img1_embedding_obj = representation.represent(
                img_path=img1_content,
                model_name=model_name,
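The nested loops above compare every face pair between the two images and keep the pair with the minimum distance. A rough sketch of that idea, using a plain NumPy cosine distance instead of deepface.commons.distance, with hypothetical img1_embeddings / img2_embeddings lists and a placeholder threshold:

import numpy as np

def cosine_distance(a, b):
    # 1 - cosine similarity between two embedding vectors
    a, b = np.asarray(a), np.asarray(b)
    return 1.0 - float(np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b)))

distances = [cosine_distance(e1, e2) for e1 in img1_embeddings for e2 in img2_embeddings]
threshold = 0.40  # placeholder; real thresholds depend on the model and metric
verified = min(distances) <= threshold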
@@ -1,12 +1,14 @@
import numpy as np
import pytest
from deepface import DeepFace
from deepface.commons.logger import Logger

logger = Logger("tests/test_extract_faces.py")


def test_different_detectors():
detectors = ["opencv", "mtcnn"]


def test_different_detectors():
    for detector in detectors:
        img_objs = DeepFace.extract_faces(img_path="dataset/img11.jpg", detector_backend=detector)
        for img_obj in img_objs:
@@ -22,3 +24,21 @@ def test_different_detectors():
            img = img_obj["face"]
            assert img.shape[0] > 0 and img.shape[1] > 0
        logger.info(f"✅ extract_faces for {detector} backend test is done")


def test_backends_for_enforced_detection_with_non_facial_inputs():
    black_img = np.zeros([224, 224, 3])
    for detector in detectors:
        with pytest.raises(ValueError):
            _ = DeepFace.extract_faces(img_path=black_img, detector_backend=detector)
    logger.info("✅ extract_faces for enforced detection and non-facial image test is done")


def test_backends_for_not_enforced_detection_with_non_facial_inputs():
    black_img = np.zeros([224, 224, 3])
    for detector in detectors:
        objs = DeepFace.extract_faces(
            img_path=black_img, detector_backend=detector, enforce_detection=False
        )
        assert objs[0]["face"].shape == (224, 224, 3)
    logger.info("✅ extract_faces for not enforced detection and non-facial image test is done")
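To try the updated behaviour locally, the new tests can be run in the usual pytest way (assuming a deepface checkout with the test dataset in place):

python -m pytest tests/test_extract_faces.py -q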