mirror of
https://github.com/serengil/deepface.git
synced 2025-06-07 12:05:22 +00:00
improved flexibility for recurring operations
This commit is contained in:
parent
ca6afd98ef
commit
ff47b71455
@ -262,6 +262,83 @@ def analyze(
|
|||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def analyze_from_image_objects(
    img_objs: List[Dict[str, Any]],
    actions: Union[tuple, list] = ("emotion", "age", "gender", "race"),
    silent: bool = False,
    anti_spoofing: bool = False,
) -> List[Dict[str, Any]]:
    """
    Analyze facial attributes (age, gender, emotion, race) for already-extracted faces.

    Args:
        img_objs (List[Dict[str, Any]]): Output of detection.extract_faces.

        actions (tuple): Attributes to analyze. The default is ('age', 'gender', 'emotion', 'race').
            You can exclude some of these attributes from the analysis if needed.

        silent (boolean): Suppress or allow some log messages for a quieter analysis process
            (default is False).

        anti_spoofing (boolean): Flag to enable anti spoofing (default is False).

    Returns:
        results (List[Dict[str, Any]]): A list of dictionaries, one per detected face,
            with the following keys:

            - 'region' (dict): Rectangular region of the detected face in the image,
              with 'x', 'y' (top-left corner), 'w' (width) and 'h' (height).

            - 'age' (float): Estimated age of the detected face.

            - 'face_confidence' (float): Confidence score for the detected face,
              indicating the reliability of the face detection.

            - 'dominant_gender' (str): Either "Man" or "Woman."

            - 'gender' (dict): Confidence scores per gender category ('Man', 'Woman').

            - 'dominant_emotion' (str): One of "sad," "angry," "surprise," "fear,"
              "happy," "disgust," or "neutral."

            - 'emotion' (dict): Confidence scores per emotion category
              ('sad', 'angry', 'surprise', 'fear', 'happy', 'disgust', 'neutral').

            - 'dominant_race' (str): One of "indian," "asian," "latino hispanic,"
              "black," "middle eastern," or "white."

            - 'race' (dict): Confidence scores per race category
              ('indian', 'asian', 'latino hispanic', 'black', 'middle eastern', 'white').
    """
    # Thin public-API pass-through: all analysis logic lives in the demography module.
    forwarded_kwargs = {
        "img_objs": img_objs,
        "actions": actions,
        "silent": silent,
        "anti_spoofing": anti_spoofing,
    }
    return demography.analyze_from_image_objects(**forwarded_kwargs)
|
||||||
|
|
||||||
|
|
||||||
def find(
|
def find(
|
||||||
img_path: Union[str, np.ndarray],
|
img_path: Union[str, np.ndarray],
|
||||||
db_path: str,
|
db_path: str,
|
||||||
@ -440,6 +517,52 @@ def represent(
|
|||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def represent_from_image_objects(
    img_objs: List[Dict[str, Any]],
    model_name: str = "VGG-Face",
    normalization: str = "base",
    anti_spoofing: bool = False,
    max_faces: Optional[int] = None,
) -> List[Dict[str, Any]]:
    """
    Represent already-extracted faces as multi-dimensional vector embeddings.

    Args:
        img_objs (List[Dict[str, Any]]): Output of detection.extract_faces.

        model_name (str): Model for face recognition. Options: VGG-Face, Facenet, Facenet512,
            OpenFace, DeepFace, DeepID, Dlib, ArcFace, SFace and GhostFaceNet

        normalization (string): Normalize the input image before feeding it to the model.
            Default is base. Options: base, raw, Facenet, Facenet2018, VGGFace, VGGFace2, ArcFace

        anti_spoofing (boolean): Flag to enable anti spoofing (default is False).

        max_faces (int): Set a limit on the number of faces to be processed (default is None).

    Returns:
        results (List[Dict[str, Any]]): A list of dictionaries, each containing the
            following fields:

            - embedding (List[float]): Multidimensional vector representing facial features.
              The number of dimensions varies based on the reference model
              (e.g., FaceNet returns 128 dimensions, VGG-Face returns 4096 dimensions).

            - facial_area (dict): Detected facial area by face detection in dictionary format.
              Contains 'x' and 'y' as the left-corner point, and 'w' and 'h'
              as the width and height. If `detector_backend` is set to 'skip', it represents
              the full image area and is nonsensical.

            - face_confidence (float): Confidence score of face detection. If `detector_backend`
              is set to 'skip', the confidence will be 0 and is nonsensical.
    """
    # Thin public-API pass-through: the embedding logic lives in the representation module.
    forwarded_kwargs = {
        "img_objs": img_objs,
        "model_name": model_name,
        "normalization": normalization,
        "anti_spoofing": anti_spoofing,
        "max_faces": max_faces,
    }
    return representation.represent_from_image_objects(**forwarded_kwargs)
|
||||||
|
|
||||||
|
|
||||||
def stream(
|
def stream(
|
||||||
db_path: str = "",
|
db_path: str = "",
|
||||||
model_name: str = "VGG-Face",
|
model_name: str = "VGG-Face",
|
||||||
|
@ -100,6 +100,94 @@ def analyze(
|
|||||||
- 'white': Confidence score for White ethnicity.
|
- 'white': Confidence score for White ethnicity.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
img_objs = detection.extract_faces(
|
||||||
|
img_path=img_path,
|
||||||
|
detector_backend=detector_backend,
|
||||||
|
enforce_detection=enforce_detection,
|
||||||
|
grayscale=False,
|
||||||
|
align=align,
|
||||||
|
expand_percentage=expand_percentage,
|
||||||
|
anti_spoofing=anti_spoofing,
|
||||||
|
)
|
||||||
|
|
||||||
|
return analyze_from_image_objects(
|
||||||
|
img_objs=img_objs,
|
||||||
|
actions=actions,
|
||||||
|
silent=silent,
|
||||||
|
anti_spoofing=anti_spoofing
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def analyze_from_image_objects(
|
||||||
|
img_objs: List[Dict[str, Any]],
|
||||||
|
actions: Union[tuple, list] = ("emotion", "age", "gender", "race"),
|
||||||
|
silent: bool = False,
|
||||||
|
anti_spoofing: bool = False,
|
||||||
|
) -> List[Dict[str, Any]]:
|
||||||
|
"""
|
||||||
|
Analyze facial attributes such as age, gender, emotion, and race in the provided image.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
img_objs (List[Dict[str, Any]]): Output of detection.extract_faces.
|
||||||
|
|
||||||
|
actions (tuple): Attributes to analyze. The default is ('age', 'gender', 'emotion', 'race').
|
||||||
|
You can exclude some of these attributes from the analysis if needed.
|
||||||
|
|
||||||
|
silent (boolean): Suppress or allow some log messages for a quieter analysis process
|
||||||
|
(default is False).
|
||||||
|
|
||||||
|
anti_spoofing (boolean): Flag to enable anti spoofing (default is False).
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
results (List[Dict[str, Any]]): A list of dictionaries, where each dictionary represents
|
||||||
|
the analysis results for a detected face.
|
||||||
|
|
||||||
|
Each dictionary in the list contains the following keys:
|
||||||
|
|
||||||
|
- 'region' (dict): Represents the rectangular region of the detected face in the image.
|
||||||
|
- 'x': x-coordinate of the top-left corner of the face.
|
||||||
|
- 'y': y-coordinate of the top-left corner of the face.
|
||||||
|
- 'w': Width of the detected face region.
|
||||||
|
- 'h': Height of the detected face region.
|
||||||
|
|
||||||
|
- 'age' (float): Estimated age of the detected face.
|
||||||
|
|
||||||
|
- 'face_confidence' (float): Confidence score for the detected face.
|
||||||
|
Indicates the reliability of the face detection.
|
||||||
|
|
||||||
|
- 'dominant_gender' (str): The dominant gender in the detected face.
|
||||||
|
Either "Man" or "Woman."
|
||||||
|
|
||||||
|
- 'gender' (dict): Confidence scores for each gender category.
|
||||||
|
- 'Man': Confidence score for the male gender.
|
||||||
|
- 'Woman': Confidence score for the female gender.
|
||||||
|
|
||||||
|
- 'dominant_emotion' (str): The dominant emotion in the detected face.
|
||||||
|
Possible values include "sad," "angry," "surprise," "fear," "happy,"
|
||||||
|
"disgust," and "neutral."
|
||||||
|
|
||||||
|
- 'emotion' (dict): Confidence scores for each emotion category.
|
||||||
|
- 'sad': Confidence score for sadness.
|
||||||
|
- 'angry': Confidence score for anger.
|
||||||
|
- 'surprise': Confidence score for surprise.
|
||||||
|
- 'fear': Confidence score for fear.
|
||||||
|
- 'happy': Confidence score for happiness.
|
||||||
|
- 'disgust': Confidence score for disgust.
|
||||||
|
- 'neutral': Confidence score for neutrality.
|
||||||
|
|
||||||
|
- 'dominant_race' (str): The dominant race in the detected face.
|
||||||
|
Possible values include "indian," "asian," "latino hispanic,"
|
||||||
|
"black," "middle eastern," and "white."
|
||||||
|
|
||||||
|
- 'race' (dict): Confidence scores for each race category.
|
||||||
|
- 'indian': Confidence score for Indian ethnicity.
|
||||||
|
- 'asian': Confidence score for Asian ethnicity.
|
||||||
|
- 'latino hispanic': Confidence score for Latino/Hispanic ethnicity.
|
||||||
|
- 'black': Confidence score for Black ethnicity.
|
||||||
|
- 'middle eastern': Confidence score for Middle Eastern ethnicity.
|
||||||
|
- 'white': Confidence score for White ethnicity.
|
||||||
|
"""
|
||||||
|
|
||||||
# if actions is passed as tuple with single item, interestingly it becomes str here
|
# if actions is passed as tuple with single item, interestingly it becomes str here
|
||||||
if isinstance(actions, str):
|
if isinstance(actions, str):
|
||||||
actions = (actions,)
|
actions = (actions,)
|
||||||
@ -120,16 +208,6 @@ def analyze(
|
|||||||
# ---------------------------------
|
# ---------------------------------
|
||||||
resp_objects = []
|
resp_objects = []
|
||||||
|
|
||||||
img_objs = detection.extract_faces(
|
|
||||||
img_path=img_path,
|
|
||||||
detector_backend=detector_backend,
|
|
||||||
enforce_detection=enforce_detection,
|
|
||||||
grayscale=False,
|
|
||||||
align=align,
|
|
||||||
expand_percentage=expand_percentage,
|
|
||||||
anti_spoofing=anti_spoofing,
|
|
||||||
)
|
|
||||||
|
|
||||||
for img_obj in img_objs:
|
for img_obj in img_objs:
|
||||||
if anti_spoofing is True and img_obj.get("is_real", True) is False:
|
if anti_spoofing is True and img_obj.get("is_real", True) is False:
|
||||||
raise ValueError("Spoof detected in the given image.")
|
raise ValueError("Spoof detected in the given image.")
|
||||||
|
@ -64,15 +64,9 @@ def represent(
|
|||||||
- face_confidence (float): Confidence score of face detection. If `detector_backend` is set
|
- face_confidence (float): Confidence score of face detection. If `detector_backend` is set
|
||||||
to 'skip', the confidence will be 0 and is nonsensical.
|
to 'skip', the confidence will be 0 and is nonsensical.
|
||||||
"""
|
"""
|
||||||
resp_objs = []
|
|
||||||
|
|
||||||
model: FacialRecognition = modeling.build_model(
|
|
||||||
task="facial_recognition", model_name=model_name
|
|
||||||
)
|
|
||||||
|
|
||||||
# ---------------------------------
|
# ---------------------------------
|
||||||
# we have run pre-process in verification. so, this can be skipped if it is coming from verify.
|
# we have run pre-process in verification. so, this can be skipped if it is coming from verify.
|
||||||
target_size = model.input_shape
|
|
||||||
if detector_backend != "skip":
|
if detector_backend != "skip":
|
||||||
img_objs = detection.extract_faces(
|
img_objs = detection.extract_faces(
|
||||||
img_path=img_path,
|
img_path=img_path,
|
||||||
@ -101,6 +95,60 @@ def represent(
|
|||||||
]
|
]
|
||||||
# ---------------------------------
|
# ---------------------------------
|
||||||
|
|
||||||
|
return represent_from_image_objects(
|
||||||
|
img_objs=img_objs,
|
||||||
|
model_name=model_name,
|
||||||
|
normalization=normalization,
|
||||||
|
anti_spoofing=anti_spoofing,
|
||||||
|
max_faces=max_faces
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def represent_from_image_objects(
|
||||||
|
img_objs: List[Dict[str, Any]],
|
||||||
|
model_name: str = "VGG-Face",
|
||||||
|
normalization: str = "base",
|
||||||
|
anti_spoofing: bool = False,
|
||||||
|
max_faces: Optional[int] = None,
|
||||||
|
) -> List[Dict[str, Any]]:
|
||||||
|
"""
|
||||||
|
Represent facial images as multi-dimensional vector embeddings.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
img_objs (List[Dict[str, Any]]): Output of detection.extract_faces.
|
||||||
|
|
||||||
|
model_name (str): Model for face recognition. Options: VGG-Face, Facenet, Facenet512,
|
||||||
|
OpenFace, DeepFace, DeepID, Dlib, ArcFace, SFace and GhostFaceNet
|
||||||
|
|
||||||
|
normalization (string): Normalize the input image before feeding it to the model.
|
||||||
|
Default is base. Options: base, raw, Facenet, Facenet2018, VGGFace, VGGFace2, ArcFace
|
||||||
|
|
||||||
|
anti_spoofing (boolean): Flag to enable anti spoofing (default is False).
|
||||||
|
|
||||||
|
max_faces (int): Set a limit on the number of faces to be processed (default is None).
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
results (List[Dict[str, Any]]): A list of dictionaries, each containing the
|
||||||
|
following fields:
|
||||||
|
|
||||||
|
- embedding (List[float]): Multidimensional vector representing facial features.
|
||||||
|
The number of dimensions varies based on the reference model
|
||||||
|
(e.g., FaceNet returns 128 dimensions, VGG-Face returns 4096 dimensions).
|
||||||
|
- facial_area (dict): Detected facial area by face detection in dictionary format.
|
||||||
|
Contains 'x' and 'y' as the left-corner point, and 'w' and 'h'
|
||||||
|
as the width and height. If `detector_backend` is set to 'skip', it represents
|
||||||
|
the full image area and is nonsensical.
|
||||||
|
- face_confidence (float): Confidence score of face detection. If `detector_backend` is set
|
||||||
|
to 'skip', the confidence will be 0 and is nonsensical.
|
||||||
|
"""
|
||||||
|
resp_objs = []
|
||||||
|
|
||||||
|
model: FacialRecognition = modeling.build_model(
|
||||||
|
task="facial_recognition", model_name=model_name
|
||||||
|
)
|
||||||
|
|
||||||
|
target_size = model.input_shape
|
||||||
|
|
||||||
if max_faces is not None and max_faces < len(img_objs):
|
if max_faces is not None and max_faces < len(img_objs):
|
||||||
# sort as largest facial areas come first
|
# sort as largest facial areas come first
|
||||||
img_objs = sorted(
|
img_objs = sorted(
|
||||||
|
Loading…
x
Reference in New Issue
Block a user