[update] enhance predict methods in Emotion and Race models to support single and batch inputs

2025-07-23 02:10:02 +00:00 · 2024-12-17 13:55:07 +08:00 · 2024-12-17 13:55:07 +08:00 · 38c06522a5
commit 38c06522a5
parent 27e8fc9d5e
2 changed files with 94 additions and 11 deletions
--- a/deepface/models/demography/Emotion.py
+++ b/deepface/models/demography/Emotion.py
@ -1,3 +1,6 @@
 # stdlib dependencies
 from typing import List, Union
 # 3rd party dependencies
 import numpy as np
 import cv2
@ -43,16 +46,61 @@ class EmotionClient(Demography):
        self.model = load_model()
        self.model_name = "Emotion"
-    def predict(self, img: np.ndarray) -> np.ndarray:
+    def _preprocess_image(self, img: np.ndarray) -> np.ndarray:
-        img_gray = cv2.cvtColor(img[0], cv2.COLOR_BGR2GRAY)
+        """
        Preprocess single image for emotion detection
        Args:
            img: Input image (224, 224, 3)
        Returns:
            Preprocessed grayscale image (48, 48)
        """
        img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
        img_gray = cv2.resize(img_gray, (48, 48))
-        img_gray = np.expand_dims(img_gray, axis=0)
+        return img_gray
-        # model.predict causes memory issue when it is called in a for loop
+    def predict(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[np.ndarray, np.ndarray]:
-        # emotion_predictions = self.model.predict(img_gray, verbose=0)[0, :]
+        """
-        emotion_predictions = self.model(img_gray, training=False).numpy()[0, :]
+        Predict emotion probabilities for single or multiple faces
        Args:
            img: Single image as np.ndarray (224, 224, 3) or
                List of images as List[np.ndarray] or
                Batch of images as np.ndarray (n, 224, 224, 3)
        Returns:
            Single prediction as np.ndarray (n_emotions,) [emotion_probs] or
            Multiple predictions as np.ndarray (n, n_emotions)
            where n_emotions is the number of emotion categories
        """
        # Convert to numpy array if input is list
        if isinstance(img, list):
            imgs = np.array(img)
        else:
            imgs = img
        # Remove batch dimension if exists
        imgs = imgs.squeeze()
        # Check input dimension
        if len(imgs.shape) == 3:
            # Single image - add batch dimension
            imgs = np.expand_dims(imgs, axis=0)
            is_single = True
        else:
            is_single = False
        # Preprocess each image
        processed_imgs = np.array([self._preprocess_image(img) for img in imgs])
        # Add channel dimension for grayscale images
        processed_imgs = np.expand_dims(processed_imgs, axis=-1)
        # Batch prediction
        predictions = self.model.predict_on_batch(processed_imgs)
        # Return single prediction for single image
        if is_single:
            return predictions[0]
        return predictions
        return emotion_predictions
 def load_model(
--- a/deepface/models/demography/Race.py
+++ b/deepface/models/demography/Race.py
@ -1,3 +1,6 @@
 # stdlib dependencies
 from typing import List, Union
 # 3rd party dependencies
 import numpy as np
@ -37,10 +40,42 @@ class RaceClient(Demography):
        self.model = load_model()
        self.model_name = "Race"
-    def predict(self, img: np.ndarray) -> np.ndarray:
+    def predict(self, img: Union[np.ndarray, List[np.ndarray]]) -> Union[np.ndarray, np.ndarray]:
-        # model.predict causes memory issue when it is called in a for loop
+        """
-        # return self.model.predict(img, verbose=0)[0, :]
+        Predict race probabilities for single or multiple faces
-        return self.model(img, training=False).numpy()[0, :]
+        Args:
            img: Single image as np.ndarray (224, 224, 3) or
                List of images as List[np.ndarray] or
                Batch of images as np.ndarray (n, 224, 224, 3)
        Returns:
            Single prediction as np.ndarray (n_races,) [race_probs] or
            Multiple predictions as np.ndarray (n, n_races)
            where n_races is the number of race categories
        """
        # Convert to numpy array if input is list
        if isinstance(img, list):
            imgs = np.array(img)
        else:
            imgs = img
        # Remove batch dimension if exists
        imgs = imgs.squeeze()
        # Check input dimension
        if len(imgs.shape) == 3:
            # Single image - add batch dimension
            imgs = np.expand_dims(imgs, axis=0)
            is_single = True
        else:
            is_single = False
        # Batch prediction
        predictions = self.model.predict_on_batch(imgs)
        # Return single prediction for single image
        if is_single:
            return predictions[0]
        return predictions
 def load_model(