reproduce experiments procedures added

This commit is contained in:
Sefik Ilkin Serengil 2024-04-07 08:57:32 +01:00
parent 357a397f1b
commit 8fbc25612b
4 changed files with 2142 additions and 0 deletions

1687
benchmarks/Evaluate-Results.ipynb vendored Normal file

File diff suppressed because one or more lines are too long

351
benchmarks/Perform-Experiments.ipynb vendored Normal file

@@ -0,0 +1,351 @@
{
"cells": [
{
"cell_type": "markdown",
"id": "8133a99d",
"metadata": {},
"source": [
"# Perform Experiments with DeepFace on LFW dataset"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "5aab0cbe",
"metadata": {},
"outputs": [],
"source": [
"# built-in dependencies\n",
"import os\n",
"\n",
"# 3rd party dependencies\n",
"import numpy as np\n",
"import pandas as pd\n",
"from tqdm import tqdm\n",
"import matplotlib.pyplot as plt\n",
"from sklearn.metrics import accuracy_score\n",
"from sklearn.datasets import fetch_lfw_pairs\n",
"from deepface import DeepFace"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "64c9ed9a",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"This experiment is done with pip package of deepface with 0.0.89 version\n"
]
}
],
"source": [
"print(f\"This experiment is done with pip package of deepface with {DeepFace.__version__} version\")"
]
},
{
"cell_type": "markdown",
"id": "feaec973",
"metadata": {},
"source": [
"### Configuration Sets"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "453104b4",
"metadata": {},
"outputs": [],
"source": [
"# all configuration alternatives for 4 dimensions of arguments\n",
"alignment = [True, False]\n",
"models = [\"Facenet\", \"Facenet512\", \"VGG-Face\", \"ArcFace\", \"Dlib\", \"GhostFaceNet\", \"SFace\", \"OpenFace\", \"DeepFace\", \"DeepID\"]\n",
"detectors = [\"retinaface\", \"mtcnn\", \"dlib\", \"yolov8\", \"yunet\", \"mediapipe\", \"ssd\", \"opencv\", \"skip\"]\n",
"metrics = [\"euclidean\", \"euclidean_l2\", \"cosine\"]\n",
"expand_percentage = 0"
]
},
{
"cell_type": "markdown",
"id": "c9aeb57a",
"metadata": {},
"source": [
"### Create Required Folders if necessary"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "671d8a00",
"metadata": {},
"outputs": [],
"source": [
"target_paths = [\"lfwe\", \"dataset\", \"outputs\", \"results\"]\n",
"for target_path in target_paths:\n",
" if os.path.exists(target_path) != True:\n",
" os.mkdir(target_path)\n",
" print(f\"{target_path} is just created\")"
]
},
{
"cell_type": "markdown",
"id": "fc31f03a",
"metadata": {},
"source": [
"### Load LFW Dataset"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "721a7d70",
"metadata": {},
"outputs": [],
"source": [
"pairs_touch = \"outputs/lfwe.txt\"\n",
"instances = 1000 #pairs.shape[0]"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "010184d8",
"metadata": {},
"outputs": [],
"source": [
"target_path = \"dataset/lfw.npy\"\n",
"labels_path = \"dataset/labels.npy\"\n",
"\n",
"if os.path.exists(target_path) != True:\n",
" fetch_lfw_pairs = fetch_lfw_pairs(subset = 'test', color = True\n",
" , resize = 2\n",
" , funneled = False\n",
" , slice_=None\n",
" )\n",
" pairs = fetch_lfw_pairs.pairs\n",
" labels = fetch_lfw_pairs.target\n",
" target_names = fetch_lfw_pairs.target_names\n",
" np.save(target_path, pairs)\n",
" np.save(labels_path, labels)\n",
"else:\n",
" if os.path.exists(pairs_touch) != True:\n",
" # loading pairs takes some time. but if we extract these pairs as image, no need to load it anymore\n",
" pairs = np.load(target_path)\n",
" labels = np.load(labels_path) "
]
},
{
"cell_type": "markdown",
"id": "005f582e",
"metadata": {},
"source": [
"### Save LFW image pairs into file system"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "5bc23313",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"100%|██████████| 1000/1000 [00:00<00:00, 219746.63it/s]\n"
]
}
],
"source": [
"for i in tqdm(range(0, instances)):\n",
" img1_target = f\"lfwe/{i}_1.jpg\"\n",
" img2_target = f\"lfwe/{i}_2.jpg\"\n",
" \n",
" if os.path.exists(img1_target) != True:\n",
" img1 = pairs[i][0]\n",
" # plt.imsave(img1_target, img1/255) #works for my mac\n",
" plt.imsave(img1_target, img1) #works for my debian\n",
" \n",
" if os.path.exists(img2_target) != True:\n",
" img2 = pairs[i][1]\n",
" # plt.imsave(img2_target, img2/255) #works for my mac\n",
" plt.imsave(img2_target, img2) #works for my debian\n",
" \n",
"if os.path.exists(pairs_touch) != True:\n",
" open(pairs_touch,'a').close()"
]
},
{
"cell_type": "markdown",
"id": "6f8fa8fa",
"metadata": {},
"source": [
"### Perform Experiments\n",
"\n",
"This block will save the experiments results in outputs folder"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "e7fba936",
"metadata": {},
"outputs": [],
"source": [
"for model_name in models:\n",
" for detector_backend in detectors:\n",
" for distance_metric in metrics:\n",
" for align in alignment:\n",
" \n",
" if detector_backend == \"skip\" and align is True:\n",
" # Alignment is not possible for a skipped detector configuration\n",
" continue\n",
" \n",
" alignment_text = \"aligned\" if align is True else \"unaligned\"\n",
" task = f\"{model_name}_{detector_backend}_{distance_metric}_{alignment_text}\"\n",
" output_file = f\"outputs/{task}.csv\"\n",
" if os.path.exists(output_file) is True:\n",
" #print(f\"{output_file} is available already\")\n",
" continue\n",
" \n",
" distances = []\n",
" for i in tqdm(range(0, instances), desc = task):\n",
" img1_target = f\"lfwe/{i}_1.jpg\"\n",
" img2_target = f\"lfwe/{i}_2.jpg\"\n",
" result = DeepFace.verify(\n",
" img1_path=img1_target,\n",
" img2_path=img2_target,\n",
" model_name=model_name,\n",
" detector_backend=detector_backend,\n",
" distance_metric=distance_metric,\n",
" align=align,\n",
" enforce_detection=False,\n",
" expand_percentage=expand_percentage,\n",
" )\n",
" distance = result[\"distance\"]\n",
" distances.append(distance)\n",
" # -----------------------------------\n",
" df = pd.DataFrame(list(labels), columns = [\"actuals\"])\n",
" df[\"distances\"] = distances\n",
" df.to_csv(output_file, index=False)"
]
},
{
"cell_type": "markdown",
"id": "a0b8dafa",
"metadata": {},
"source": [
"### Calculate Results\n",
"\n",
"Experiments were responsible for calculating distances. We will calculate the best accuracy scores in this block."
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "67376e76",
"metadata": {},
"outputs": [],
"source": [
"data = [[0 for _ in range(len(models))] for _ in range(len(detectors))]\n",
"base_df = pd.DataFrame(data, columns=models, index=detectors)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "f2cc536b",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"results/pivot_euclidean_with_alignment_True.csv saved\n",
"results/pivot_euclidean_l2_with_alignment_True.csv saved\n",
"results/pivot_cosine_with_alignment_True.csv saved\n",
"results/pivot_euclidean_with_alignment_False.csv saved\n",
"results/pivot_euclidean_l2_with_alignment_False.csv saved\n",
"results/pivot_cosine_with_alignment_False.csv saved\n"
]
}
],
"source": [
"for is_aligned in alignment:\n",
" for distance_metric in metrics:\n",
"\n",
" current_df = base_df.copy()\n",
" \n",
" target_file = f\"results/pivot_{distance_metric}_with_alignment_{is_aligned}.csv\"\n",
" if os.path.exists(target_file):\n",
" continue\n",
" \n",
" for model_name in models:\n",
" for detector_backend in detectors:\n",
"\n",
" align = \"aligned\" if is_aligned is True else \"unaligned\"\n",
"\n",
" if detector_backend == \"skip\" and is_aligned is True:\n",
" # Alignment is not possible for a skipped detector configuration\n",
" align = \"unaligned\"\n",
"\n",
" source_file = f\"outputs/{model_name}_{detector_backend}_{distance_metric}_{align}.csv\"\n",
" df = pd.read_csv(source_file)\n",
" \n",
" positive_mean = df[(df[\"actuals\"] == True) | (df[\"actuals\"] == 1)][\"distances\"].mean()\n",
" negative_mean = df[(df[\"actuals\"] == False) | (df[\"actuals\"] == 0)][\"distances\"].mean()\n",
"\n",
" distances = sorted(df[\"distances\"].values.tolist())\n",
"\n",
" items = []\n",
" for i, distance in enumerate(distances):\n",
" if distance >= positive_mean and distance <= negative_mean:\n",
" sandbox_df = df.copy()\n",
" sandbox_df[\"predictions\"] = False\n",
" idx = sandbox_df[sandbox_df[\"distances\"] < distance].index\n",
" sandbox_df.loc[idx, \"predictions\"] = True\n",
"\n",
" actuals = sandbox_df.actuals.values.tolist()\n",
" predictions = sandbox_df.predictions.values.tolist()\n",
" accuracy = 100*accuracy_score(actuals, predictions)\n",
" items.append((distance, accuracy))\n",
"\n",
" pivot_df = pd.DataFrame(items, columns = [\"distance\", \"accuracy\"])\n",
" pivot_df = pivot_df.sort_values(by = [\"accuracy\"], ascending = False)\n",
" # threshold = pivot_df.iloc[0][\"distance\"]\n",
" accuracy = pivot_df.iloc[0][\"accuracy\"]\n",
"\n",
" # print(source_file, round(accuracy, 1))\n",
" current_df.at[detector_backend, model_name] = round(accuracy, 1)\n",
" \n",
" current_df.to_csv(target_file)\n",
" print(f\"{target_file} saved\")"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.16"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

104
benchmarks/README.md Normal file

@@ -0,0 +1,104 @@
# Benchmarks
DeepFace offers various configurations that significantly impact accuracy, including the facial recognition model, face detector model, distance metric, and alignment mode. Our experiments conducted on the [LFW dataset](https://sefiks.com/2020/08/27/labeled-faces-in-the-wild-for-face-recognition/) using different combinations of these configurations yield the following results.
You can reproduce these results by running the `Perform-Experiments.ipynb` and `Evaluate-Results.ipynb` notebooks, in that order.
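Each benchmark configuration corresponds to a single `DeepFace.verify` call. The snippet below is a minimal sketch of such a call; the image paths are placeholders for any LFW pair that `Perform-Experiments.ipynb` extracts to disk, and the argument values name just one arbitrary configuration from the matrices below.

```python
# Minimal sketch: score one LFW pair with one benchmarked configuration.
from deepface import DeepFace

result = DeepFace.verify(
    img1_path="lfwe/0_1.jpg",        # placeholder pair extracted by the notebook
    img2_path="lfwe/0_2.jpg",
    model_name="Facenet512",         # facial recognition model
    detector_backend="retinaface",   # face detector model
    distance_metric="euclidean_l2",  # distance metric
    align=True,                      # alignment mode
    enforce_detection=False,
)
print(result["verified"], result["distance"])
```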
## ROC Curves
ROC curves provide a valuable means of evaluating the performance of different models on a broader scale. The following illustration shows the ROC curve of each facial recognition model under its optimal configuration, i.e. the one yielding its highest accuracy score.
<!--
<p align="center"><img src="https://raw.githubusercontent.com/serengil/deepface/master/icon/benchmarks.jpg" width="95%" height="95%"></p>
-->
<p align="center"><img src="../icon/benchmarks.jpg" width="95%" height="95%"></p>
In summary, FaceNet-512d surpasses human-level accuracy and FaceNet-128d reaches it. Dlib, VGG-Face, and ArcFace follow closely but fall slightly short; GhostFaceNet and SFace deliver notable results without leading; and OpenFace, DeepFace, and DeepID show lower performance.
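The curves above are produced by `Evaluate-Results.ipynb`, whose diff is suppressed in this commit. As a rough, non-authoritative sketch, an equivalent curve can be derived from any per-configuration distance file written by `Perform-Experiments.ipynb`; the file name below is just one instance of the `outputs/{model}_{detector}_{metric}_{alignment}.csv` pattern.

```python
# Rough sketch: build an ROC curve from one distance file; Evaluate-Results.ipynb may differ.
import pandas as pd
from sklearn.metrics import auc, roc_curve

df = pd.read_csv("outputs/Facenet512_retinaface_euclidean_l2_aligned.csv")

# Smaller distances mean "same person", so negated distances serve as similarity scores.
fpr, tpr, _ = roc_curve(df["actuals"], -df["distances"])
print(f"AUC = {auc(fpr, tpr):.4f}")
```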
## Accuracy Scores
Please note that humans achieve a 97.5% accuracy score on the same dataset. Configurations that outperform this benchmark are highlighted in bold.
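If you regenerate the matrices yourself, a short check such as the sketch below can list the configurations passing that benchmark; it assumes the `results/pivot_*.csv` files written by `Perform-Experiments.ipynb` are present.

```python
# Rough sketch: flag detector/model pairs beating the 97.5% human-level score
# in one pivot file written by Perform-Experiments.ipynb.
import pandas as pd

pivot = pd.read_csv("results/pivot_euclidean_l2_with_alignment_True.csv", index_col=0)
for detector in pivot.index:
    for model in pivot.columns:
        if pivot.at[detector, model] > 97.5:
            print(f"{model} with {detector}: {pivot.at[detector, model]}%")
```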
### Performance Matrix for Euclidean while alignment is True
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |93.5 |95.9 |95.8 |85.2 |88.9 |85.9 |80.2 |69.4 |67.0 |65.6 |
| mtcnn |93.8 |95.2 |95.9 |83.7 |89.4 |83.0 |77.4 |70.2 |66.5 |63.3 |
| dlib |90.8 |96.0 |94.5 |88.6 |96.8 |65.7 |66.3 |75.8 |63.4 |60.4 |
| yolov8 |91.9 |94.4 |95.0 |84.1 |89.2 |77.6 |73.4 |68.7 |69.0 |66.5 |
| yunet |96.1 |97.3 |96.0 |84.9 |92.2 |84.0 |79.4 |70.9 |65.8 |65.2 |
| mediapipe |88.6 |95.1 |92.9 |73.2 |93.1 |63.2 |72.5 |78.7 |61.8 |62.2 |
| ssd |85.6 |88.9 |87.0 |75.8 |83.1 |79.1 |76.9 |66.8 |63.4 |62.5 |
| opencv |84.2 |88.2 |87.3 |73.0 |84.4 |83.8 |81.1 |66.4 |65.5 |59.6 |
| skip |64.1 |92.0 |90.6 |56.6 |69.0 |75.1 |81.4 |57.4 |60.8 |60.7 |
### Performance Matrix for Euclidean while alignment is False
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |92.8 |96.1 |95.7 |84.1 |88.3 |83.2 |78.6 |70.8 |67.4 |64.3 |
| mtcnn |92.5 |95.9 |95.5 |81.8 |89.3 |83.2 |76.3 |70.9 |65.9 |63.2 |
| dlib |89.0 |96.0 |94.1 |82.6 |96.3 |65.6 |73.1 |75.9 |61.8 |61.9 |
| yolov8 |90.8 |94.8 |95.2 |83.2 |88.4 |77.6 |71.6 |68.9 |68.2 |66.3 |
| yunet |96.5 |**97.9** |96.3 |84.1 |91.4 |82.7 |78.2 |71.7 |65.5 |65.2 |
| mediapipe |87.1 |94.9 |93.1 |71.1 |91.9 |61.9 |73.2 |77.6 |61.7 |62.4 |
| ssd |94.9 |97.2 |96.7 |83.9 |88.6 |84.9 |82.0 |69.9 |66.7 |64.0 |
| opencv |90.2 |94.1 |95.8 |89.8 |91.2 |91.0 |86.9 |71.1 |68.4 |61.1 |
| skip |64.1 |92.0 |90.6 |56.6 |69.0 |75.1 |81.4 |57.4 |60.8 |60.7 |
### Performance Matrix for L2 normalized Euclidean while alignment is True
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |96.4 |**98.4** |95.8 |96.6 |89.1 |90.5 |92.4 |69.4 |67.7 |64.4 |
| mtcnn |96.8 |**97.6** |95.9 |96.0 |90.0 |89.8 |90.5 |70.2 |66.4 |64.0 |
| dlib |92.6 |97.0 |94.5 |95.1 |96.4 |63.3 |69.8 |75.8 |66.5 |59.5 |
| yolov8 |95.7 |97.3 |95.0 |95.5 |88.8 |88.9 |91.9 |68.7 |67.5 |66.0 |
| yunet |97.4 |**97.9** |96.0 |96.7 |91.6 |89.1 |91.0 |70.9 |66.5 |63.6 |
| mediapipe |90.6 |96.1 |92.9 |90.3 |92.6 |64.4 |75.4 |78.7 |64.7 |63.0 |
| ssd |87.5 |88.7 |87.0 |86.2 |83.3 |82.2 |84.6 |66.8 |64.1 |62.6 |
| opencv |84.8 |87.6 |87.3 |84.6 |84.0 |85.0 |83.6 |66.4 |63.8 |60.9 |
| skip |67.6 |91.4 |90.6 |57.2 |69.3 |78.4 |83.4 |57.4 |62.6 |61.6 |
### Performance Matrix for L2 normalized Euclidean while alignment is False
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |95.9 |**98.0** |95.7 |95.7 |88.4 |89.5 |90.6 |70.8 |67.7 |64.6 |
| mtcnn |96.2 |**97.8** |95.5 |95.9 |89.2 |88.0 |91.1 |70.9 |67.0 |64.0 |
| dlib |89.9 |96.5 |94.1 |93.8 |95.6 |63.0 |75.0 |75.9 |62.6 |61.8 |
| yolov8 |95.8 |**97.7** |95.2 |95.0 |88.1 |88.7 |89.8 |68.9 |68.9 |65.3 |
| yunet |96.8 |**98.3** |96.3 |96.1 |91.7 |88.0 |90.5 |71.7 |67.6 |63.2 |
| mediapipe |90.0 |96.3 |93.1 |89.3 |91.8 |65.6 |74.6 |77.6 |64.9 |61.6 |
| ssd |97.0 |**97.9** |96.7 |96.6 |89.4 |91.5 |93.0 |69.9 |68.7 |64.9 |
| opencv |92.9 |96.2 |95.8 |93.2 |91.5 |93.3 |91.7 |71.1 |68.3 |61.6 |
| skip |67.6 |91.4 |90.6 |57.2 |69.3 |78.4 |83.4 |57.4 |62.6 |61.6 |
### Performance Matrix for Cosine while alignment is True
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |96.4 |**98.4** |95.8 |96.6 |89.1 |90.5 |92.4 |69.4 |67.7 |64.4 |
| mtcnn |96.8 |**97.6** |95.9 |96.0 |90.0 |89.8 |90.5 |70.2 |66.3 |63.0 |
| dlib |92.6 |97.0 |94.5 |95.1 |96.4 |63.3 |69.8 |75.8 |66.5 |58.7 |
| yolov8 |95.7 |97.3 |95.0 |95.5 |88.8 |88.9 |91.9 |68.7 |67.5 |65.9 |
| yunet |97.4 |**97.9** |96.0 |96.7 |91.6 |89.1 |91.0 |70.9 |66.5 |63.5 |
| mediapipe |90.6 |96.1 |92.9 |90.3 |92.6 |64.3 |75.4 |78.7 |64.8 |63.0 |
| ssd |87.5 |88.7 |87.0 |86.2 |83.3 |82.2 |84.5 |66.8 |63.8 |62.6 |
| opencv |84.9 |87.6 |87.2 |84.6 |84.0 |85.0 |83.6 |66.2 |63.7 |60.1 |
| skip |67.6 |91.4 |90.6 |54.8 |69.3 |78.4 |83.4 |57.4 |62.6 |61.1 |
### Performance Matrix for Cosine while alignment is False
| | Facenet |Facenet512 |VGG-Face |ArcFace |Dlib |GhostFaceNet |SFace |OpenFace |DeepFace |DeepID |
| --- | --- | --- | --- | --- | --- | --- | --- | --- | --- | --- |
| retinaface |95.9 |**98.0** |95.7 |95.7 |88.4 |89.5 |90.6 |70.8 |67.7 |63.7 |
| mtcnn |96.2 |**97.8** |95.5 |95.9 |89.2 |88.0 |91.1 |70.9 |67.0 |64.0 |
| dlib |89.9 |96.5 |94.1 |93.8 |95.6 |63.0 |75.0 |75.9 |62.6 |61.7 |
| yolov8 |95.8 |**97.7** |95.2 |95.0 |88.1 |88.7 |89.8 |68.9 |68.9 |65.3 |
| yunet |96.8 |**98.3** |96.3 |96.1 |91.7 |88.0 |90.5 |71.7 |67.6 |63.2 |
| mediapipe |90.0 |96.3 |93.1 |89.3 |91.8 |64.8 |74.6 |77.6 |64.9 |61.6 |
| ssd |97.0 |**97.9** |96.7 |96.6 |89.4 |91.5 |93.0 |69.9 |68.7 |63.8 |
| opencv |92.9 |96.2 |95.8 |93.2 |91.5 |93.3 |91.7 |71.1 |68.1 |61.1 |
| skip |67.6 |91.4 |90.6 |54.8 |69.3 |78.4 |83.4 |57.4 |62.6 |61.1 |

BIN
icon/benchmarks.jpg Normal file

Binary file not shown.

Size: 150 KiB