[+] Add some analysis

e3183085 · Victor Demessance · 79a278f2 · e3183085 · e3183085 · e3183085
Commit e3183085 authored 11 months ago by Victor Demessance
--- a/machine_learning/learn.ipynb
+++ b/machine_learning/learn.ipynb
@@ -7,13 +7,6 @@
    "## Entrainement d'un modèle avec la méthode des SVM"
   ]
  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "#### Chargement des données d'entrainement"
-   ]
-  },
  {
   "cell_type": "code",
   "execution_count": 1,
@@ -21,9 +14,16 @@
   "outputs": [],
   "source": [
    "import os\n",
-    "import cv2\n",
    "import numpy as np\n",
-    "import random"
+    "import random\n",
+    "from PIL import Image"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 1) Fonctions de Preprocessing des datasets"
   ]
  },
  {
@@ -32,36 +32,39 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "\"\"\" \n",
+    "AVERAGE_SIZE_IMAGE = (127, 145)  # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels \n",
-    "We will create a dict with all the usefull datas of the training dataset\n",
-    "datas = {\n",
-    "    \"XXXX\" (name of the file) : {\n",
-    "        \"img\" : ndarray of the image,\n",
-    "        \"labels\" (data of the labels): {\n",
-    "            \"X\" index of the label (0,1,...,n) : {\n",
-    "                \"name\" : name of the label,\n",
-    "                \"coord\" : coord of the label like xmin, ymin, xmax, ymax,\n",
-    "                \"img\" : crooped img of the label,\n",
-    "            }\n",
-    "        }\n",
-    "    }\n",
-    "}\n",
-    "\n",
-    "\"\"\"\n",
    "\n",
    "def generate_empty_bbox(image_width, image_height):\n",
-    "    # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels \n",
+    "    \"\"\" \n",
-    "    # Génération de coordonnées aléatoires pour le coin supérieur gauche de la boundebox\n",
+    "    Generate an empty box for images without label\n",
-    "    x_min = random.randint(0, image_width - 127)\n",
+    "    \"\"\"\n",
-    "    y_min = random.randint(0, image_height - 145)\n",
+    "    # Generating random coords for the bbox\n",
+    "    x_min = random.randint(0, image_width - AVERAGE_SIZE_IMAGE[0])\n",
+    "    y_min = random.randint(0, image_height - AVERAGE_SIZE_IMAGE[1])\n",
    "    \n",
-    "    # Calcul des coordonnées du coin inférieur droit de la boundebox\n",
+    "    # Compute complete coords of the bbox\n",
-    "    x_max = x_min + 127\n",
+    "    x_max = x_min + AVERAGE_SIZE_IMAGE[0]\n",
-    "    y_max = y_min + 145\n",
+    "    y_max = y_min + AVERAGE_SIZE_IMAGE[1]\n",
    "    \n",
    "    return (x_min, y_min, x_max, y_max)\n",
    "\n",
    "def load_data(image_dir, label_dir):\n",
+    "    \"\"\" \n",
+    "    Create a dict with all the useful data of the dataset\n",
+    "    datas = {\n",
+    "        \"XXXX\" (name of the file) : {\n",
+    "            \"img\" : image as an array,\n",
+    "            \"labels\" (data of the labels): {\n",
+    "                \"X\" index of the label (0,1,...,n) : {\n",
+    "                    \"name\" : name of the label,\n",
+    "                    \"coord\" : coord of the label like xmin, ymin, xmax, ymax,\n",
+    "                    \"img\" : cropped img of the label,\n",
+    "                }\n",
+    "            }\n",
+    "        }\n",
+    "    }\n",
+    "    \"\"\"\n",
+    "    \n",
    "    datas = {}\n",
    "\n",
    "    for image_file in os.listdir(image_dir):\n",
@@ -71,7 +74,7 @@
    "        label_path = label_dir + '/' + name + '.csv'\n",
    "        \n",
    "        # Import image as array\n",
-    "        image = cv2.imread(image_path)\n",
+    "        image = np.array(Image.open(image_path))\n",
    "\n",
    "        # Import labels as array \n",
    "        with open(label_path, 'r') as file:\n",
@@ -83,7 +86,7 @@
    "                xmin, ymin, xmax, ymax = generate_empty_bbox(image.shape[1], image.shape[0])\n",
    "    \n",
    "                # Get the cropped image (as array) of the label\n",
-    "                cropped_image = image[ymin:ymax, xmin:xmax]\n",
+    "                cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))\n",
    "               \n",
    "                label_data[0] = {\n",
    "                        \"name\":\"empty\",\n",
@@ -101,7 +104,7 @@
    "                    class_name = row[4]\n",
    "\n",
    "                    # Get the cropped image (as array) of the label\n",
-    "                    cropped_image = image[ymin:ymax, xmin:xmax]\n",
+    "                    cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))\n",
    "                    \n",
    "                    # Adding to the json\n",
    "                    label_data[i] = {\n",
@@ -115,7 +118,28 @@
    "             \"labels\" : label_data,\n",
    "        }\n",
    "       \n",
-    "    return datas"
+    "    return datas\n",
+    "\n",
+    "# Dict to convert str class name to int\n",
+    "name_to_int = {\n",
+    "    \"danger\": 0,\n",
+    "    \"interdiction\": 1,\n",
+    "    \"obligation\": 2,\n",
+    "    \"stop\": 3,\n",
+    "    \"ceder\": 4,\n",
+    "    \"frouge\": 5,\n",
+    "    \"forange\": 6,\n",
+    "    \"fvert\": 7,\n",
+    "    \"ff\": 8,\n",
+    "    \"empty\": 9\n",
+    "}"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 2) Fonction de création des datasets"
   ]
  },
  {
@@ -124,9 +148,28 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# Creating the dict of the datas \n",
+    "def create_xy(datas):\n",
+    "    # Creating arrays with all labels datas & classes\n",
+    "    X = []\n",
+    "    Y = []\n",
+    "\n",
+    "    for name, data in datas.items():\n",
+    "        for row in data[\"labels\"].values():\n",
+    "            image_as_array = np.array(row[\"img\"]).flatten()\n",
+    "            X.append(image_as_array)\n",
+    "            Y.append(name_to_int[row[\"name\"]])\n",
+    "\n",
+    "    X = np.array(X)\n",
+    "    Y = np.array(Y)\n",
    "\n",
-    "datas = load_data(\"../data/train/images\", \"../data/train/labels\")"
+    "    return X, Y"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 3) Création des datasets"
   ]
  },
  {
@@ -135,73 +178,115 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "def extract_features(img):\n",
+    "# Training dataset\n",
-    "    # Convertion to gray level\n",
+    "datas_train = load_data(\"../../data/train/images\", \"../../data/train/labels\")\n",
-    "    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)\n",
+    "X_train, Y_train = create_xy(datas=datas_train)\n",
    "\n",
-    "    # Color Hist\n",
+    "# Validation dataset\n",
-    "    hist_color = cv2.calcHist([img], [0, 1, 2], None, [8, 8, 8], [0, 256, 0, 256, 0, 256])\n",
+    "datas_val = load_data(\"../../data/val/images\", \"../../data/val/labels\")\n",
-    "    hist_color = cv2.normalize(hist_color, hist_color).flatten()\n",
+    "X_val, Y_val = create_xy(datas=datas_val)"
-    "    \n",
+   ]
-    "    # Gradient Hist\n",
+  },
-    "    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=5)\n",
+  {
-    "    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=5)\n",
+   "cell_type": "markdown",
-    "    grad_mag = np.sqrt(sobelx**2 + sobely**2)\n",
+   "metadata": {},
-    "    hist_gradient = cv2.calcHist([grad_mag.astype(np.uint8)], [0], None, [16], [0, 256])\n",
+   "source": [
-    "    hist_gradient = cv2.normalize(hist_gradient, hist_gradient).flatten()\n",
+    "### 4) Application de la méthode Adaboost"
-    "    \n",
+   ]
-    "    return np.concatenate((hist_color, hist_gradient))\n",
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "c:\\Users\\victo\\AppData\\Local\\Programs\\Python\\Python312\\Lib\\site-packages\\sklearn\\ensemble\\_weight_boosting.py:519: FutureWarning: The SAMME.R algorithm (the default) is deprecated and will be removed in 1.6. Use the SAMME algorithm to circumvent this warning.\n",
+      "  warnings.warn(\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Taux d'erreur : 0.6302521008403361\n"
+     ]
+    }
+   ],
+   "source": [
+    "from sklearn.ensemble import AdaBoostClassifier\n",
    "\n",
+    "adaboost_clf = AdaBoostClassifier(n_estimators=10) # To change\n",
+    "adaboost_clf.fit(X_train, Y_train)\n",
+    "y = adaboost_clf.predict(X_val)\n",
    "\n",
-    "# Dict to convert str class name to int\n",
+    "print(f\"Taux d'erreur : {np.mean(y != Y_val)}\")"
-    "name_to_int = {\n",
+   ]
-    "    \"danger\": 0,\n",
+  },
-    "    \"interdiction\": 1,\n",
+  {
-    "    \"obligation\": 2,\n",
+   "cell_type": "markdown",
-    "    \"stop\": 3,\n",
+   "metadata": {},
-    "    \"ceder\": 4,\n",
+   "source": [
-    "    \"frouge\": 5,\n",
+    "### 5) Test de la méthode Adaboost avec application des caractéristiques HOG"
-    "    \"forange\": 6,\n",
+   ]
-    "    \"fvert\": 7,\n",
+  },
-    "    \"ff\": 8,\n",
+  {
-    "    \"empty\": 9\n",
+   "cell_type": "code",
-    "}\n",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from skimage.feature import hog\n",
+    "from skimage.color import rgb2gray\n",
+    "\n",
+    "def extract_hog(datas):\n",
+    "    # Creating X array with all HOG information of images\n",
+    "    X = []\n",
+    "\n",
+    "    for name, data in datas.items():\n",
+    "        for row in data[\"labels\"].values():\n",
+    "            image_as_array = np.array(hog(rgb2gray(row[\"img\"]))).flatten()\n",
+    "            X.append(image_as_array)\n",
    "\n",
+    "    return np.array(X)\n",
    "\n",
-    "# Creating arrays with all labels datas & classes\n",
-    "X_train = []\n",
-    "Y_train = []\n",
    "\n",
-    "for name, data in datas.items():\n",
+    "# Update training dataset\n",
-    "    for row in data[\"labels\"].values():\n",
+    "X_train_HOG = extract_hog(datas=datas_train)\n",
-    "        X_train.append(extract_features(row[\"img\"]))\n",
-    "        Y_train.append(name_to_int[row[\"name\"]])\n",
    "\n",
-    "X_train = np.array(X_train)\n",
+    "# Update validation dataset\n",
-    "Y_train = np.array(Y_train)"
+    "X_val_HOG = extract_hog(datas=datas_val)"
   ]
  },
  {
   "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 7,
   "metadata": {},
   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "c:\\Users\\victo\\AppData\\Local\\Programs\\Python\\Python312\\Lib\\site-packages\\sklearn\\ensemble\\_weight_boosting.py:519: FutureWarning: The SAMME.R algorithm (the default) is deprecated and will be removed in 1.6. Use the SAMME algorithm to circumvent this warning.\n",
+      "  warnings.warn(\n"
+     ]
+    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
-      "[1 1 0 ... 1 5 7]\n"
+      "Taux d'erreur : 0.5378151260504201\n"
     ]
    }
   ],
   "source": [
-    "from sklearn import svm\n",
+    "adaboost_clf = AdaBoostClassifier(n_estimators=10)\n",
-    "from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score\n",
+    "adaboost_clf.fit(X_train_HOG, Y_train)\n",
-    "\n",
+    "y_HOG = adaboost_clf.predict(X_val_HOG)\n",
-    "svm_model = svm.SVC(kernel='linear')  # Choix du noyau linéaire\n",
-    "svm_model.fit(X_train, Y_train)\n",
    "\n",
-    "print(svm_model)"
+    "print(f\"Taux d'erreur : {np.mean(y_HOG != Y_val)}\")"
   ]
  }
 ],
@@ -221,7 +306,7 @@
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
-   "version": "3.10.11"
+   "version": "3.12.2"
  }
 },
 "nbformat": 4,

 %% Cell type:markdown id: tags:
 ## Entrainement d'un modèle avec la méthode des SVM
-%% Cell type:markdown id: tags:
-#### Chargement des données d'entrainement
 %% Cell type:code id: tags:
 ``` python
 import os
-import cv2
 import numpy as np
 import random
+from PIL import Image
 ```
+%% Cell type:markdown id: tags:
+### 1) Fonctions de Preprocessing des datasets
 %% Cell type:code id: tags:
 ``` python
-"""
+AVERAGE_SIZE_IMAGE = (127, 145)  # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels
-We will create a dict with all the usefull datas of the training dataset
-datas = {
-    "XXXX" (name of the file) : {
-        "img" : ndarray of the image,
-        "labels" (data of the labels): {
-            "X" index of the label (0,1,...,n) : {
-                "name" : name of the label,
-                "coord" : coord of the label like xmin, ymin, xmax, ymax,
-                "img" : crooped img of the label,
-            }
-        }
-    }
-}
-"""
 def generate_empty_bbox(image_width, image_height):
-    # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels
+    """
-    # Génération de coordonnées aléatoires pour le coin supérieur gauche de la boundebox
+    Generate an empty box for images without label
-    x_min = random.randint(0, image_width - 127)
+    """
-    y_min = random.randint(0, image_height - 145)
+    # Generating random coords for the bbox
+    x_min = random.randint(0, image_width - AVERAGE_SIZE_IMAGE[0])
-    # Calcul des coordonnées du coin inférieur droit de la boundebox
+    y_min = random.randint(0, image_height - AVERAGE_SIZE_IMAGE[1])
-    x_max = x_min + 127
-    y_max = y_min + 145
+    # Compute complete coords of the bbox
+    x_max = x_min + AVERAGE_SIZE_IMAGE[0]
+    y_max = y_min + AVERAGE_SIZE_IMAGE[1]
    return (x_min, y_min, x_max, y_max)
 def load_data(image_dir, label_dir):
+    """
+    Create a dict with all the useful data of the dataset
+    datas = {
+        "XXXX" (name of the file) : {
+            "img" : image as an array,
+            "labels" (data of the labels): {
+                "X" index of the label (0,1,...,n) : {
+                    "name" : name of the label,
+                    "coord" : coord of the label like xmin, ymin, xmax, ymax,
+                    "img" : cropped img of the label,
+                }
+            }
+        }
+    }
+    """
    datas = {}
    for image_file in os.listdir(image_dir):
        # Computing name and files paths
        image_path = image_dir + '/' + image_file
        name = image_file.split('.')[0]
        label_path = label_dir + '/' + name + '.csv'
        # Import image as array
-        image = cv2.imread(image_path)
+        image = np.array(Image.open(image_path))
        # Import labels as array
        with open(label_path, 'r') as file:
            rows = file.readlines()
            label_data = {}
            if rows == ['\n']:  # Create a random empty label to balance model
                # Create random coords for empty label
                xmin, ymin, xmax, ymax = generate_empty_bbox(image.shape[1], image.shape[0])
                # Get the cropped image (as array) of the label
-                cropped_image = image[ymin:ymax, xmin:xmax]
+                cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))
                label_data[0] = {
                        "name":"empty",
                        "coord": (xmin, ymin, xmax, ymax),
                        "img":cropped_image
                    }
            else:
                for i, row in enumerate(rows):  # One image can contain several labels
                    row = row.strip().split(",")
                    # Compute coords of the label
                    xmin, ymin, xmax, ymax = map(int, row[0:4])
                    # Get the label name
                    class_name = row[4]
                    # Get the cropped image (as array) of the label
-                    cropped_image = image[ymin:ymax, xmin:xmax]
+                    cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))
                    # Adding to the json
                    label_data[i] = {
                        "name":class_name,
                        "coord": (xmin, ymin, xmax, ymax),
                        "img":cropped_image
                    }
        datas[name] = {
             "img" : image,
             "labels" : label_data,
        }
    return datas
+# Dict to convert str class name to int
+name_to_int = {
+    "danger": 0,
+    "interdiction": 1,
+    "obligation": 2,
+    "stop": 3,
+    "ceder": 4,
+    "frouge": 5,
+    "forange": 6,
+    "fvert": 7,
+    "ff": 8,
+    "empty": 9
+}
 ```
+%% Cell type:markdown id: tags:
+### 2) Fonction de création des datasets
 %% Cell type:code id: tags:
 ``` python
-# Creating the dict of the datas
+def create_xy(datas):
+    # Creating arrays with all labels datas & classes
+    X = []
+    Y = []
+    for name, data in datas.items():
+        for row in data["labels"].values():
+            image_as_array = np.array(row["img"]).flatten()
+            X.append(image_as_array)
+            Y.append(name_to_int[row["name"]])
+    X = np.array(X)
+    Y = np.array(Y)
+    return X, Y
+```
-datas = load_data("../data/train/images", "../data/train/labels")
+%% Cell type:markdown id: tags:
+### 3) Création des datasets
+%% Cell type:code id: tags:
+``` python
+# Training dataset
+datas_train = load_data("../../data/train/images", "../../data/train/labels")
+X_train, Y_train = create_xy(datas=datas_train)
+# Validation dataset
+datas_val = load_data("../../data/val/images", "../../data/val/labels")
+X_val, Y_val = create_xy(datas=datas_val)
 ```
+%% Cell type:markdown id: tags:
+### 4) Application de la méthode Adaboost
 %% Cell type:code id: tags:
 ``` python
-def extract_features(img):
+from sklearn.ensemble import AdaBoostClassifier
-    # Convertion to gray level
-    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
-    # Color Hist
+adaboost_clf = AdaBoostClassifier(n_estimators=10) # To change
-    hist_color = cv2.calcHist([img], [0, 1, 2], None, [8, 8, 8], [0, 256, 0, 256, 0, 256])
+adaboost_clf.fit(X_train, Y_train)
-    hist_color = cv2.normalize(hist_color, hist_color).flatten()
+y = adaboost_clf.predict(X_val)
-    # Gradient Hist
+print(f"Taux d'erreur : {np.mean(y != Y_val)}")
-    sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0, ksize=5)
+```
-    sobely = cv2.Sobel(gray, cv2.CV_64F, 0, 1, ksize=5)
-    grad_mag = np.sqrt(sobelx**2 + sobely**2)
-    hist_gradient = cv2.calcHist([grad_mag.astype(np.uint8)], [0], None, [16], [0, 256])
-    hist_gradient = cv2.normalize(hist_gradient, hist_gradient).flatten()
-    return np.concatenate((hist_color, hist_gradient))
+%% Output
+    c:\Users\victo\AppData\Local\Programs\Python\Python312\Lib\site-packages\sklearn\ensemble\_weight_boosting.py:519: FutureWarning: The SAMME.R algorithm (the default) is deprecated and will be removed in 1.6. Use the SAMME algorithm to circumvent this warning.
+      warnings.warn(
-# Dict to convert str class name to int
+    Taux d'erreur : 0.6302521008403361
-name_to_int = {
-    "danger": 0,
-    "interdiction": 1,
-    "obligation": 2,
-    "stop": 3,
-    "ceder": 4,
-    "frouge": 5,
-    "forange": 6,
-    "fvert": 7,
-    "ff": 8,
-    "empty": 9
-}
+%% Cell type:markdown id: tags:
-# Creating arrays with all labels datas & classes
+### 5) Test de la méthode Adaboost avec application des caractéristiques HOG
-X_train = []
-Y_train = []
-for name, data in datas.items():
+%% Cell type:code id: tags:
-    for row in data["labels"].values():
-        X_train.append(extract_features(row["img"]))
-        Y_train.append(name_to_int[row["name"]])
-X_train = np.array(X_train)
+``` python
-Y_train = np.array(Y_train)
+from skimage.feature import hog
+from skimage.color import rgb2gray
+def extract_hog(datas):
+    # Creating X array with all HOG information of images
+    X = []
+    for name, data in datas.items():
+        for row in data["labels"].values():
+            image_as_array = np.array(hog(rgb2gray(row["img"]))).flatten()
+            X.append(image_as_array)
+    return np.array(X)
+# Update training dataset
+X_train_HOG = extract_hog(datas=datas_train)
+# Update validation dataset
+X_val_HOG = extract_hog(datas=datas_val)
 ```
 %% Cell type:code id: tags:
 ``` python
-from sklearn import svm
+adaboost_clf = AdaBoostClassifier(n_estimators=10)
-from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score
+adaboost_clf.fit(X_train_HOG, Y_train)
+y_HOG = adaboost_clf.predict(X_val_HOG)
-svm_model = svm.SVC(kernel='linear')  # Choix du noyau linéaire
+print(f"Taux d'erreur : {np.mean(y_HOG != Y_val)}")
-svm_model.fit(X_train, Y_train)
-print(svm_model)
 ```
 %% Output
-    [1 1 0 ... 1 5 7]
+    c:\Users\victo\AppData\Local\Programs\Python\Python312\Lib\site-packages\sklearn\ensemble\_weight_boosting.py:519: FutureWarning: The SAMME.R algorithm (the default) is deprecated and will be removed in 1.6. Use the SAMME algorithm to circumvent this warning.
+      warnings.warn(
+    Taux d'erreur : 0.5378151260504201

--- a/machine_learning/classification/RandomForest.ipynb
+++ b/machine_learning/classification/RandomForest.ipynb
--- a/machine_learning/classification/SVM.ipynb
+++ b/machine_learning/classification/SVM.ipynb
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Entrainement d'un modèle avec la méthode des SVM"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import numpy as np\n",
+    "import random\n",
+    "from PIL import Image"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 1) Fonctions de Preprocessing des datasets"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 21,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "AVERAGE_SIZE_IMAGE = (127, 145)  # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels \n",
+    "\n",
+    "def generate_empty_bbox(image_width, image_height):\n",
+    "    \"\"\" \n",
+    "    Generate an empty box for images without label\n",
+    "    \"\"\"\n",
+    "    # Generating random coords for the bbox\n",
+    "    x_min = random.randint(0, image_width - AVERAGE_SIZE_IMAGE[0])\n",
+    "    y_min = random.randint(0, image_height - AVERAGE_SIZE_IMAGE[1])\n",
+    "    \n",
+    "    # Compute complete coords of the bbox\n",
+    "    x_max = x_min + AVERAGE_SIZE_IMAGE[0]\n",
+    "    y_max = y_min + AVERAGE_SIZE_IMAGE[1]\n",
+    "    \n",
+    "    return (x_min, y_min, x_max, y_max)\n",
+    "\n",
+    "def load_data(image_dir, label_dir):\n",
+    "    \"\"\" \n",
+    "    Create a dict with all the useful data of the dataset\n",
+    "    datas = {\n",
+    "        \"XXXX\" (name of the file) : {\n",
+    "            \"img\" : image as an array,\n",
+    "            \"labels\" (data of the labels): {\n",
+    "                \"X\" index of the label (0,1,...,n) : {\n",
+    "                    \"name\" : name of the label,\n",
+    "                    \"coord\" : coord of the label like xmin, ymin, xmax, ymax,\n",
+    "                    \"img\" : cropped img of the label,\n",
+    "                }\n",
+    "            }\n",
+    "        }\n",
+    "    }\n",
+    "    \"\"\"\n",
+    "    \n",
+    "    datas = {}\n",
+    "\n",
+    "    for image_file in os.listdir(image_dir):\n",
+    "        # Computing name and files paths\n",
+    "        image_path = image_dir + '/' + image_file\n",
+    "        name = image_file.split('.')[0]\n",
+    "        label_path = label_dir + '/' + name + '.csv'\n",
+    "        \n",
+    "        # Import image as array\n",
+    "        image = np.array(Image.open(image_path))\n",
+    "\n",
+    "        # Import labels as array \n",
+    "        with open(label_path, 'r') as file:\n",
+    "            rows = file.readlines()\n",
+    "\n",
+    "            label_data = {}\n",
+    "            if rows == ['\\n']:  # Create a random empty label to balance model\n",
+    "                # Create random coords for empty label\n",
+    "                xmin, ymin, xmax, ymax = generate_empty_bbox(image.shape[1], image.shape[0])\n",
+    "    \n",
+    "                # Get the cropped image (as array) of the label\n",
+    "                cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))\n",
+    "               \n",
+    "                label_data[0] = {\n",
+    "                        \"name\":\"empty\",\n",
+    "                        \"coord\": (xmin, ymin, xmax, ymax),\n",
+    "                        \"img\":cropped_image\n",
+    "                    }\n",
+    "            else:\n",
+    "                for i, row in enumerate(rows):  # One image can contain several labels\n",
+    "                    row = row.strip().split(\",\")\n",
+    "\n",
+    "                    # Compute coords of the label\n",
+    "                    xmin, ymin, xmax, ymax = map(int, row[0:4])\n",
+    "\n",
+    "                    # Get the label name\n",
+    "                    class_name = row[4]\n",
+    "\n",
+    "                    # Get the cropped image (as array) of the label\n",
+    "                    cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))\n",
+    "                    \n",
+    "                    # Adding to the json\n",
+    "                    label_data[i] = {\n",
+    "                        \"name\":class_name,\n",
+    "                        \"coord\": (xmin, ymin, xmax, ymax),\n",
+    "                        \"img\":cropped_image\n",
+    "                    }\n",
+    "\n",
+    "        datas[name] = {\n",
+    "             \"img\" : image,\n",
+    "             \"labels\" : label_data,\n",
+    "        }\n",
+    "       \n",
+    "    return datas\n",
+    "\n",
+    "# Dict to convert str class name to int\n",
+    "name_to_int = {\n",
+    "    \"danger\": 0,\n",
+    "    \"interdiction\": 1,\n",
+    "    \"obligation\": 2,\n",
+    "    \"stop\": 3,\n",
+    "    \"ceder\": 4,\n",
+    "    \"frouge\": 5,\n",
+    "    \"forange\": 6,\n",
+    "    \"fvert\": 7,\n",
+    "    \"ff\": 8,\n",
+    "    \"empty\": 9\n",
+    "}"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 2) Fonction de création des datasets"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 22,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_xy(datas):\n",
+    "    # Creating arrays with all labels datas & classes\n",
+    "    X = []\n",
+    "    Y = []\n",
+    "\n",
+    "    for name, data in datas.items():\n",
+    "        for row in data[\"labels\"].values():\n",
+    "            image_as_array = np.array(row[\"img\"]).flatten()\n",
+    "            X.append(image_as_array)\n",
+    "            Y.append(name_to_int[row[\"name\"]])\n",
+    "\n",
+    "    X = np.array(X)\n",
+    "    Y = np.array(Y)\n",
+    "\n",
+    "    return X, Y"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 3) Création des datasets"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 23,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Training dataset\n",
+    "datas_train = load_data(\"../../data/train/images\", \"../../data/train/labels\")\n",
+    "X_train, Y_train = create_xy(datas=datas_train)\n",
+    "\n",
+    "# Validation dataset\n",
+    "datas_val = load_data(\"../../data/val/images\", \"../../data/val/labels\")\n",
+    "X_val, Y_val = create_xy(datas=datas_val)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 4) Application de la méthode des SVM"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Taux d'erreur : 0.226890756302521\n"
+     ]
+    }
+   ],
+   "source": [
+    "from sklearn import svm\n",
+    "\n",
+    "svm_model = svm.SVC(kernel='linear') \n",
+    "svm_model.fit(X_train, Y_train)\n",
+    "y = svm_model.predict(X_val)\n",
+    "\n",
+    "print(f\"Taux d'erreur : {np.mean(y != Y_val)}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 5) Test de la méthode SVM avec application des caractéristiques HOG"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 27,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from skimage.feature import hog\n",
+    "from skimage.color import rgb2gray\n",
+    "\n",
+    "def extract_hog(datas):\n",
+    "    # Creating X array with all HOG information of images\n",
+    "    X = []\n",
+    "\n",
+    "    for name, data in datas.items():\n",
+    "        for row in data[\"labels\"].values():\n",
+    "            image_as_array = np.array(hog(rgb2gray(row[\"img\"]))).flatten()\n",
+    "            X.append(image_as_array)\n",
+    "\n",
+    "    return np.array(X)\n",
+    "\n",
+    "\n",
+    "# Update training dataset\n",
+    "X_train_HOG = extract_hog(datas=datas_train)\n",
+    "\n",
+    "# Update validation dataset\n",
+    "X_val_HOG = extract_hog(datas=datas_val)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 28,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Taux d'erreur : 0.15966386554621848\n"
+     ]
+    }
+   ],
+   "source": [
+    "svm_model = svm.SVC(kernel='linear') \n",
+    "svm_model.fit(X_train_HOG, Y_train)\n",
+    "y_HOG = svm_model.predict(X_val_HOG)\n",
+    "\n",
+    "print(f\"Taux d'erreur : {np.mean(y_HOG != Y_val)}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### 6) Test de la méthode SVM avec application des LBP"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 34,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "c:\\Users\\victo\\AppData\\Local\\Programs\\Python\\Python312\\Lib\\site-packages\\skimage\\feature\\texture.py:360: UserWarning: Applying `local_binary_pattern` to floating-point images may give unexpected results when small numerical differences between adjacent pixels are present. It is recommended to use this function with images of integer dtype.\n",
+      "  warnings.warn(\n"
+     ]
+    },
+    {
+     "ename": "ValueError",
+     "evalue": "setting an array element with a sequence. The requested array has an inhomogeneous shape after 1 dimensions. The detected shape was (1071,) + inhomogeneous part.",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[1;31mValueError\u001b[0m                                Traceback (most recent call last)",
+      "Cell \u001b[1;32mIn[34], line 17\u001b[0m\n\u001b[0;32m     13\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m np\u001b[38;5;241m.\u001b[39marray(X)\n\u001b[0;32m     16\u001b[0m \u001b[38;5;66;03m# Update training dataset\u001b[39;00m\n\u001b[1;32m---> 17\u001b[0m X_train_LBP \u001b[38;5;241m=\u001b[39m \u001b[43mextract_LBP\u001b[49m\u001b[43m(\u001b[49m\u001b[43mdatas\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdatas_train\u001b[49m\u001b[43m)\u001b[49m\n\u001b[0;32m     19\u001b[0m \u001b[38;5;66;03m# Update validation dataset\u001b[39;00m\n\u001b[0;32m     20\u001b[0m X_val_LBP \u001b[38;5;241m=\u001b[39m extract_LBP(datas\u001b[38;5;241m=\u001b[39mdatas_val)\n",
+      "Cell \u001b[1;32mIn[34], line 13\u001b[0m, in \u001b[0;36mextract_LBP\u001b[1;34m(datas)\u001b[0m\n\u001b[0;32m     10\u001b[0m         image_as_array \u001b[38;5;241m=\u001b[39m np\u001b[38;5;241m.\u001b[39marray(hog(local_binary_pattern(rgb2gray(data[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mimg\u001b[39m\u001b[38;5;124m\"\u001b[39m]), P \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m8\u001b[39m, R \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m)))\u001b[38;5;241m.\u001b[39mflatten()\n\u001b[0;32m     11\u001b[0m         X\u001b[38;5;241m.\u001b[39mappend(image_as_array)\n\u001b[1;32m---> 13\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mnp\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43marray\u001b[49m\u001b[43m(\u001b[49m\u001b[43mX\u001b[49m\u001b[43m)\u001b[49m\n",
+      "\u001b[1;31mValueError\u001b[0m: setting an array element with a sequence. The requested array has an inhomogeneous shape after 1 dimensions. The detected shape was (1071,) + inhomogeneous part."
+     ]
+    }
+   ],
+   "source": [
+    "import cv2\n",
+    "\n",
+    "def extract_SIFT(datas):\n",
+    "    # Creating X array with all HOG information of images\n",
+    "    X = []\n",
+    "    sift = cv2.SIFT_create()\n",
+    "\n",
+    "    for name, data in datas.items():\n",
+    "        for row in data[\"labels\"].values():\n",
+    "            gray_image = cv2.cvtColor(data[\"img\"], cv2.COLOR_RGB2GRAY)\n",
+    "            keypoints, descriptors = sift.detectAndCompute(gray_image, None)\n",
+    "            if descriptors is not None:\n",
+    "                X.append(descriptors.flatten())\n",
+    "\n",
+    "    return np.array(X)\n",
+    "\n",
+    "\n",
+    "# Update training dataset\n",
+    "X_train_LBP = extract_SIFT(datas=datas_train)\n",
+    "\n",
+    "# Update validation dataset\n",
+    "X_val_LBP = extract_SIFT(datas=datas_val)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "svm_model = svm.SVC(kernel='linear') \n",
+    "svm_model.fit(X_train_LBP, Y_train)\n",
+    "y_LBP = svm_model.predict(X_val_LBP)\n",
+    "\n",
+    "print(f\"Taux d'erreur : {np.mean(y_LBP != Y_val)}\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.2"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
+%% Cell type:markdown id: tags:
+## Entrainement d'un modèle avec la méthode des SVM
+%% Cell type:code id: tags:
+``` python
+import os
+import numpy as np
+import random
+from PIL import Image
+```
+%% Cell type:markdown id: tags:
+### 1) Fonctions de Preprocessing des datasets
+%% Cell type:code id: tags:
+``` python
+AVERAGE_SIZE_IMAGE = (127, 145)  # Thanks to the stats, we know that size of bbox will be (127, 145) -> Average size of labels
+def generate_empty_bbox(image_width, image_height):
+    """
+    Generate an empty box for images without label
+    """
+    # Generating random coords for the bbox
+    x_min = random.randint(0, image_width - AVERAGE_SIZE_IMAGE[0])
+    y_min = random.randint(0, image_height - AVERAGE_SIZE_IMAGE[1])
+    # Compute complete coords of the bbox
+    x_max = x_min + AVERAGE_SIZE_IMAGE[0]
+    y_max = y_min + AVERAGE_SIZE_IMAGE[1]
+    return (x_min, y_min, x_max, y_max)
+def load_data(image_dir, label_dir):
+    """
+    Create a dict with all the usefull datas of the dataset
+    datas = {
+        "XXXX" (name of the file) : {
+            "img" : image as an array,
+            "labels" (data of the labels): {
+                "X" index of the label (0,1,...,n) : {
+                    "name" : name of the label,
+                    "coord" : coord of the label like xmin, ymin, xmax, ymax,
+                    "img" : crooped img of the label,
+                }
+            }
+        }
+    }
+    """
+    datas = {}
+    for image_file in os.listdir(image_dir):
+        # Computing name and files paths
+        image_path = image_dir + '/' + image_file
+        name = image_file.split('.')[0]
+        label_path = label_dir + '/' + name + '.csv'
+        # Import image as array
+        image = np.array(Image.open(image_path))
+        # Import labels as array
+        with open(label_path, 'r') as file:
+            rows = file.readlines()
+            label_data = {}
+            if rows == ['\n']:  # Create a random empty label to balance model
+                # Create random coords for empty label
+                xmin, ymin, xmax, ymax = generate_empty_bbox(image.shape[1], image.shape[0])
+                # Get the cropped image (as array) of the label
+                cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))
+                label_data[0] = {
+                        "name":"empty",
+                        "coord": (xmin, ymin, xmax, ymax),
+                        "img":cropped_image
+                    }
+            else:
+                for i, row in enumerate(rows):  # One image can contain several labels
+                    row = row.strip().split(",")
+                    # Compute coords of the label
+                    xmin, ymin, xmax, ymax = map(int, row[0:4])
+                    # Get the label name
+                    class_name = row[4]
+                    # Get the cropped image (as array) of the label
+                    cropped_image = np.array(Image.fromarray(image[ymin:ymax, xmin:xmax]).resize(AVERAGE_SIZE_IMAGE))
+                    # Adding to the json
+                    label_data[i] = {
+                        "name":class_name,
+                        "coord": (xmin, ymin, xmax, ymax),
+                        "img":cropped_image
+                    }
+        datas[name] = {
+             "img" : image,
+             "labels" : label_data,
+        }
+    return datas
+# Dict to convert str class name to int
+name_to_int = {
+    "danger": 0,
+    "interdiction": 1,
+    "obligation": 2,
+    "stop": 3,
+    "ceder": 4,
+    "frouge": 5,
+    "forange": 6,
+    "fvert": 7,
+    "ff": 8,
+    "empty": 9
+}
+```
+%% Cell type:markdown id: tags:
+### 2) Fonction de création des datasets
+%% Cell type:code id: tags:
+``` python
+def create_xy(datas):
+    # Creating arrays with all labels datas & classes
+    X = []
+    Y = []
+    for name, data in datas.items():
+        for row in data["labels"].values():
+            image_as_array = np.array(row["img"]).flatten()
+            X.append(image_as_array)
+            Y.append(name_to_int[row["name"]])
+    X = np.array(X)
+    Y = np.array(Y)
+    return X, Y
+```
+%% Cell type:markdown id: tags:
+### 3) Création des datasets
+%% Cell type:code id: tags:
+``` python
+# Training dataset
+datas_train = load_data("../../data/train/images", "../../data/train/labels")
+X_train, Y_train = create_xy(datas=datas_train)
+# Validation dataset
+datas_val = load_data("../../data/val/images", "../../data/val/labels")
+X_val, Y_val = create_xy(datas=datas_val)
+```
+%% Cell type:markdown id: tags:
+### 4) Application de la méthode des SVM
+%% Cell type:code id: tags:
+``` python
+from sklearn import svm
+svm_model = svm.SVC(kernel='linear')
+svm_model.fit(X_train, Y_train)
+y = svm_model.predict(X_val)
+print(f"Taux d'erreur : {np.mean(y != Y_val)}")
+```
+%% Output
+    Taux d'erreur : 0.226890756302521
+%% Cell type:markdown id: tags:
+### 5) Test de la méthode SVM avec application des caractéristiques HOG
+%% Cell type:code id: tags:
+``` python
+from skimage.feature import hog
+from skimage.color import rgb2gray
+def extract_hog(datas):
+    # Creating X array with all HOG information of images
+    X = []
+    for name, data in datas.items():
+        for row in data["labels"].values():
+            image_as_array = np.array(hog(rgb2gray(row["img"]))).flatten()
+            X.append(image_as_array)
+    return np.array(X)
+# Update training dataset
+X_train_HOG = extract_hog(datas=datas_train)
+# Update validation dataset
+X_val_HOG = extract_hog(datas=datas_val)
+```
+%% Cell type:code id: tags:
+``` python
+svm_model = svm.SVC(kernel='linear')
+svm_model.fit(X_train_HOG, Y_train)
+y_HOG = svm_model.predict(X_val_HOG)
+print(f"Taux d'erreur : {np.mean(y_HOG != Y_val)}")
+```
+%% Output
+    Taux d'erreur : 0.15966386554621848
+%% Cell type:markdown id: tags:
+### 6) Test de la méthode SVM avec application des descripteurs SIFT
+%% Cell type:code id: tags:
+``` python
+import cv2
+def extract_SIFT(datas):
+    # Creating X array with all HOG information of images
+    X = []
+    sift = cv2.SIFT_create()
+    for name, data in datas.items():
+        for row in data["labels"].values():
+            gray_image = cv2.cvtColor(data["img"], cv2.COLOR_RGB2GRAY)
+            keypoints, descriptors = sift.detectAndCompute(gray_image, None)
+            if descriptors is not None:
+                X.append(descriptors.flatten())
+    return np.array(X)
+# Update training dataset
+X_train_LBP = extract_SIFT(datas=datas_train)
+# Update validation dataset
+X_val_LBP = extract_SIFT(datas=datas_val)
+```
+%% Output
+    c:\Users\victo\AppData\Local\Programs\Python\Python312\Lib\site-packages\skimage\feature\texture.py:360: UserWarning: Applying `local_binary_pattern` to floating-point images may give unexpected results when small numerical differences between adjacent pixels are present. It is recommended to use this function with images of integer dtype.
+      warnings.warn(
+    ---------------------------------------------------------------------------
+    ValueError                                Traceback (most recent call last)
+Cell     In[34], line 17
+         13     return np.array(X)
+         16 # Update training dataset
+    ---> 17 X_train_LBP = extract_LBP(datas=datas_train)
+         19 # Update validation dataset
+         20 X_val_LBP = extract_LBP(datas=datas_val)
+Cell     In[34], line 13, in extract_LBP(datas)
+         10         image_as_array = np.array(hog(local_binary_pattern(rgb2gray(data["img"]), P = 8, R = 1))).flatten()
+         11         X.append(image_as_array)
+    ---> 13 return np.array(X)
+    ValueError: setting an array element with a sequence. The requested array has an inhomogeneous shape after 1 dimensions. The detected shape was (1071,) + inhomogeneous part.
+%% Cell type:code id: tags:
+``` python
+svm_model = svm.SVC(kernel='linear')
+svm_model.fit(X_train_LBP, Y_train)
+y_LBP = svm_model.predict(X_val_LBP)
+print(f"Taux d'erreur : {np.mean(y_LBP != Y_val)}")
+```