Merge pull request #69 from Flippchen/dev

Flippchen · web-flow · commit e3bfb9a12434 · 2023-08-17T01:25:20.000+02:00
Dev
diff --git a/README.md b/README.md
@@ -63,11 +63,26 @@ To see the architecture of the Local App UI, click the arrow below.
 <img alt="Architecture of the Web UI" src="assets/architecture.png"  height="400">
 </details>
 
+### Experimental Ensemble Models 🧪
+To improve accuracy and prediction capabilities, I have experimented with two ensemble models. Ensemble models combine predictions from multiple models to give a final verdict, which often results in better prediction accuracy. These ensemble models are still in the experimental phase and can be found in the [ensemble](web_ui/main_ensemble.py).
+
+1. Car Type Ensemble Model (weighted average)
+    - Description: Trained two models on the same objective. Each with its on strengths and weaknesses. The results get weighted (correct weights through intensive testing). The models also differ in model architecture. 
+    - Achievements:
+      - More balanced predictions
+      - Better prediction accuracy
+2. Car Type hierarchy with car series (specific car type) (weighted average)
+    - Description: Created a hierarchy of models. The first models predicts the car type. The second model predicts the car series. After this the results get aligned with the car type model.
+    - Achievements:
+      - much less outlier predictions
+      - better prediction accuracy
+      
+They can be found at [PorscheInsight-Ensemble](https://classify.autos/classify-ensemble).
+
 ### ToDos
 
 - [ ] Experiment with EfficientNet-Lite4
 - [ ] Retrain all models with better dataset
-- [ ] Build an ensemble model with car_type and car_series
 - [ ] Switch to Google Cloud function/use S3 bucket/compress image
 - [ ] Improve pre_filter model/Use Grounded SAM
 - [ ] Add Taycans to images/models
@@ -99,6 +114,7 @@ To see the architecture of the Local App UI, click the arrow below.
 - [x] Try autokeras
 - [x] Improve model predictions overall
 - [x] Evaluate feature engineering/ More data augmentation
+- [x] Build an ensemble model with car_type and car_series
 
 </details>
 
diff --git a/utilities/class_names.py b/utilities/class_names.py
@@ -11,11 +11,47 @@
                       'Cayman_2013', 'Cayman_2014', 'Cayman_2015', 'Cayman_2016', 'Macan_2014', 'Macan_2015', 'Macan_2016', 'Macan_2017', 'Macan_2018', 'Macan_2019', 'Panamera_2009', 'Panamera_2010',
                       'Panamera_2011', 'Panamera_2012', 'Panamera_2013', 'Panamera_2014', 'Panamera_2015', 'Panamera_2016', 'Panamera_2017', 'Panamera_2018', 'Panamera_2019']
 
-MODEL_VARIANTS = ['911_930', '911_964', '911_991', '911_991_Facelift', '911_992', '911_996_Facelift', '911_997', '911_997_Facelift', '918_Spyderr_1_Generation', 'Boxster_981', 'Boxster_982',
-                  'Boxster_986', 'Boxster_987_Facelift', 'Boxter_986_Facelift', 'Boxter_987', 'Carrera_GT_980', 'Cayenne_955', 'Cayenne_955_Facelift', 'Cayenne_958', 'Cayenne_958_Facelift',
+MODEL_VARIANTS = ['911_930', '911_964', '911_991', '911_991_Facelift', '911_992', '911_996_Facelift', '911_997', '911_997_Facelift', '918_Spyder_1_Generation', 'Boxster_981', 'Boxster_982',
+                  'Boxster_986', 'Boxster_987_Facelift', 'Boxster_986_Facelift', 'Boxter_987', 'Carrera_GT_980', 'Cayenne_955', 'Cayenne_955_Facelift', 'Cayenne_958', 'Cayenne_958_Facelift',
                   'Cayenne_9YA', 'Cayman_981C', 'Cayman_982C', 'Cayman_987C', 'Cayman_987_Facelift', 'Macan_95B', 'Macan_95B_Facelift', 'Panamera_970', 'Panamera_970_Facelift', 'Panamera_971']
 
 PRE_FILTER = ['other', 'other_car_brand', 'porsche']
+HIERARCHY = {
+    '911': [
+        '911_930', '911_964', '911_991', '911_991_Facelift', '911_992',
+        '911_996_Facelift', '911_997', '911_997_Facelift'
+    ],
+    '918': [
+        '918_Spyder_1_Generation'
+    ],
+    'Boxster': [
+        'Boxster_981', 'Boxster_982', 'Boxster_986', 'Boxster_987_Facelift',
+        'Boxster_986_Facelift', 'Boxster_987'
+    ],
+    'Carrera GT': [
+        'Carrera_GT_980'
+    ],
+    'Cayenne': [
+        'Cayenne_955', 'Cayenne_955_Facelift', 'Cayenne_958',
+        'Cayenne_958_Facelift', 'Cayenne_9YA'
+    ],
+    'Cayman': [
+        'Cayman_981C', 'Cayman_982C', 'Cayman_987C', 'Cayman_987_Facelift'
+    ],
+    'Macan': [
+        'Macan_95B', 'Macan_95B_Facelift'
+    ],
+    'Panamera': [
+        'Panamera_970', 'Panamera_970_Facelift', 'Panamera_971'
+    ],
+    '718 Cayman': [
+        'Cayman_981C', 'Cayman_982C', 'Cayman_987C', 'Cayman_987_Facelift'
+    ],
+    '718 Boxster': [
+        'Boxster_981', 'Boxster_982', 'Boxster_986', 'Boxster_987_Facelift',
+        'Boxster_986_Facelift', 'Boxster_987'
+    ]
+}
 
 
 def get_classes_for_model(name: str) -> List[str]:
diff --git a/web_ui/build_requirements.txt b/web_ui/build_requirements.txt
@@ -2,6 +2,6 @@
 eel~=0.16.0
 pooch==1.7.0
 numpy==1.23.5
-Pillow==9.5.0
+Pillow==10.0.0
 rembg~=2.0.32
-onnxruntime==1.14.1
+onnxruntime==1.15.1
diff --git a/web_ui/main.py b/web_ui/main.py
@@ -116,22 +116,27 @@ def prepare_image(image_data: Image, target_size: Tuple, remove_background: bool
     return img_array, mask
 
 
-def get_top_3_predictions(prediction: np.ndarray, model_name: str) -> List[Tuple[str, float]]:
+def get_top_n_predictions(prediction: np.ndarray, model_name: str, n: int = 3) -> List[Tuple[str, float]]:
     """
-    Get top 3 predictions from the model output.
+    Get top n predictions from the model output.
 
     Args:
         prediction (np.ndarray): Output prediction from a model.
         model_name (str): Name of the model that produced the prediction.
+        n (int, optional): Number of top predictions to retrieve. Defaults to 3.
 
     Returns:
-        List[Tuple[str, float]]: A list of top 3 predictions along with their respective scores.
+        List[Tuple[str, float]]: A list of top n predictions along with their respective scores.
     """
 
-    top_3 = prediction[0].argsort()[-3:][::-1]
+    # Ensure that n does not exceed the total number of classes
+    n = min(n, prediction[0].shape[0])
+
+    top_n_indices = prediction[0].argsort()[-n:][::-1]
     classes = get_classes_for_model(model_name)
-    top_3 = [(classes[i], round(prediction[0][i] * 100, 2)) for i in top_3]
-    return top_3
+    top_n_predictions = [(classes[i], round(prediction[0][i] * 100, 2)) for i in top_n_indices]
+
+    return top_n_predictions
 
 
 def get_pre_filter_prediction(image_data: np.ndarray, model_name: str):
@@ -153,7 +158,7 @@ def get_pre_filter_prediction(image_data: np.ndarray, model_name: str):
         models[model_name] = load_model(model_name)
     input_name = models[model_name].get_inputs()[0].name
     prediction = models[model_name].run(None, {input_name: image_data})
-    filter_names = get_top_3_predictions(prediction[0], "pre_filter")
+    filter_names = get_top_n_predictions(prediction[0], "pre_filter")
     return filter_names
 
 
@@ -215,7 +220,7 @@ def classify_image(image_data: str, model_name: str, show_mask: bool = False) ->
     prediction = model.run(None, {input_name: filter_image})
 
     # Retrieving the top 3 predictions
-    top_3_predictions = get_top_3_predictions(prediction[0], model_name)
+    top_3_predictions = get_top_n_predictions(prediction[0], model_name)
 
     return (top_3_predictions, mask_base64) if show_mask else [top_3_predictions]
 
diff --git a/web_ui/main_ensemble.py b/web_ui/main_ensemble.py
@@ -14,7 +14,7 @@
 from io import BytesIO
 from PIL import Image
 
-from utilities.class_names import get_classes_for_model
+from utilities.class_names import get_classes_for_model, HIERARCHY
 from utilities.prepare_images import replace_background, resize_and_pad_image, fix_image, convert_mask
 import pooch
 from rembg import new_session
@@ -25,7 +25,6 @@
     "all_specific_model_variants": None,
     "specific_model_variants": None,
     "pre_filter": None,
-    "car_type_2": None,
 }
 
 # Initiate session
@@ -142,22 +141,27 @@ def prepare_image(image_data: Image, target_size: Tuple, remove_background: bool
     return img_array, mask
 
 
-def get_top_3_predictions(prediction: np.ndarray, model_name: str) -> List[Tuple[str, float]]:
+def get_top_n_predictions(prediction: np.ndarray, model_name: str, n: int = 3) -> List[Tuple[str, float]]:
     """
-    Get top 3 predictions from the model output.
+    Get top n predictions from the model output.
 
     Args:
         prediction (np.ndarray): Output prediction from a model.
         model_name (str): Name of the model that produced the prediction.
+        n (int, optional): Number of top predictions to retrieve. Defaults to 3.
 
     Returns:
-        List[Tuple[str, float]]: A list of top 3 predictions along with their respective scores.
+        List[Tuple[str, float]]: A list of top n predictions along with their respective scores.
     """
 
-    top_3 = prediction[0].argsort()[-3:][::-1]
+    # Ensure that n does not exceed the total number of classes
+    n = min(n, prediction[0].shape[0])
+
+    top_n_indices = prediction[0].argsort()[-n:][::-1]
     classes = get_classes_for_model(model_name)
-    top_3 = [(classes[i], round(prediction[0][i] * 100, 2)) for i in top_3]
-    return top_3
+    top_n_predictions = [(classes[i], round(prediction[0][i] * 100, 2)) for i in top_n_indices]
+
+    return top_n_predictions
 
 
 def get_pre_filter_prediction(image_data: np.ndarray, model_name: str):
@@ -179,7 +183,7 @@ def get_pre_filter_prediction(image_data: np.ndarray, model_name: str):
         models[model_name] = load_model(model_name)
     input_name = models[model_name].get_inputs()[0].name
     prediction = models[model_name].run(None, {input_name: image_data})
-    filter_names = get_top_3_predictions(prediction[0], "pre_filter")
+    filter_names = get_top_n_predictions(prediction[0], "pre_filter")
     return filter_names
 
 
@@ -247,18 +251,83 @@ def classify_image(image_data: str, model_name: str, show_mask: bool = False) ->
     if pre_filter_predictions[0][0] != "porsche":
         return (pre_filter_predictions, mask_base64) if show_mask else [pre_filter_predictions]
 
-    if model_name != "car_type":
+    if model_name != "car_type" and model_name != "specific_model_variants":
+        input_name = model.get_inputs()[0].name
+        prediction = model.run(None, {input_name: filter_image})
+    elif model_name == "specific_model_variants":
+        if models["car_type"] is None:
+            models["car_type"] = load_model("car_type")
+
+        # Hierarchical prediction
+        pre_prediction = ensemble_predictions_weighted(models["car_type"], filter_image)
+        top_pre_prediction = get_top_n_predictions(pre_prediction[0], "car_type", 8)
+
+        # Run the specific model
         input_name = model.get_inputs()[0].name
         prediction = model.run(None, {input_name: filter_image})
+        top_prediction = get_top_n_predictions(prediction[0], "specific_model_variants", 25)
+
+        # Adjust the top_prediction based on top_pre_prediction and hierarchy
+        all_adjusted_predictions = []
+
+        for car_type, car_type_possibility in top_pre_prediction:
+            # Initialize an empty list for each car_type to store its adjusted predictions
+            car_type_adjusted_predictions = []
+
+            # Normalize the car_type_possibility
+            normalized_car_type_possibility = car_type_possibility / 100.0
+
+            # Fetch the possible series based on hierarchy
+            possible_series = HIERARCHY.get(car_type, [])
+
+            # Check if any of the series from the top_prediction belongs to possible_series
+            for car_series, car_series_possibility in top_prediction:
+                if car_series in possible_series:
+                    normalized_car_series_possibility = car_series_possibility / 100.0
+                    # Multiply the normalized possibilities
+                    adjusted_possibility_normalized = 0.6 * normalized_car_series_possibility + 0.4 * normalized_car_type_possibility
+                    # Convert back to the 1-100 scale
+                    adjusted_possibility = adjusted_possibility_normalized * 100
+                    car_type_adjusted_predictions.append((car_series, adjusted_possibility))
+
+            # Sort the predictions for this car_type
+            car_type_adjusted_predictions = sorted(car_type_adjusted_predictions, key=lambda x: x[1], reverse=True)
+
+            # Append them to the overall list
+            all_adjusted_predictions.extend(car_type_adjusted_predictions)
+
+        # Get top 3 predictions
+        top_3_predictions = all_adjusted_predictions[:3]
+
+        return (top_3_predictions, mask_base64) if show_mask else [top_3_predictions]
     else:
-        # prediction = ensemble_predictions_weighted(model, filter_image)
         prediction = ensemble_predictions_weighted(model, filter_image)
 
     # Retrieving the top 3 predictions
-    top_3_predictions = get_top_3_predictions(prediction[0], model_name)
+    top_3_predictions = get_top_n_predictions(prediction[0], model_name)
 
     return (top_3_predictions, mask_base64) if show_mask else [top_3_predictions]
 
 
 eel.init("web")
 eel.start("index.html", size=(1000, 800), mode="default")
+
+
+"""How the car_type/car_series ensemble works:
+
+Incorporating Hierarchical Predictions for Porsche Images
+
+Hierarchy Setup:
+
+Create a mapping between 'car type' (e.g., Macan, 911) and 'car series' (e.g., 911_991, Macan_95B).
+Prediction Process:
+
+Get the top predictions for 'car type' using Model 1.
+Predict 'car series' using Model 2.
+Adjustment:
+
+For each 'car type' from Model 1:
+Filter 'car series' predictions of Model 2 that align with the hierarchy.
+Adjust the probabilities of these 'car series' predictions based on 'car type' probability.
+Sort and combine the adjusted predictions.
+"""