lombardata committed
Commit 9d241a6
1 Parent(s): f5a10fc

Update app.py

Files changed (1)
  1. app.py +40 -43
app.py CHANGED
@@ -1,14 +1,26 @@
-import numpy as np
-import gradio as gr
 import torch
-from transformers import Dinov2Config, Dinov2Model, Dinov2ForImageClassification, AutoImageProcessor
-import torch.nn as nn
-import os
-import json
+from transformers import AutoImageProcessor, Dinov2ForImageClassification, Dinov2Config, Dinov2Model
+from PIL import Image
+import gradio as gr
 from huggingface_hub import hf_hub_download
+import json
+import torch.nn as nn
+import numpy as np
 
 # DEFINE MODEL NAME
 model_name = "DinoVdeau-large-2024_04_03-with_data_aug_batch-size32_epochs150_freeze"
+checkpoint_name = "lombardata/" + model_name
+
+# Load the model configuration and create the model
+config_path = hf_hub_download(repo_id=checkpoint_name, filename="config.json")
+with open(config_path, 'r') as config_file:
+    config = json.load(config_file)
+id2label = config["id2label"]
+label2id = config["label2id"]
+image_size = config["image_size"]
+num_labels = len(id2label)
+
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 # IMPORT CLASSIFICATION MODEL
 def create_head(num_features , number_classes ,dropout_prob=0.5 ,activation_func =nn.ReLU):
@@ -21,7 +33,6 @@ def create_head(num_features , number_classes ,dropout_prob=0.5 ,activation_func
     if dropout_prob !=0 : layers.append(nn.Dropout(dropout_prob))
     layers.append(nn.Linear(features_lst[-1] , number_classes))
     return nn.Sequential(*layers)
-from transformers import Dinov2Config, Dinov2Model
 
 class NewheadDinov2ForImageClassification(Dinov2ForImageClassification):
     def __init__(self, config: Dinov2Config) -> None:
@@ -30,55 +41,41 @@ class NewheadDinov2ForImageClassification(Dinov2ForImageClassification):
         # Classifier head
         self.classifier = create_head(config.hidden_size * 2, config.num_labels)
 
-checkpoint_name = "lombardata/" + model_name
 model = NewheadDinov2ForImageClassification.from_pretrained(checkpoint_name)
-
-# IMPORT MODEL CONFIG PARAMETERS
-config_path = hf_hub_download(repo_id=checkpoint_name, filename="config.json")
-# Opening JSON file
-config_file = open(config_path)
-# returns JSON object as
-config = json.load(config_file)
-# import parameters
-id2label = config["id2label"]
-label2id = config["label2id"]
-image_size = config["image_size"]
-classes_names = list(label2id.keys())
-
-# PREDICTIONS
+model.to(device)
 def sigmoid(_outputs):
     return 1.0 / (1.0 + np.exp(-_outputs))
+
+def predict(image, threshold):
+    # Preprocess the image
+    processor = AutoImageProcessor.from_pretrained(checkpoint_name)
+    inputs = processor(images=image, return_tensors="pt").to(device)
 
-def predict(input_image):
-    image_processor = AutoImageProcessor.from_pretrained(checkpoint_name)
-    # predict
-    inputs = image_processor(input_image, return_tensors="pt")
-    inputs = inputs
+    # Get model predictions
     with torch.no_grad():
        model_outputs = model(**inputs)
-    outputs = model_outputs["logits"][0]
-    scores = sigmoid(outputs)
-    result = {}
-    i = 0
-    for score in scores:
-        label = classes_names[i]
-        result[label] = float(score)
-        i += 1
-    result = {key: result[key] for key in result if result[key] > 0.5}
-    return result
-
+    logits = model_outputs.logits[0]
+    probabilities = torch.sigmoid(logits).cpu().numpy()  # Convert to probabilities
+
+    # Create a dictionary of label scores
+    results = {id2label[str(i)]: float(prob) for i, prob in enumerate(probabilities)}
+
+    # Filter out predictions below a certain threshold (e.g., 0.5)
+    filtered_results = {label: prob for label, prob in results.items() if prob > threshold}
+
+    return filtered_results
+
 # Define style
 title = "Victor - DinoVd'eau image classification"
 model_link = "https://huggingface.co/" + checkpoint_name
 description = f"This application showcases the capability of artificial intelligence-based systems to identify objects within underwater images. To utilize it, you can either upload your own image or select one of the provided examples for analysis.\nFor predictions, we use this [open-source model]({model_link})"
 
-gr.Interface(
+iface = gr.Interface(
     fn=predict,
-    inputs=gr.Image(shape=(image_size, image_size)),
-    outputs="label",
+    inputs=[gr.components.Image(type="pil"), gr.components.Slider(minimum=0, maximum=1, value=0.5, label="Threshold")],
+    outputs=gr.components.Label(),
     title=title,
-    description=description,
     examples=["session_GOPR0106.JPG",
               "session_2021_08_30_Mayotte_10_image_00066.jpg",
               "session_2018_11_17_kite_Le_Morne_Manawa_G0065777.JPG",
-              "session_2023_06_28_caplahoussaye_plancha_body_v1B_00_GP1_3_1327.jpeg"]).launch()
+              "session_2023_06_28_caplahoussaye_plancha_body_v1B_00_GP1_3_1327.jpeg"]).launch()