Spaces:

diegopacheco
/

diego-llm-img-to-lbl

Running

App Files Files Community

diegopacheco committed on May 7, 2024

Commit

f5b4b81

1 Parent(s): 0b5b4b1

app v1

Browse files

Files changed (9) hide show

README.md +14 -8
app.py +60 -0
bear.jpg +0 -0
boat.jpg +0 -0
install-deps.sh +3 -0
puppy.jpg +0 -0
requirements.txt +17 -0
result.png +0 -0
run.sh +3 -0

README.md CHANGED Viewed

@@ -1,13 +1,19 @@
 ---
-title: Diego Llm Img To Lbl
-emoji: 🚀
-colorFrom: green
-colorTo: pink
 sdk: gradio
-sdk_version: 4.29.0
 app_file: app.py
-pinned: false
-license: unlicense
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Diego's LLM Image to Labeled Image
+emoji: 🖼️
 sdk: gradio
+sdk_version: 4.24.0
+license: cc-by-nc-sa-4.0
+short_description: Diego's LLM Image to Labeled Image. Classify an image and draw the label on the image.
+colorFrom: green
+colorTo: black
 app_file: app.py
 ---
+### Result
+* Given an image
+* Will detect what the image is
+* Print the label and the score on the image
+* Uses the Vision Transformer (ViT) model google/vit-base-patch16-224
+<img src='result.png' />

app.py ADDED Viewed

	@@ -0,0 +1,60 @@

+from PIL import Image
+import requests
+from transformers import ViTFeatureExtractor, ViTForImageClassification
+import matplotlib.pyplot as plt
+import matplotlib.patches as patches
+import gradio as gr
+import numpy as np
+def classify_and_label_image(image_array):
+    # Convert numpy array to PIL Image
+    image = Image.fromarray(np.uint8(image_array))
+    # Load pre-trained model and feature extractor
+    model = ViTForImageClassification.from_pretrained('google/vit-base-patch16-224')
+    feature_extractor = ViTFeatureExtractor.from_pretrained('google/vit-base-patch16-224')
+    # Preprocess the image
+    inputs = feature_extractor(images=image, return_tensors="pt")
+    # Make prediction
+    outputs = model(**inputs)
+    logits = outputs.logits
+    predicted_class_idx = logits.argmax(-1).item()
+    # Get label of the predicted class
+    labels = model.config.id2label
+    predicted_class_label = labels[predicted_class_idx]
+    # Calculate prediction probability
+    probabilities = logits.softmax(dim=-1)
+    predicted_class_prob = probabilities[0, predicted_class_idx].item()
+    # Draw bounding box and label on the image
+    fig, ax = plt.subplots()
+    ax.imshow(image)
+    rect = patches.Rectangle((50, 50), 100, 100, linewidth=1, edgecolor='r', facecolor='none')
+    ax.add_patch(rect)
+    plt.text(50, 40, f'{predicted_class_label} {predicted_class_prob * 100:.2f}%', color='r')
+    # Convert the figure to a numpy array
+    fig.canvas.draw()
+    img_arr = np.array(fig.canvas.renderer.buffer_rgba())
+    # Close the figure to free up memory
+    plt.close(fig)
+    # Return the image array
+    return img_arr
+examples = [
+    ["bear.jpg"],
+    ["puppy.jpg"],
+    ["boat.jpg"]
+]
+gr.Interface(fn=classify_and_label_image, title="Diego's LLM Image to Labeled Image",
+                                          description="Classify an image and draw the label on the image.",
+                                          examples=examples,
+                                          inputs="image",
+                                          outputs="image")\
+.launch(share=False, server_port=8080)

bear.jpg ADDED Viewed

boat.jpg ADDED Viewed

install-deps.sh ADDED Viewed

	@@ -0,0 +1,3 @@


1	+ #!/bin/bash
2	+ # Install the Python packages listed in requirements.txt.
3	+ /bin/pip install -r requirements.txt

puppy.jpg ADDED Viewed

requirements.txt ADDED Viewed

	@@ -0,0 +1,17 @@

+numpy
+transformers
+sentence-transformers
+seaborn
+torch
+torchvision
+matplotlib
+pandas
+scikit-learn
+nltk
+gensim
+tensorflow
+keras
+opencv-python
+fastapi
+uvicorn
+gradio

result.png ADDED Viewed

run.sh ADDED Viewed

	@@ -0,0 +1,3 @@


1	+ #!/bin/bash
2	+ # Start the Gradio app; app.py is the entry point declared in README.md (app_file).
3	+ /bin/python app.py