File size: 1,304 Bytes
1e28fa3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3c47be6
 
1e28fa3
 
 
 
 
 
 
 
 
 
 
aac533a
1a5ca17
8cd9b7d
1e28fa3
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
import gradio as gr
from datasets import load_dataset
import numpy as np
import torch
import torch.nn as nn
from torchvision.transforms import Compose, ColorJitter, ToTensor, RandomPerspective
from transformers import AutoFeatureExtractor, AutoModelForImageClassification


# Load the breed names, one per line. The position of a name in this list is
# the class index it is paired with when predictions are turned into a
# label -> confidence mapping.
# splitlines() is used instead of split('\n') so that a trailing newline at the
# end of the file does not produce a phantom empty label (which would inflate
# num_labels), and so that Windows "\r\n" line endings do not leave a stray
# "\r" on every label.
with open("dogs_labels.txt", "r", encoding="utf-8") as f:
    labels = f.read().splitlines()


# Number of classes known to the app.
num_labels = len(labels)
# Class index (as a string key) -> breed name.
id2label = {str(i): c for i, c in enumerate(labels)}


# Process-wide cache for the (model, feature_extractor) pair so the weights
# and preprocessing config are loaded once rather than on every request.
_CLASSIFIER_CACHE = {}


def _get_model_and_extractor():
    """Return the ``(model, feature_extractor)`` pair, loading it on first use."""
    try:
        return _CLASSIFIER_CACHE["pair"]
    except KeyError:
        pass

    model = AutoModelForImageClassification.from_pretrained(
        pretrained_model_name_or_path="asusevski/vit-dog-classifier"
    )
    model_preprocessor_name = "google/vit-base-patch16-224"
    feature_extractor = AutoFeatureExtractor.from_pretrained(model_preprocessor_name)

    # Store both objects under a single key so a concurrent caller can never
    # observe a half-populated cache.
    _CLASSIFIER_CACHE["pair"] = (model, feature_extractor)
    return _CLASSIFIER_CACHE["pair"]


def classify_image(inp):
    """Classify a dog photo and return a confidence for every known breed.

    Args:
        inp: The image to classify. It must provide ``convert('RGB')``
            (the interface in this file passes a PIL image).

    Returns:
        dict: Maps each entry of the module-level ``labels`` list to the
        softmax probability of the logit at the same index.

    Raises:
        ValueError: If ``inp`` is ``None`` (no image was supplied).
        IndexError: If ``labels`` has more entries than the model has logits.
    """
    if inp is None:
        raise ValueError("No image was provided to classify.")

    model, feature_extractor = _get_model_and_extractor()

    # Force three channels so grayscale / RGBA uploads are handled uniformly.
    pixels = np.array(inp.convert('RGB'))

    # Ask the extractor for a PyTorch tensor directly instead of converting a
    # list of NumPy arrays by hand.
    batch = feature_extractor(images=pixels, return_tensors="pt")['pixel_values']

    # Inference only: skip autograd bookkeeping.
    with torch.no_grad():
        logits = model(batch)['logits']

    # A single image is passed per call, so flattening leaves one score per
    # class; softmax turns the scores into probabilities.
    probs = nn.functional.softmax(torch.flatten(logits), dim=0).tolist()
    return {label: probs[i] for i, label in enumerate(labels)}


# Build the web UI: one image input (handed to classify_image as a PIL image)
# and a label output showing the three highest-confidence classes, with a few
# bundled example pictures.
demo = gr.Interface(
    fn=classify_image,
    inputs=gr.Image(type="pil"),
    outputs=gr.Label(num_top_classes=3),
    title="Dog Breed Classifier!",
    examples=['bordercollie.jpg', 'stbernard.jpg', 'yorkie.jpg'],
)

# Start serving the interface.
demo.launch()