import os

import gradio as gr
import torch
from torchvision.datasets import CIFAR100
from transformers import CLIPModel, CLIPProcessor

model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")
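# CLIPProcessor bundles the model's tokenizer (for the text prompts) with its
# image preprocessing (resize, center-crop, normalize), so plain strings and
# raw images can be passed straight to `model(**inputs)`.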

cifar100 = CIFAR100(root=os.path.expanduser("~/.cache"), download=True, train=False)
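# The test split is loaded mainly for its 100 class names; the images are not
# required at inference time but are handy for local spot checks.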

# Zero-shot CLIP scores images against text prompts; a template such as
# "a photo of a {c}" tends to work better than a bare class name.
prompts = [f"a photo of a {c}" for c in cifar100.classes]



def send_inputs(img):
    # Score the image against every class prompt in a single batch.
    inputs = processor(text=prompts, images=img, return_tensors="pt", padding=True)
    with torch.no_grad():
        outputs = model(**inputs)
    # Softmax over the 100 image-text similarity logits gives class probabilities.
    probs = outputs.logits_per_image.softmax(dim=1).squeeze(0)
    # Gradio's Label component expects a {class_name: confidence} mapping.
    return {c: probs[i].item() for i, c in enumerate(cifar100.classes)}


if __name__ == "__main__":
    # A Label output renders the class probabilities as ranked confidence bars.
    gr.Interface(fn=send_inputs, inputs="image", outputs=gr.Label(num_top_classes=5)).launch()
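
# Quick sanity check without launching the UI (a minimal sketch; it reuses the
# CIFAR-100 test split downloaded above):
#
#   img, label = cifar100[0]   # torchvision returns a (PIL.Image, int) pair
#   scores = send_inputs(img)
#   top = max(scores, key=scores.get)
#   print(f"predicted {top!r}, actual {cifar100.classes[label]!r}")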