Ehsa commited on
Commit
d68cbdc
·
1 Parent(s): b982d7b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +51 -16
app.py CHANGED
@@ -1,29 +1,64 @@
 
 
 
1
  import gradio as gr
2
- from transformers import ViTFeatureExtractor, ViTForImageClassification
3
 
4
- import torch
5
 
6
 
 
 
 
 
 
 
 
 
 
 
 
7
 
8
- feature_extractor = ViTFeatureExtractor.from_pretrained("google/vit-base-patch16-224")
 
 
 
 
 
 
 
 
9
 
10
- model = ViTForImageClassification.from_pretrained("google/vit-base-patch16-224")
 
 
 
11
 
12
- inputs = feature_extractor(image, return_tensors="pt")
 
 
 
13
 
14
- with torch.no_grad():
 
 
 
 
 
 
 
 
15
 
16
- logits = model(**inputs).logits
 
17
 
18
- # model predicts one of the 1000 ImageNet classes
 
19
 
20
- predicted_label = logits.argmax(-1).item()
21
 
22
- print(model.config.id2label[predicted_label])
 
 
23
 
24
- gr.Interface.load(
25
- inference,
26
- theme="default",
27
- examples=[["alligator.jpg"], ["laptop.jpg"]],
28
- css=".footer{display:none !important}",
29
- title=None).launch()
 
1
+ import torch
2
+ from PIL import Image
3
+ from torchvision import transforms
4
  import gradio as gr
5
+ import os
6
 
7
+ os.system("wget https://raw.githubusercontent.com/pytorch/hub/master/imagenet_classes.txt")
8
 
9
 
10
+ import torch
11
+ model = torch.hub.load('pytorch/vision:v0.10.0', 'resnet18', pretrained=True)
12
+ # or any of these variants
13
+ # model = torch.hub.load('pytorch/vision:v0.10.0', 'resnet34', pretrained=True)
14
+ # model = torch.hub.load('pytorch/vision:v0.10.0', 'resnet50', pretrained=True)
15
+ # model = torch.hub.load('pytorch/vision:v0.10.0', 'resnet101', pretrained=True)
16
+ # model = torch.hub.load('pytorch/vision:v0.10.0', 'resnet152', pretrained=True)
17
+ model.eval()
18
+
19
+ # Download an example image from the pytorch website
20
+ torch.hub.download_url_to_file("https://github.com/pytorch/hub/raw/master/images/dog.jpg", "dog.jpg")
21
 
22
+ def inference(input_image):
23
+ preprocess = transforms.Compose([
24
+ transforms.Resize(256),
25
+ transforms.CenterCrop(224),
26
+ transforms.ToTensor(),
27
+ transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
28
+ ])
29
+ input_tensor = preprocess(input_image)
30
+ input_batch = input_tensor.unsqueeze(0) # create a mini-batch as expected by the model
31
 
32
+ # move the input and model to GPU for speed if available
33
+ if torch.cuda.is_available():
34
+ input_batch = input_batch.to('cuda')
35
+ model.to('cuda')
36
 
37
+ with torch.no_grad():
38
+ output = model(input_batch)
39
+ # The output has unnormalized scores. To get probabilities, you can run a softmax on it.
40
+ probabilities = torch.nn.functional.softmax(output[0], dim=0)
41
 
42
+ # Read the categories
43
+ with open("imagenet_classes.txt", "r") as f:
44
+ categories = [s.strip() for s in f.readlines()]
45
+ # Show top categories per image
46
+ top5_prob, top5_catid = torch.topk(probabilities, 5)
47
+ result = {}
48
+ for i in range(top5_prob.size(0)):
49
+ result[categories[top5_catid[i]]] = top5_prob[i].item()
50
+ return result
51
 
52
+ inputs = gr.inputs.Image(type='pil')
53
+ outputs = gr.outputs.Label(type="confidences",num_top_classes=5)
54
 
55
+ title = "ResNet"
56
+ description = "Gradio demo for ResNet, Deep residual networks pre-trained on ImageNet. To use it, simply upload your image, or click one of the examples to load them. Read more at the links below."
57
 
58
+ article = "<p style='text-align: center'><a href='https://arxiv.org/abs/1512.03385' target='_blank'>Deep Residual Learning for Image Recognition</a> | <a href='https://github.com/pytorch/vision/blob/main/torchvision/models/resnet.py' target='_blank'>Github Repo</a></p>"
59
 
60
+ examples = [
61
+ ['dog.jpg']
62
+ ]
63
 
64
+ gr.Interface(inference, inputs, outputs, title=title, description=description, article=article, examples=examples, analytics_enabled=False).launch()