Spaces:

wgetdd
/

CIFAR_Custom_Resnet

Sleeping

App Files Files Community

wgetdd committed on Aug 2, 2023

Commit

9e78939

•

1 Parent(s): 35313b8

Inference Code for trained model

Browse files

Files changed (2) hide show

gradio_app.py +54 -0
utils.py +151 -0

gradio_app.py ADDED Viewed

	@@ -0,0 +1,54 @@

+import gradio as gr
+from torchvision import transforms
+import torch
+from utils import CustomResnet, main_inference, get_misclassified_images, get_gradcam
+# Inverse of Normalize(mean=0.50, std=0.23): maps x to 0.23 * x + 0.50.
+# NOTE(review): not referenced anywhere in this script; kept so the module
+# namespace stays unchanged.
+inv_normalize = transforms.Normalize(
+    mean=[-0.50/0.23, -0.50/0.23, -0.50/0.23],
+    std=[1/0.23, 1/0.23, 1/0.23]
+)
+model = CustomResnet()
+classes = ('plane', 'car', 'bird', 'cat', 'deer',
+           'dog', 'frog', 'horse', 'ship', 'truck')
+targets = None
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+model.to(device)
+# NOTE(review): no checkpoint is loaded here, so the model runs with its
+# random initial weights -- a model.load_state_dict(...) call looks missing;
+# confirm the checkpoint path and add it.
+# Inference must run in eval mode: otherwise BatchNorm normalizes each request
+# with the statistics of that single image instead of its running statistics.
+model.eval()
+# Define the input and output components of the Gradio app
+input_component = gr.inputs.Image(shape=(32, 32))
+num_of_output_classes = gr.inputs.Slider(minimum=0, maximum=10, default=5, step=1,label="Top class count")
+# Adding a checkbox to the interface to show/hide misclassified images
+show_misclassified_checkbox = gr.inputs.Checkbox(default=False, label="Show Misclassified Images")
+# Input field to specify the number of misclassified images to display
+num_images_input = gr.inputs.Slider(minimum=0, maximum=20, default=15, step=5,label="Missclassified Images Count")
+# Adding a checkbox to the interface to show/hide GradCAM output
+show_gradcam_checkbox = gr.inputs.Checkbox(default=False, label="Show GradCAM Output")
+# Slider for adjusting the opacity of the GradCAM overlay
+opacity_slider = gr.inputs.Slider(minimum=0, maximum=1, default=0.7,step=0.1,    label="GradCAM Opacity")
+
+
+def predict(image, num_of_output_classes, show_misclassified, num_images, show_gradcam, opacity):
+    """Gradio callback: produce the three outputs shown by the interface.
+
+    Returns a list of [class confidences, misclassified-examples image or
+    None, GradCAM overlay or None]; the two optional images are only computed
+    when their checkbox is ticked.
+    """
+    return [
+        main_inference(num_of_output_classes, classes, model, image),
+        get_misclassified_images(show_misclassified, num_images) if show_misclassified else None,
+        get_gradcam(model, image, opacity) if show_gradcam else None,
+    ]
+
+
+gr.Interface(
+    fn=predict,
+    inputs=[input_component, num_of_output_classes,show_misclassified_checkbox, num_images_input, show_gradcam_checkbox, opacity_slider],
+    outputs=[gr.outputs.Label(), gr.Image(shape=(500, 500)), gr.Image(shape=(500, 500))],
+    # Each example row follows the order of `inputs`:
+    # image path, top class count, show misclassified, misclassified count,
+    # show GradCAM, GradCAM opacity.
+    examples=[
+        ["example_images/example_1.png",5,True,5,True,0.2],  # You can provide your own example input values here
+        ["example_images/example_2.png",5,False,5,True,0.3],
+        ["example_images/example_3.png",5,True,15,False,0.2],
+        ["example_images/example_4.png",5,True,20,True,0.5],
+        ["example_images/example_5.png",5,False,5,False,0.2],
+        ["example_images/example_6.png",5,True,10,True,0.3],
+        ["example_images/example_7.png",5,True,5,True,0.4],
+        ["example_images/example_8.png",5,False,5,False,0.6],
+        ["example_images/example_9.png",5,True,20,False,0.2],
+        ["example_images/example_10.png",5,False,5,True,0.7],
+    ],
+    layout="horizontal"
+).launch()

utils.py ADDED Viewed

	@@ -0,0 +1,151 @@

+import torch.nn as nn
+import torch.nn.functional as F
+import torch
+from torchvision import transforms
+import cv2
+import numpy as np
+from pytorch_grad_cam import GradCAM
+from pytorch_grad_cam import GradCAM
+from pytorch_grad_cam.utils.image import show_cam_on_image
+def apply_normalization(chennels):
+    """Return a fresh ``nn.BatchNorm2d`` layer sized for ``chennels`` feature maps.
+
+    Single place where the network's normalization layer type is chosen.
+    """
+    norm_layer = nn.BatchNorm2d(num_features=chennels)
+    return norm_layer
+class CustomResnet(nn.Module):
+    """ResNet-style CNN with two residual blocks and a 10-way classifier head.
+
+    Data flow (see ``forward``): preplayer -> convlayer1 -> (+ reslayer1)
+    -> convlayer2 -> convlayer3 -> (+ reslayer2) -> maxpool3 -> linear1.
+    Every convolution is 3x3 with stride 1 and padding 1, so only the
+    max-pool layers change the spatial size.
+
+    NOTE: the attribute names and the order of layers inside each
+    ``nn.Sequential`` determine the state-dict keys and are indexed from
+    outside the class (``convlayer3[-2]``); do not rename or reorder them.
+    """
+
+    def __init__(self):
+        super().__init__()
+        # PrepLayer: Conv 3x3 (s1, p1) >> BN >> ReLU, 3 -> 64 channels
+        self.preplayer = nn.Sequential(
+            nn.Conv2d(3, 64, (3, 3), padding=1, stride=1, bias=False),
+            apply_normalization(64),
+            nn.ReLU(),
+        )
+        # Layer1: Conv 3x3 (s1, p1) >> MaxPool2D >> BN >> ReLU, 64 -> 128 channels
+        self.convlayer1 = nn.Sequential(
+            nn.Conv2d(64, 128, (3, 3), padding=1, stride=1, bias=False),
+            nn.MaxPool2d(2, 2),
+            apply_normalization(128),
+            nn.ReLU(),
+        )
+        # R1: residual branch (Conv-BN-ReLU-Conv-BN-ReLU), 128 -> 128 channels
+        self.reslayer1 = nn.Sequential(
+            nn.Conv2d(128, 128, (3, 3), padding=1, stride=1, bias=False),
+            apply_normalization(128),
+            nn.ReLU(),
+            nn.Conv2d(128, 128, (3, 3), padding=1, stride=1, bias=False),
+            apply_normalization(128),
+            nn.ReLU(),
+        )
+        # Layer2: Conv 3x3 (s1, p1) >> MaxPool2D >> BN >> ReLU, 128 -> 256 channels
+        self.convlayer2 = nn.Sequential(
+            nn.Conv2d(128, 256, (3, 3), padding=1, stride=1, bias=False),
+            nn.MaxPool2d(2, 2),
+            apply_normalization(256),
+            nn.ReLU(),
+        )
+        # Layer3: Conv 3x3 (s1, p1) >> MaxPool2D >> BN >> ReLU, 256 -> 512 channels
+        self.convlayer3 = nn.Sequential(
+            nn.Conv2d(256, 512, (3, 3), padding=1, stride=1, bias=False),
+            nn.MaxPool2d(2, 2),
+            apply_normalization(512),
+            nn.ReLU(),
+        )
+        # R2: residual branch (Conv-BN-ReLU-Conv-BN-ReLU), 512 -> 512 channels
+        self.reslayer2 = nn.Sequential(
+            nn.Conv2d(512, 512, (3, 3), padding=1, stride=1, bias=False),
+            apply_normalization(512),
+            nn.ReLU(),
+            nn.Conv2d(512, 512, (3, 3), padding=1, stride=1, bias=False),
+            apply_normalization(512),
+            nn.ReLU(),
+        )
+        # Kernel 4, stride 2: collapses a 4x4 feature map to 1x1
+        self.maxpool3 = nn.MaxPool2d(4, 2)
+        self.linear1 = nn.Linear(512,10)
+
+    def forward(self,x):
+        """Return log-probabilities of shape (batch, 10) for an image batch.
+
+        ``x`` is a (batch, 3, H, W) tensor. With H = W = 32 the three 2x2
+        pools give a 4x4 map that ``maxpool3`` reduces to 1x1, which is what
+        the 512-input linear layer requires.
+        """
+        x = self.preplayer(x)
+        x1 = self.convlayer1(x)
+        x2 = self.reslayer1(x1)
+        x = x1+x2  # first skip connection
+        x = self.convlayer2(x)
+        x = self.convlayer3(x)
+        x1 = self.reslayer2(x)
+        x = x+x1  # second skip connection
+        x = self.maxpool3(x)
+        # Flatten per sample. Unlike view(-1, 512) this never folds spatial
+        # positions into the batch axis: an unsupported input size raises a
+        # shape error in linear1 instead of silently changing the batch size.
+        x = torch.flatten(x, 1)
+        x = self.linear1(x)
+        return F.log_softmax(x, dim=-1)
+# Function to compute a Grad-CAM heatmap overlay for an input image
+def get_gradcam(model,input_img, opacity):
+    """Return the input image blended with its Grad-CAM heatmap.
+
+    Args:
+        model: network exposing ``convlayer3``; the second-to-last module of
+            that block is used as the Grad-CAM target layer.
+        input_img: image accepted by ``transforms.ToTensor`` (PIL image or
+            HxWxC ndarray).
+        opacity: forwarded to ``show_cam_on_image`` as ``image_weight``.
+
+    Returns:
+        The array produced by ``show_cam_on_image`` (RGB channel order).
+    """
+    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    input_tensor = transforms.ToTensor()(input_img).unsqueeze(0).to(device)
+    # NOTE(review): the tensor is fed to the model without mean/std
+    # normalization -- confirm this matches how the model was trained.
+    target_layers = [model.convlayer3[-2]]
+    # Only request CUDA when it is actually available, so the app also works
+    # on CPU-only hosts. The context manager releases the hooks GradCAM
+    # registers on the model once the heatmap has been computed.
+    with GradCAM(model=model, target_layers=target_layers,
+                 use_cuda=(device.type == 'cuda')) as cam:
+        # targets=None is passed through unchanged from the original call;
+        # the library then picks the target class itself.
+        grayscale_cam = cam(input_tensor=input_tensor, targets=None)[0, :]
+    # Use the un-normalized image as the background. Applying an inverse
+    # normalization to a tensor that was never normalized (as before) only
+    # compresses it to 0.23 * x + 0.5 and washes the picture out.
+    rgb_img = input_tensor.squeeze(0).detach().cpu().permute(1, 2, 0).numpy()
+    return show_cam_on_image(rgb_img, grayscale_cam, use_rgb=True, image_weight=opacity)
+def get_misclassified_images(show_misclassified,num):
+    """Load the pre-rendered grid of ``num`` misclassified images.
+
+    Args:
+        show_misclassified: when falsy nothing is loaded and ``None`` is returned.
+        num: number of images in the grid; selects the file
+            ``missclassified_images_examples/<num>_missclassified.png``.
+
+    Returns:
+        The image as an RGB ndarray, or ``None`` when display is disabled or
+        the file cannot be read.
+    """
+    if not show_misclassified:
+        return None
+    image = cv2.imread(f"missclassified_images_examples/{int(num)}_missclassified.png")
+    if image is None:
+        # cv2.imread signals a missing/unreadable file by returning None
+        return None
+    # OpenCV loads images as BGR; convert to RGB so colours display correctly
+    return cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+def main_inference(num_of_output_classes,classes,model,input_img):
+    """Classify one image and return its highest-confidence classes.
+
+    Args:
+        num_of_output_classes: how many classes to report; converted to int
+            and clamped to the range [0, number of classes].
+        classes: sequence of class names indexed by model output position.
+        model: classifier returning one score per class for a batch of one.
+        input_img: image accepted by ``transforms.ToTensor`` (PIL image or
+            HxWxC ndarray).
+
+    Returns:
+        Dict mapping class name to probability, ordered from most to least
+        likely.
+    """
+    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    input_tensor = transforms.ToTensor()(input_img).unsqueeze(0).to(device)
+    # NOTE(review): the tensor is fed to the model without mean/std
+    # normalization -- confirm this matches how the model was trained.
+    with torch.no_grad():  # no gradients are needed for plain inference
+        # softmax gives probabilities for logits and log-probabilities alike
+        probabilities = torch.softmax(model(input_tensor).flatten(), dim=0)
+    # The slider value may arrive as a float; clamp so topk never over-asks.
+    top_k = max(0, min(int(num_of_output_classes), len(classes), probabilities.numel()))
+    # Pick the k most likely classes instead of the first k class indices.
+    top_probs, top_indices = torch.topk(probabilities, top_k)
+    return {classes[idx]: float(prob)
+            for prob, idx in zip(top_probs.tolist(), top_indices.tolist())}
+# def run_inference(input_img, num_of_output_classes,transparency):
+#     transform = transforms.ToTensor()
+#     input_img = transform(input_img)
+#     input_img = input_img.to(device)
+#     input_img = input_img.unsqueeze(0)
+#     softmax = torch.nn.Softmax(dim=0)
+#     outputs = model(input_img)
+#     out = softmax(outputs.flatten())
+#     _, prediction = torch.max(outputs, 1)
+#     confidences = {classes[i]:float(out[i]) for i in range(num_of_output_classes)}
+#     target_layers = [model.convlayer3[-2]]
+#     cam = GradCAM(model=model, target_layers=target_layers, use_cuda=True)
+#     grayscale_cam = cam(input_tensor=input_img, targets=targets)
+#     grayscale_cam = grayscale_cam[0, :]
+#     img = input_img.squeeze(0).to('cpu')
+#     img = inv_normalize(img)
+#     rgb_img = np.transpose(img, (1, 2, 0))
+#     rgb_img = rgb_img.numpy()
+#     visualization = show_cam_on_image(rgb_img, grayscale_cam, use_rgb=True, image_weight=transparency)
+#     return confidences, rgb_img, transparency,grayscale_cam