Spaces:

enesmanan
/

dl-animal-classifier

Sleeping

App Files Files Community

enesmanan committed on Dec 20, 2024

Commit

e1ab149

verified ·

1 Parent(s): 2ae907b

add deploy files

Browse files

Files changed (5) hide show

app.py +152 -0
checkpoints/cnn/cnn_best_model.pth +3 -0
checkpoints/efficientnet/efficientnet_best_model.pth +3 -0
model.py +160 -0
requirements.txt +12 -0

app.py ADDED Viewed

	@@ -0,0 +1,152 @@

+import os
+import gradio as gr
+import torch
+import torch.nn.functional as F
+import numpy as np
+from PIL import Image
+import torchvision.transforms as transforms
+import matplotlib.pyplot as plt
+from models.model import EfficientNetModel, CNNModel
+class AnimalClassifierApp:
+    def __init__(self):
+        """Initialize the application."""
+        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        self.labels = ["bird", "cat", "dog", "horse"]
+        # Image preprocessing
+        self.transform = transforms.Compose([
+            transforms.Resize((224, 224)),
+            transforms.ToTensor(),
+            transforms.Normalize(
+                mean=[0.485, 0.456, 0.406],
+                std=[0.229, 0.224, 0.225]
+            )
+        ])
+        # Load models
+        self.models = self.load_models()
+        if not self.models:
+            print("Warning: No models found in checkpoints directory!")
+    def load_models(self):
+        """Load both trained models."""
+        models = {}
+        # Load EfficientNet
+        try:
+            efficientnet = EfficientNetModel(num_classes=len(self.labels))
+            efficientnet_path = os.path.join("checkpoints", "efficientnet", "efficientnet_best_model.pth")
+            if os.path.exists(efficientnet_path):
+                checkpoint = torch.load(efficientnet_path, map_location=self.device, weights_only=True)
+                state_dict = checkpoint.get('model_state_dict', checkpoint)
+                efficientnet.load_state_dict(state_dict, strict=False)
+                efficientnet.eval()
+                models['EfficientNet'] = efficientnet
+                print("Successfully loaded EfficientNet model")
+        except Exception as e:
+            print(f"Error loading EfficientNet model: {str(e)}")
+        # Load CNN
+        try:
+            cnn = CNNModel(num_classes=len(self.labels))
+            cnn_path = os.path.join("checkpoints", "cnn", "cnn_best_model.pth")
+            if os.path.exists(cnn_path):
+                checkpoint = torch.load(cnn_path, map_location=self.device, weights_only=True)
+                state_dict = checkpoint.get('model_state_dict', checkpoint)
+                cnn.load_state_dict(state_dict, strict=False)
+                cnn.eval()
+                models['CNN'] = cnn
+                print("Successfully loaded CNN model")
+        except Exception as e:
+            print(f"Error loading CNN model: {str(e)}")
+        return models
+    def predict(self, image: Image.Image):
+        """Make predictions with both models and create comparison visualizations."""
+        if not self.models:
+            return "No trained models found. Please train the models first."
+        # Preprocess image
+        img_tensor = self.transform(image).unsqueeze(0).to(self.device)
+        # Get predictions from both models
+        results = {}
+        probabilities = {}
+        for model_name, model in self.models.items():
+            with torch.no_grad():
+                output = model(img_tensor)
+                probs = F.softmax(output, dim=1).squeeze().cpu().numpy()
+                probabilities[model_name] = probs
+                # Get top prediction
+                pred_idx = np.argmax(probs)
+                pred_label = self.labels[pred_idx]
+                pred_prob = probs[pred_idx]
+                results[model_name] = (pred_label, pred_prob)
+        # Create comparison plot
+        fig = plt.figure(figsize=(12, 5))
+        # Plot for EfficientNet
+        if 'EfficientNet' in probabilities:
+            plt.subplot(1, 2, 1)
+            plt.bar(self.labels, probabilities['EfficientNet'], color='skyblue')
+            plt.title('EfficientNet Predictions')
+            plt.ylim(0, 1)
+            plt.xticks(rotation=45)
+            plt.ylabel('Probability')
+        # Plot for CNN
+        if 'CNN' in probabilities:
+            plt.subplot(1, 2, 2)
+            plt.bar(self.labels, probabilities['CNN'], color='lightcoral')
+            plt.title('CNN Predictions')
+            plt.ylim(0, 1)
+            plt.xticks(rotation=45)
+            plt.ylabel('Probability')
+        plt.tight_layout()
+        # Create results text
+        text_results = "Model Predictions:\n\n"
+        for model_name, (label, prob) in results.items():
+            text_results += f"{model_name}:\n"
+            text_results += f"Top prediction: {label} ({prob:.2%})\n"
+            text_results += "All probabilities:\n"
+            for label, prob in zip(self.labels, probabilities[model_name]):
+                text_results += f"  {label}: {prob:.2%}\n"
+            text_results += "\n"
+        return [
+            fig,           # Probability plots
+            text_results   # Detailed text results
+        ]
+    def create_interface(self):
+        """Create Gradio interface."""
+        return gr.Interface(
+            fn=self.predict,
+            inputs=gr.Image(type="pil"),
+            outputs=[
+                gr.Plot(label="Prediction Probabilities"),
+                gr.Textbox(label="Detailed Results", lines=10)
+            ],
+            title="Animal Classifier - Model Comparison",
+            description="Upload an image of an animal to see predictions from both EfficientNet and CNN models."
+        )
+def main():
+    """Run the web application."""
+    app = AnimalClassifierApp()
+    interface = app.create_interface()
+    interface.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=True
+    )
+if __name__ == "__main__":
+    main()

checkpoints/cnn/cnn_best_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e20be6471690e71892f6b8bcc44f548cf8f876db51ca166953b1433c993e7bee
+size 1557014

checkpoints/efficientnet/efficientnet_best_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:754e2ec53c4f1f1c6d4a9398d38d0f415ac33a50c8794e2c6292137696ced2ee
+size 48638100

model.py ADDED Viewed

	@@ -0,0 +1,160 @@

+from typing import Dict, Any
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import timm
+class BaseModel(nn.Module):
+    """Base model class for animal classification."""
+    def predict(self, x: torch.Tensor) -> torch.Tensor:
+        """Get probability predictions."""
+        with torch.no_grad():
+            logits = self(x)
+            return F.softmax(logits, dim=1)
+    @classmethod
+    def load_from_checkpoint(
+        cls,
+        path: str,
+        map_location: Any = None
+    ) -> 'BaseModel':
+        """Load model from checkpoint."""
+        checkpoint = torch.load(path, map_location=map_location)
+        model = cls(num_classes=checkpoint['config']['num_classes'])
+        model.load_state_dict(checkpoint['model_state_dict'])
+        return model
+    def save_checkpoint(
+        self,
+        path: str,
+        extra_data: Dict[str, Any] = None
+    ) -> None:
+        """Save model checkpoint."""
+        data = {
+            'model_state_dict': self.state_dict(),
+            'config': {
+                'num_classes': self.get_num_classes(),
+                'model_type': self.__class__.__name__
+            }
+        }
+        if extra_data:
+            if 'config' in extra_data:
+                data['config'].update(extra_data['config'])
+                del extra_data['config']
+            data.update(extra_data)
+        torch.save(data, path)
+    def get_num_classes(self) -> int:
+        """Get number of output classes."""
+        raise NotImplementedError
+class CNNModel(BaseModel):
+    def __init__(self, num_classes: int, input_size: int = 224):
+        super(CNNModel, self).__init__()
+        self.conv_layers = nn.Sequential(
+            # First block: 32 filters
+            nn.Conv2d(3, 32, kernel_size=3, padding=1),
+            nn.BatchNorm2d(32),
+            nn.ReLU(),
+            nn.MaxPool2d(2),
+            # Second block: 64 filters
+            nn.Conv2d(32, 64, kernel_size=3, padding=1),
+            nn.BatchNorm2d(64),
+            nn.ReLU(),
+            nn.MaxPool2d(2),
+            # Third block: 128 filters
+            nn.Conv2d(64, 128, kernel_size=3, padding=1),
+            nn.BatchNorm2d(128),
+            nn.ReLU(),
+            nn.MaxPool2d(2),
+            # Global Average Pooling
+            nn.AdaptiveAvgPool2d(1)
+        )
+        self.classifier = nn.Sequential(
+            nn.Flatten(),
+            nn.Dropout(0.5),
+            nn.Linear(128, 256),
+            nn.ReLU(),
+            nn.Dropout(0.3),
+            nn.Linear(256, num_classes)
+        )
+        self._initialize_weights()
+    def _initialize_weights(self):
+        """Initialize model weights."""
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d):
+                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
+                if m.bias is not None:
+                    nn.init.constant_(m.bias, 0)
+            elif isinstance(m, nn.BatchNorm2d):
+                nn.init.constant_(m.weight, 1)
+                nn.init.constant_(m.bias, 0)
+            elif isinstance(m, nn.Linear):
+                nn.init.normal_(m.weight, 0, 0.01)
+                nn.init.constant_(m.bias, 0)
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        x = self.conv_layers(x)
+        return self.classifier(x)
+    def get_num_classes(self) -> int:
+        return self.classifier[-1].out_features
+class EfficientNetModel(BaseModel):
+    """EfficientNet-based model for animal classification."""
+    def __init__(
+        self,
+        num_classes: int,
+        model_name: str = "efficientnet_b0",
+        pretrained: bool = True
+    ):
+        super(EfficientNetModel, self).__init__()
+        self.base_model = timm.create_model(
+            model_name,
+            pretrained=pretrained,
+            num_classes=0
+        )
+        with torch.no_grad():
+            dummy_input = torch.randn(1, 3, 224, 224)
+            features = self.base_model(dummy_input)
+            feature_dim = features.shape[1]
+        # Simpler classifier structure matching the saved model
+        self.classifier = nn.Sequential(
+            nn.Dropout(0.2),
+            nn.Linear(feature_dim, num_classes)
+        )
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        features = self.base_model(x)
+        return self.classifier(features)
+    def get_num_classes(self) -> int:
+        return self.classifier[-1].out_features
+def get_model(model_type: str, num_classes: int, **kwargs) -> BaseModel:
+    """Factory function to get model by type."""
+    models = {
+        'cnn': CNNModel,
+        'efficientnet': EfficientNetModel
+    }
+    if model_type not in models:
+        raise ValueError(f"Model type {model_type} not supported. Available models: {list(models.keys())}")
+    return models[model_type](num_classes=num_classes, **kwargs)

requirements.txt ADDED Viewed

	@@ -0,0 +1,12 @@

+torch==2.5.1
+torchvision==0.20.1
+timm==1.0.12
+pillow==10.4.0
+numpy==1.26.4
+opencv-python==4.10.0
+tqdm==4.67.1
+matplotlib==3.7.5
+gradio==5.9.1
+wandb==0.19.1
+datasets==3.2.0
+scikit-learn==1.4.2