Spaces:

soutrik
/

gradio_demo_CatDogClassifier

Runtime error

App Files Files Community

Soutrik committed on Nov 9, 2024

Commit

8931c9e

1 Parent(s): beb5662

infer script

Browse files

Files changed (6) hide show

artifacts/image_prediction.png +0 -0
configs/infer.yaml +4 -4
configs/test.yaml +0 -34
configs/train.yaml +1 -1
image.jpg +0 -0
src/infer.py +128 -0

artifacts/image_prediction.png ADDED Viewed

configs/infer.yaml CHANGED Viewed

@@ -4,8 +4,8 @@
 # order of defaults determines the order in which configs override each other
 defaults:
   - _self_
-  - data: dogbreed
-  - model: dogbreed_classifier
   - callbacks: default
   - logger: null # set logger here or use command line (e.g. `python train.py logger=tensorboard`)
   - trainer: default
@@ -13,7 +13,7 @@ defaults:
   - hydra: default
   # experiment configs allow for version control of specific hyperparameters
   # e.g. best hyperparameters for given model and datamodule
-  - experiment: dogbreed_experiment
   # debugging config (enable through command line, e.g. `python train.py debug=default)
   - debug: null
@@ -39,4 +39,4 @@ ckpt_path: ${paths.ckpt_dir}/best-checkpoint.ckpt
 seed: 42
 # name of the experiment
-name: "dogbreed_experiment"

 # order of defaults determines the order in which configs override each other
 defaults:
   - _self_
+  - data: catdog
+  - model: catdog_model
   - callbacks: default
   - logger: null # set logger here or use command line (e.g. `python train.py logger=tensorboard`)
   - trainer: default
   - hydra: default
   # experiment configs allow for version control of specific hyperparameters
   # e.g. best hyperparameters for given model and datamodule
+  - experiment: catdog_experiment
   # debugging config (enable through command line, e.g. `python train.py debug=default)
   - debug: null
 seed: 42
 # name of the experiment
+name: "catdog_experiment"

configs/test.yaml DELETED Viewed

@@ -1,34 +0,0 @@
-defaults:
-  - _self_
-  - data: dogbreed
-  - model: dogbreed_classifier
-  - callbacks: default
-  - logger: null
-  - trainer: default
-  - paths: default  # This should map to another config file if using hydra to merge
-task_name: train
-tags:
-  - dev
-train: true
-test: true
-ckpt_path: null
-seed: 42
-# Ensure paths section is present
-paths:
-  root_dir: ./  # Project root directory
-  data_dir: ./data  # Path to your dataset
-  log_dir: ./logs  # Path to logs directory
-  ckpt_dir: ./checkpoints  # Path to checkpoints
-  artifact_dir: ./artifacts  # Path to save artifacts
-  kaggle_dir: khushikhushikhushi/dog-breed-image-dataset  # Path for Kaggle dataset
-# Ensure data section is present
-data:
-  num_workers: 4
-  batch_size: 32
-  image_size: 224
-  train_split: 0.8
-  val_split: 0.1
-  test_split: 0.1

configs/train.yaml CHANGED Viewed

@@ -38,7 +38,7 @@ ckpt_path: ${paths.ckpt_dir}/best-checkpoint.ckpt
 seed: 42
 # name of the experiment
-name: "dogbreed_experiment"
 # optimization metric
 optimization_metric: "val_acc"

 seed: 42
 # name of the experiment
+name: "catdog_experiment"
 # optimization metric
 optimization_metric: "val_acc"

image.jpg ADDED Viewed

src/infer.py ADDED Viewed

	@@ -0,0 +1,128 @@

+from pathlib import Path
+import requests
+import torch
+import torch.nn.functional as F
+import matplotlib.pyplot as plt
+from PIL import Image
+from torchvision import transforms
+from src.models.catdog_model import ViTTinyClassifier
+from src.utils.logging_utils import setup_logger, task_wrapper, get_rich_progress
+import hydra
+from omegaconf import DictConfig, OmegaConf
+from dotenv import load_dotenv, find_dotenv
+import rootutils
+import time
+from loguru import logger
+# Load environment variables from the ".env" file located by find_dotenv.
+# This runs at import time, before any function in this module is called.
+load_dotenv(find_dotenv(".env"))
+# Set up the project root with rootutils, using the ".project-root" marker
+# file as the indicator; the value returned by setup_root is kept in `root`.
+# NOTE(review): the `src.*` imports above execute before this call, so they
+# presumably rely on the project root already being importable — confirm.
+root = rootutils.setup_root(__file__, indicator=".project-root")
+@task_wrapper
+def load_image(image_path: str, image_size: int):
+    """Load an image from disk and preprocess it for the classifier.
+
+    Args:
+        image_path: Location of the image file to open.
+        image_size: Side length in pixels; the image is resized to a
+            square of ``image_size`` x ``image_size``.
+
+    Returns:
+        A tuple ``(img, tensor)`` where ``img`` is the RGB ``PIL.Image`` and
+        ``tensor`` is the resized, normalized tensor with an extra leading
+        dimension added by ``unsqueeze(0)``.
+    """
+    # Open inside a context manager so the underlying file handle is closed
+    # as soon as ``convert`` has produced an independent RGB copy.
+    with Image.open(image_path) as source:
+        img = source.convert("RGB")
+    # NOTE(review): the mean/std values are the commonly used ImageNet channel
+    # statistics; they presumably match training-time preprocessing — confirm.
+    transform = transforms.Compose(
+        [
+            transforms.Resize((image_size, image_size)),
+            transforms.ToTensor(),
+            transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
+        ]
+    )
+    return img, transform(img).unsqueeze(0)
+@task_wrapper
+def infer(model: torch.nn.Module, image_tensor: torch.Tensor, classes: list):
+    """Classify a single image tensor and report the winning label.
+
+    Args:
+        model: Network to evaluate; it is switched to eval mode here.
+        image_tensor: Input passed straight to ``model``.
+        classes: Label names, indexed by the model's predicted class index.
+
+    Returns:
+        A tuple ``(label, confidence)``: the entry of ``classes`` at the
+        arg-max index and the softmax probability of that index.
+    """
+    model.eval()
+    # Gradients are not needed for a forward-only pass.
+    with torch.no_grad():
+        logits = model(image_tensor)
+        probs = F.softmax(logits, dim=1)
+        best_idx = probs.argmax(dim=1).item()
+    return classes[best_idx], probs[0][best_idx].item()
+@task_wrapper
+def save_prediction_image(
+    image: Image.Image, predicted_label: str, confidence: float, output_path: Path
+):
+    """Save the image with the prediction shown as the figure title.
+
+    Args:
+        image: Image to render.
+        predicted_label: Label text placed in the title.
+        confidence: Confidence value, formatted to two decimals in the title.
+        output_path: Destination file; missing parent directories are created.
+    """
+    # Create the destination first so a bad path fails before a figure exists.
+    output_path.parent.mkdir(parents=True, exist_ok=True)
+    fig = plt.figure(figsize=(10, 6))
+    try:
+        plt.imshow(image)
+        plt.axis("off")
+        plt.title(f"Predicted: {predicted_label} (Confidence: {confidence:.2f})")
+        plt.tight_layout()
+        plt.savefig(output_path, dpi=300, bbox_inches="tight")
+    finally:
+        # Close this specific figure even when rendering or saving fails, so
+        # figures do not accumulate across many images.
+        plt.close(fig)
+@task_wrapper
+def download_image(cfg: DictConfig):
+    """Download a sample image from the web for inference.
+
+    The image is written to ``image.jpg`` under ``cfg.paths.root_dir``.
+    The download is best-effort: a network error or a non-200 response is
+    logged and the function returns without writing a file.
+
+    Args:
+        cfg: Configuration providing ``paths.root_dir``.
+    """
+    url = "https://github.com/laxmimerit/dog-cat-full-dataset/raw/master/data/train/dogs/dog.1.jpg"
+    headers = {
+        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/85.0.4183.121 Safari/537.36",
+    }
+    try:
+        # Without a timeout, requests can wait indefinitely on a stalled server.
+        response = requests.get(
+            url, headers=headers, allow_redirects=True, timeout=30
+        )
+    except requests.RequestException as exc:
+        # Treat connection problems like a bad status code: log and move on.
+        logger.error(f"Failed to download image: {exc}")
+        return
+    if response.status_code != 200:
+        logger.error(f"Failed to download image. Status code: {response.status_code}")
+        return
+    image_path = Path(cfg.paths.root_dir) / "image.jpg"
+    # The file is flushed and closed when the ``with`` block exits, so no
+    # extra wait is needed before it is read.
+    with open(image_path, "wb") as file:
+        file.write(response.content)
+    logger.info(f"Image downloaded successfully as {image_path}!")
+@hydra.main(config_path="../configs", config_name="infer", version_base="1.1")
+def main_infer(cfg: DictConfig):
+    """Run inference on every image found directly under the root directory.
+
+    Steps: log the configuration, set up file logging, remove a stale
+    ``train_done.flag``, load the checkpoint from ``cfg.ckpt_path``, download
+    a sample image, then classify each image and save an annotated copy to
+    ``cfg.paths.artifact_dir``.
+
+    Args:
+        cfg: Hydra configuration composed from ``configs/infer.yaml``.
+    """
+    # Print the configuration
+    logger.info(OmegaConf.to_yaml(cfg))
+    setup_logger(Path(cfg.paths.log_dir) / "infer.log")
+    # Remove the train_done flag if it exists
+    flag_file = Path(cfg.paths.ckpt_dir) / "train_done.flag"
+    if flag_file.exists():
+        flag_file.unlink()
+    # Load the trained model
+    model = ViTTinyClassifier.load_from_checkpoint(checkpoint_path=cfg.ckpt_path)
+    # NOTE(review): this order must match the label indices used in training;
+    # folder-based datasets often sort class names alphabetically — confirm.
+    classes = ["dog", "cat"]
+    # Download an image for inference
+    download_image(cfg)
+    # Collect image files only; match the suffix case-insensitively so that
+    # e.g. ".JPG" is included, and sort for a reproducible processing order.
+    image_suffixes = {".jpg", ".jpeg", ".png"}
+    image_files = sorted(
+        f
+        for f in Path(cfg.paths.root_dir).iterdir()
+        if f.is_file() and f.suffix.lower() in image_suffixes
+    )
+    if not image_files:
+        logger.warning(f"No images found in {cfg.paths.root_dir}; nothing to do.")
+        return
+    artifact_dir = Path(cfg.paths.artifact_dir)
+    with get_rich_progress() as progress:
+        task = progress.add_task("[green]Processing images...", total=len(image_files))
+        for image_file in image_files:
+            img, img_tensor = load_image(image_file, cfg.data.image_size)
+            # Move the input to the device the model lives on.
+            predicted_label, confidence = infer(
+                model, img_tensor.to(model.device), classes
+            )
+            output_file = artifact_dir / f"{image_file.stem}_prediction.png"
+            save_prediction_image(img, predicted_label, confidence, output_file)
+            progress.advance(task)
+            logger.info(f"Processed {image_file}: {predicted_label} ({confidence:.2f})")
+# Script entry point: run inference only when this file is executed directly.
+# main_infer is called without arguments; the @hydra.main decorator on it is
+# configured with the "infer" config name.
+if __name__ == "__main__":
+    main_infer()