feat: add prediction script and model file for MNIST digit classification

Browse files

Files changed (4) hide show

models/mnist_model_lr0.001_bs64_ep20.pth +3 -0
predict.py +58 -0
test/image.jpg +0 -0
torchvision.pyi +4 -1

models/mnist_model_lr0.001_bs64_ep20.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aead1b3223333f05acf8494c6a73aec8bdaa9e32d3f0c239b16e5e12a3a07a8f
+size 4803144

predict.py ADDED Viewed

	@@ -0,0 +1,58 @@

+import torch
+# mypy: ignore-errors
+import torchvision.transforms as transforms
+from PIL import Image
+from mnist_classifier.model import MNISTModel
+import torch.nn.functional as F
+def load_model(model_path):
+    """Load the trained model."""
+    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    model = MNISTModel().to(device)
+    model.load_state_dict(torch.load(model_path, weights_only=True))
+    model.eval()
+    return model, device
+def preprocess_image(image_path):
+    """Preprocess the input image."""
+    transform = transforms.Compose([
+        transforms.Grayscale(num_output_channels=1),
+        transforms.Resize((28, 28)),
+        transforms.ToTensor(),  # This converts PIL Image to tensor
+        transforms.Normalize((0.5,), (0.5,))
+    ])
+    image = Image.open(image_path)
+    image_tensor = transform(image)  # Now image_tensor is already a tensor
+    return image_tensor.unsqueeze(0)  # type: ignore # Add batch dimension using tensor method
+def predict(model, image, device):
+    """Make prediction on the input image."""
+    with torch.no_grad():
+        image = image.to(device)
+        output = model(image)
+        probabilities = F.softmax(output, dim=1)
+        pred = output.argmax(dim=1, keepdim=True)
+        return pred.item(), probabilities[0]
+def main():
+    # Path to your trained model
+    model_path = "./models/mnist_model_lr0.001_bs64_ep10.pth"
+    # Load model
+    model, device = load_model(model_path)
+    # Path to input image
+    image_path = "./test/image.jpg"
+    # Preprocess image and get prediction
+    image = preprocess_image(image_path)
+    prediction, probabilities = predict(model, image, device)
+    print(f"Predicted digit: {prediction}")
+    print("\nProbabilities for each digit:")
+    for digit, prob in enumerate(probabilities):
+        print(f"{digit}: {prob.item():.4f}")
+if __name__ == "__main__":
+    main()

test/image.jpg ADDED Viewed

torchvision.pyi CHANGED Viewed

@@ -6,4 +6,7 @@ class datasets:
 class transforms:
     Compose: Any
     ToTensor: Any
-    Normalize: Any

 class transforms:
     Compose: Any
     ToTensor: Any
+    Normalize: Any
+    Grayscale: Any
+    Resize: Any