Spaces:

mohakapoor
/

CaptchaOCR

Sleeping

App Files Community

mohakapoor committed on Aug 17

Commit

858aaf1

1 Parent(s): 04fdb24

update inference.py

Browse files

Files changed (4) hide show

Metrics/inference_results.png +2 -2
inference.py +18 -18
requirements.txt +17 -0
train.py +8 -8

Metrics/inference_results.png CHANGED Viewed

Git LFS Details

SHA256: 3f354ee931ae653ed9821adbfb33c715ad310aad312064770238e879579ef078
Pointer size: 131 Bytes
Size of remote file: 209 kB

Git LFS Details

SHA256: 93244e9da7d2a23effdba1e9580ff7bedff2b10ea1e814e4dc97e323939b5c4a
Pointer size: 131 Bytes
Size of remote file: 207 kB

inference.py CHANGED Viewed

@@ -19,7 +19,7 @@ def load_model(checkpoint_path="checkpoints/best_model.pth"):
     # Load checkpoint to the detected device
     checkpoint = torch.load(checkpoint_path, map_location=device)
-    print(f"✅ Loaded model from epoch {checkpoint['epoch']}")
     print(f"   Best validation loss: {checkpoint['best_val_loss']:.4f}")
     print(f"   Loading to device: {device}")
@@ -74,25 +74,25 @@ def generate_test_captcha(text, filename, width=160, height=60):
     image = ImageCaptcha(width=width, height=height)
     filepath = os.path.join(cfg.RESULT_DIR, filename)
     image.write(text, filepath)
-    print(f"📸 Generated test CAPTCHA: {filename}")
     return filepath
 def main():
     # Setup
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-    print(f"🚀 Using device: {device}")
     os.makedirs(cfg.RESULT_DIR, exist_ok=True)
     try:
         # Load trained model
-        print("📥 Loading trained model...")
         model = load_model()
         model = model.to(device)
-        print("✅ Model loaded successfully!")
         # Generate test CAPTCHAs
-        print("\n🎯 Generating test CAPTCHAs...")
         test_cases = []
         for i in range(4):
@@ -105,7 +105,7 @@ def main():
             test_cases.append((text, image_path, ""))  # Add empty prediction slot
         # Run inference
-        print("\n🔍 Running inference...")
         print("-" * 60)
         print(f"{'Target':<15} {'Prediction':<15} {'Correct':<10} {'Image':<20}")
         print("-" * 60)
@@ -128,16 +128,16 @@ def main():
                     correct_count += 1
                 # Display result
-                status = "✅" if is_correct else "❌"
                 print(f"{target_text:<15} {prediction:<15} {status:<10} {os.path.basename(image_path):<20}")
             except Exception as e:
-                print(f"❌ Error processing {image_path}: {e}")
         # Summary
         print("-" * 60)
         accuracy = (correct_count / len(test_cases)) * 100
-        print(f"📊 Overall Accuracy: {correct_count}/{len(test_cases)} ({accuracy:.1f}%)")
         # Calculate individual character accuracy
         total_chars = 0
@@ -154,14 +154,14 @@ def main():
         print(f"🔤 Character Accuracy: {correct_chars}/{total_chars} ({char_accuracy:.1f}%)")
         if accuracy >= 80:
-            print("🎉 Excellent performance!")
         elif accuracy >= 60:
-            print("👍 Good performance!")
         else:
-            print("🤔 Room for improvement...")
         # Create and save results plot
-        print("\n📊 Generating results visualization...")
         try:
             metrics = TrainingMetrics()
             image_paths = [case[1] for case in test_cases]
@@ -173,14 +173,14 @@ def main():
             # Plot results
             metrics.plot_results(image_paths, predictions, targets)
-            print("✅ Results plot generated successfully!")
         except Exception as e:
-            print(f"⚠️  Warning: Could not generate plot: {e}")
     except Exception as e:
-        print(f"❌ Error: {e}")
-        print("💡 Make sure you have a trained model in checkpoints/best_model.pth")
 if __name__ == "__main__":
     main()

     # Load checkpoint to the detected device
     checkpoint = torch.load(checkpoint_path, map_location=device)
+    print(f"Loaded model from epoch {checkpoint['epoch']}")
     print(f"   Best validation loss: {checkpoint['best_val_loss']:.4f}")
     print(f"   Loading to device: {device}")
     image = ImageCaptcha(width=width, height=height)
     filepath = os.path.join(cfg.RESULT_DIR, filename)
     image.write(text, filepath)
+    print(f"Generated test CAPTCHA: {filename}")
     return filepath
 def main():
     # Setup
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    print(f"Using device: {device}")
     os.makedirs(cfg.RESULT_DIR, exist_ok=True)
     try:
         # Load trained model
+        print("Loading trained model...")
         model = load_model()
         model = model.to(device)
+        print("Model loaded successfully!")
         # Generate test CAPTCHAs
+        print("\nGenerating test CAPTCHAs...")
         test_cases = []
         for i in range(4):
             test_cases.append((text, image_path, ""))  # Add empty prediction slot
         # Run inference
+        print("\nRunning inference...")
         print("-" * 60)
         print(f"{'Target':<15} {'Prediction':<15} {'Correct':<10} {'Image':<20}")
         print("-" * 60)
                     correct_count += 1
                 # Display result
+                status = "CORRECT" if is_correct else "WRONG"
                 print(f"{target_text:<15} {prediction:<15} {status:<10} {os.path.basename(image_path):<20}")
             except Exception as e:
+                print(f"Error processing {image_path}: {e}")
         # Summary
         print("-" * 60)
         accuracy = (correct_count / len(test_cases)) * 100
+        print(f"Overall Accuracy: {correct_count}/{len(test_cases)} ({accuracy:.1f}%)")
         # Calculate individual character accuracy
         total_chars = 0
         print(f"🔤 Character Accuracy: {correct_chars}/{total_chars} ({char_accuracy:.1f}%)")
         if accuracy >= 80:
+            print("Excellent performance!")
         elif accuracy >= 60:
+            print("Good performance!")
         else:
+            print("Room for improvement...")
         # Create and save results plot
+        print("\nGenerating results visualization...")
         try:
             metrics = TrainingMetrics()
             image_paths = [case[1] for case in test_cases]
             # Plot results
             metrics.plot_results(image_paths, predictions, targets)
+            print("Results plot generated successfully!")
         except Exception as e:
+            print(f"Warning: Could not generate plot: {e}")
     except Exception as e:
+        print(f"Error: {e}")
+        print("Make sure you have a trained model in checkpoints/best_model.pth")
 if __name__ == "__main__":
     main()

requirements.txt ADDED Viewed

	@@ -0,0 +1,17 @@

+# CAPTCHA OCR Project Dependencies
+# Core ML Framework (install separately with CUDA 12.8 support)
+# pip3 install torch torchvision --index-url https://download.pytorch.org/whl/cu128
+# Computer Vision
+opencv-python>=4.8.0
+Pillow>=9.0.0
+# CAPTCHA Generation
+captcha>=0.4.0
+# Data Processing
+numpy>=1.21.0
+pandas>=1.3.0
+# Visualization and Plotting
+matplotlib>=3.5.0

train.py CHANGED Viewed

@@ -147,8 +147,8 @@ def main():
         if avg_val_loss < best_val_loss:
             best_val_loss = avg_val_loss
             patience_counter = 0
-            print(f"  🎯 New best validation loss: {best_val_loss:.4f}")
-            print(f"  📊 Val/Train ratio: {val_train_ratio:.3f}")
             # Save best model checkpoint with metadata
             checkpoint = {
@@ -169,19 +169,19 @@ def main():
                 }
             }
             torch.save(checkpoint, "checkpoints/best_model.pth")
-            print(f"  💾 Best model saved to checkpoints/best_model.pth")
         else:
             patience_counter += 1
-            print(f"  ⚠️  No improvement for {patience_counter} epochs")
-            print(f"  📊 Val/Train ratio: {val_train_ratio:.3f}")
         # Enhanced early stopping: Check both absolute loss and ratio
         if patience_counter >= patience or val_train_ratio > 3.0:  # Stop if ratio > 3x
             if val_train_ratio > 3.0:
-                print(f"  🛑 Early stopping triggered! Val/Train ratio too high: {val_train_ratio:.3f}")
             else:
-                print(f"  🛑 Early stopping triggered! No improvement for {patience} epochs")
             early_stop = True
             break
@@ -253,7 +253,7 @@ def main():
         }
     }
     torch.save(final_checkpoint, "checkpoints/final_model.pth")
-    print(f"💾 Final model saved to checkpoints/final_model.pth")
     print("\nGenerating training metrics and plots...")
     os.makedirs("Metrics", exist_ok=True)

         if avg_val_loss < best_val_loss:
             best_val_loss = avg_val_loss
             patience_counter = 0
+            print(f"  New best validation loss: {best_val_loss:.4f}")
+            print(f"  Val/Train ratio: {val_train_ratio:.3f}")
             # Save best model checkpoint with metadata
             checkpoint = {
                 }
             }
             torch.save(checkpoint, "checkpoints/best_model.pth")
+            print(f"  Best model saved to checkpoints/best_model.pth")
         else:
             patience_counter += 1
+            print(f"  No improvement for {patience_counter} epochs")
+            print(f"  Val/Train ratio: {val_train_ratio:.3f}")
         # Enhanced early stopping: Check both absolute loss and ratio
         if patience_counter >= patience or val_train_ratio > 3.0:  # Stop if ratio > 3x
             if val_train_ratio > 3.0:
+                print(f"  Early stopping triggered! Val/Train ratio too high: {val_train_ratio:.3f}")
             else:
+                print(f" Early stopping triggered! No improvement for {patience} epochs")
             early_stop = True
             break
         }
     }
     torch.save(final_checkpoint, "checkpoints/final_model.pth")
+    print(f"Final model saved to checkpoints/final_model.pth")
     print("\nGenerating training metrics and plots...")
     os.makedirs("Metrics", exist_ok=True)