Spaces:

nguyennp86
/

vietnamese-receipt-classification

Sleeping

App Files Community

nguyennp86 committed on Sep 4

Commit

bdcf915

verified ·

1 Parent(s): 7e3aa86

Update app.py

Browse files

Files changed (1) hide show

app.py +274 -133

app.py CHANGED Viewed

@@ -1,10 +1,7 @@
 #!/usr/bin/env python3
 """
 Vietnamese Receipt Classification App for Hugging Face Spaces
-Features:
-1. Train model on startup
-2. Vision Language Model for bill description
-3. Classification prediction
 """
 import os
@@ -19,7 +16,6 @@ import threading
 import time
 import io
 from PIL import Image
-import base64
 # Add paths for imports
 current_dir = os.path.dirname(os.path.abspath(__file__))
@@ -48,6 +44,7 @@ vectorizers = None
 label_encoder = None
 training_status = "Not started"
 training_log = []
 # ====================================
 # GOOGLE AI VISION SETUP
@@ -57,7 +54,6 @@ def setup_google_ai():
     if not GOOGLE_AI_AVAILABLE:
         return None
-    # Get API key from environment or Hugging Face secrets
     api_key = os.getenv('GOOGLE_AI_API_KEY') or os.getenv('GOOGLE_API_KEY')
     if not api_key:
@@ -66,8 +62,6 @@ def setup_google_ai():
     try:
         genai.configure(api_key=api_key)
-        # Initialize vision model
         model = genai.GenerativeModel('gemini-1.5-flash')
         print("✅ Google AI Vision model initialized")
         return model
@@ -82,9 +76,10 @@ google_vision_model = setup_google_ai()
 # ====================================
 def train_model_background():
     """Train model in background thread"""
-    global trained_model, feature_type, vectorizers, label_encoder, training_status, training_log
     try:
         training_status = "Starting training..."
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] Starting training...")
@@ -92,9 +87,10 @@ def train_model_background():
         if not os.path.exists(Config.DATA_FILE):
             training_status = "Error: Dataset not found"
             training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ❌ Dataset {Config.DATA_FILE} not found")
             return
-        training_status = "Training in progress..."
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] 🚀 Training started")
         # Initialize trainer
@@ -110,24 +106,33 @@ def train_model_background():
         label_encoder = trainer.data_loader.label_encoder
         accuracy = results.get('accuracy', 0)
-        training_status = f"Training completed! Accuracy: {accuracy:.4f}"
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ✅ Training completed with {accuracy:.4f} accuracy")
     except Exception as e:
-        training_status = f"Training failed: {str(e)}"
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ❌ Training failed: {str(e)}")
 def get_training_status():
     """Get current training status"""
-    log_text = "\n".join(training_log[-10:])  # Last 10 messages
     return training_status, log_text
 def start_training():
     """Start training process"""
     thread = threading.Thread(target=train_model_background)
     thread.daemon = True
     thread.start()
-    return "Training started in background...", ""
 # ====================================
 # VISION MODEL FUNCTIONS
@@ -135,7 +140,7 @@ def start_training():
 def extract_bill_description(image):
     """Extract bill description using Google Vision AI"""
     if not GOOGLE_AI_AVAILABLE or google_vision_model is None:
-        return "❌ Google AI Vision không khả dụng. Vui lòng nhập mô tả thủ công."
     try:
         if image is None:
@@ -184,10 +189,10 @@ def predict_bill_class(description):
     global trained_model, feature_type, vectorizers, label_encoder
     if trained_model is None:
-        return "❌ Model chưa được train. Vui lòng đợi quá trình training hoàn tất.", "", ""
     if not description or description.strip() == "":
-        return "❌ Vui lòng nhập mô tả hóa đơn", "", ""
     try:
         # Predict
@@ -209,11 +214,12 @@ def predict_bill_class(description):
         result_text = f"🎯 Dự đoán: {predicted_class}\n📊 Độ tin cậy: {confidence:.3f}"
         top_3_text = "📊 Top 3 dự đoán:\n" + "\n".join(top_3_results)
-        return result_text, top_3_text, f"Đã phân loại thành công với độ tin cậy {confidence:.1%}"
     except Exception as e:
-        return f"❌ Lỗi khi dự đoán: {str(e)}", "", ""
 def predict_from_image_and_text(image, manual_description):
     """Combined prediction from image and manual text"""
@@ -221,21 +227,24 @@ def predict_from_image_and_text(image, manual_description):
     # Use manual description if provided, otherwise extract from image
     if manual_description and manual_description.strip():
         description = manual_description.strip()
-        source = "📝 Sử dụng mô tả thủ công"
     elif image is not None:
         description = extract_bill_description(image)
-        source = "🖼️ Trích xuất từ ảnh"
         # Check if extraction failed
         if description.startswith("❌"):
-            return description, "", "", description
     else:
-        return "❌ Vui lòng upload ảnh hoặc nhập mô tả thủ công", "", "", ""
     # Make prediction
     result, top_3, status = predict_bill_class(description)
-    return result, top_3, status, f"{source}\n📄 Mô tả: {description}"
 # ====================================
 # GRADIO INTERFACE
@@ -243,197 +252,322 @@ def predict_from_image_and_text(image, manual_description):
 def create_interface():
     """Create Gradio interface"""
-    with gr.Blocks(title="Vietnamese Receipt Classification", theme=gr.themes.Soft()) as interface:
         gr.HTML("""
-        <div style="text-align: center; margin: 20px;">
             <h1>🧾 Vietnamese Receipt Classification</h1>
-            <p>Ứng dụng phân loại hóa đơn Việt Nam sử dụng GA-optimized Voting Ensemble</p>
         </div>
         """)
-        with gr.Tabs():
             # ====================================
             # TAB 1: MODEL TRAINING
             # ====================================
-            with gr.Tab("🚀 Model Training"):
-                gr.HTML("<h3>Training Status</h3>")
                 with gr.Row():
                     with gr.Column(scale=1):
-                        train_btn = gr.Button("🏋️ Start Training", variant="primary", size="lg")
                     with gr.Column(scale=1):
-                        refresh_btn = gr.Button("🔄 Refresh Status", variant="secondary")
-                status_text = gr.Textbox(
-                    label="Training Status",
-                    value="Click 'Start Training' to begin",
-                    interactive=False
-                )
-                log_text = gr.Textbox(
-                    label="Training Log",
-                    lines=8,
-                    max_lines=10,
-                    interactive=False
-                )
                 gr.HTML("""
-                <div style="margin-top: 20px; padding: 15px; background-color: #f0f0f0; border-radius: 5px;">
-                    <h4>📋 Training Information:</h4>
-                    <ul>
-                        <li>Algorithm: GA-optimized Voting Ensemble (KNN + Decision Tree + Naive Bayes)</li>
-                        <li>Features: BoW, TF-IDF, Sentence Embeddings</li>
-                        <li>Optimization: Genetic Algorithm with 30 population, 15 generations</li>
-                        <li>Training time: ~5-15 minutes depending on dataset size</li>
                     </ul>
                 </div>
                 """)
-                # Event handlers
-                train_btn.click(start_training, outputs=[status_text, log_text])
-                refresh_btn.click(get_training_status, outputs=[status_text, log_text])
             # ====================================
             # TAB 2: BILL CLASSIFICATION
             # ====================================
-            with gr.Tab("🔮 Bill Classification"):
-                gr.HTML("<h3>Phân loại hóa đơn từ ảnh hoặc mô tả</h3>")
                 with gr.Row():
                     with gr.Column(scale=1):
                         gr.HTML("<h4>📸 Upload ảnh hóa đơn</h4>")
                         image_input = gr.Image(
                             label="Ảnh hóa đơn",
                             type="pil",
-                            height=300
                         )
-                        extract_btn = gr.Button("🔍 Trích xuất mô tả từ ảnh", variant="secondary")
                         gr.HTML("<h4>📝 Hoặc nhập mô tả thủ công</h4>")
                         manual_input = gr.Textbox(
                             label="Mô tả hóa đơn",
                             placeholder="Ví dụ: Hóa đơn thanh toán tại cửa hàng cà phê Feel Coffee với món Yogurt Very Berry giá 22.000 VND",
-                            lines=3,
-                            max_lines=5
                         )
-                        predict_btn = gr.Button("🎯 Dự đoán phân loại", variant="primary", size="lg")
                     with gr.Column(scale=1):
-                        gr.HTML("<h4>📄 Mô tả đã trích xuất</h4>")
-                        extracted_text = gr.Textbox(
-                            label="Thông tin hóa đơn",
-                            lines=4,
                             interactive=False
                         )
                         gr.HTML("<h4>🎯 Kết quả phân loại</h4>")
-                        result_text = gr.Textbox(
-                            label="Kết quả dự đoán",
-                            lines=2,
                             interactive=False
                         )
-                        top3_text = gr.Textbox(
                             label="Top 3 dự đoán",
                             lines=4,
                             interactive=False
                         )
-                        status_msg = gr.Textbox(
                             label="Trạng thái",
-                            lines=1,
                             interactive=False
                         )
-                # Example section
-                gr.HTML("""
-                <div style="margin-top: 20px;">
-                    <h4>💡 Ví dụ các loại hóa đơn:</h4>
-                    <ul>
-                        <li><strong>Ăn uống ngoài hàng:</strong> Hóa đơn nhà hàng, quán cà phê, quán ăn</li>
-                        <li><strong>Siêu thị tổng hợp:</strong> VinMart, Co.opMart, Big C, Lotte Mart</li>
-                        <li><strong>Sữa & Đồ uống:</strong> Sữa, nước ngọt, đồ uống các loại</li>
-                        <li><strong>Tiện ích:</strong> Tiền điện, nước, internet, điện thoại</li>
-                    </ul>
-                </div>
-                """)
-                # Event handlers
                 extract_btn.click(
-                    process_image_and_extract,
                     inputs=[image_input],
                     outputs=[manual_input]
                 )
                 predict_btn.click(
-                    predict_from_image_and_text,
                     inputs=[image_input, manual_input],
-                    outputs=[result_text, top3_text, status_msg, extracted_text]
                 )
             # ====================================
-            # TAB 3: ABOUT
             # ====================================
-            with gr.Tab("ℹ️ About"):
                 gr.HTML("""
-                <div style="padding: 20px;">
-                    <h3>🧾 Vietnamese Receipt Classification System</h3>
-                    <h4>🎯 Tính năng chính:</h4>
-                    <ul>
-                        <li><strong>AI Vision:</strong> Trích xuất mô tả từ ảnh hóa đơn bằng Google Gemini Vision</li>
-                        <li><strong>GA Optimization:</strong> Tối ưu hóa ensemble classifier bằng Genetic Algorithm</li>
-                        <li><strong>Multi-feature:</strong> Kết hợp BoW, TF-IDF và Sentence Embeddings</li>
-                        <li><strong>Voting Ensemble:</strong> KNN + Decision Tree + Naive Bayes</li>
-                    </ul>
-                    <h4>🔧 Công nghệ sử dụng:</h4>
-                    <ul>
-                        <li><strong>Machine Learning:</strong> scikit-learn, sentence-transformers</li>
-                        <li><strong>Optimization:</strong> DEAP (Genetic Algorithm)</li>
-                        <li><strong>Computer Vision:</strong> Google Gemini Vision API</li>
-                        <li><strong>Interface:</strong> Gradio, Hugging Face Spaces</li>
-                    </ul>
-                    <h4>📊 Performance:</h4>
-                    <ul>
-                        <li><strong>Accuracy:</strong> ~85-95% (tùy thuộc dataset)</li>
-                        <li><strong>Training time:</strong> 5-15 phút</li>
-                        <li><strong>Prediction time:</strong> <1 giây</li>
-                    </ul>
-                    <h4>⚙️ Cấu hình GA:</h4>
-                    <ul>
-                        <li><strong>Population:</strong> 30 individuals</li>
-                        <li><strong>Generations:</strong> 15</li>
-                        <li><strong>Cross-validation:</strong> 3-fold</li>
-                        <li><strong>Selection:</strong> Tournament (size=3)</li>
-                    </ul>
-                    <div style="margin-top: 30px; padding: 15px; background-color: #e8f4fd; border-left: 4px solid #2196F3;">
-                        <h4>🚀 Hướng dẫn sử dụng:</h4>
                         <ol>
-                            <li>Bắt đầu bằng tab "Model Training" để train model</li>
-                            <li>Đợi training hoàn tất (~5-15 phút)</li>
-                            <li>Chuyển sang tab "Bill Classification"</li>
-                            <li>Upload ảnh hóa đơn hoặc nhập mô tả thủ công</li>
-                            <li>Nhấn "Dự đoán phân loại" để xem kết quả</li>
                         </ol>
                     </div>
-                    <div style="margin-top: 20px; text-align: center;">
-                        <p><strong>Developed with ❤️ for Vietnamese Receipt Classification</strong></p>
                     </div>
                 </div>
                 """)
-        # Auto-refresh training status every 10 seconds
-        interface.load(get_training_status, outputs=[status_text, log_text], every=10)
     return interface
@@ -442,6 +576,7 @@ def create_interface():
 # ====================================
 if __name__ == "__main__":
     print("🚀 Starting Vietnamese Receipt Classification App...")
     # Check dependencies
     print("📋 Checking dependencies...")
@@ -449,21 +584,27 @@ if __name__ == "__main__":
     if GOOGLE_AI_AVAILABLE and google_vision_model is not None:
         print("✅ Google AI Vision: Ready")
     else:
-        print("⚠️ Google AI Vision: Not available (set GOOGLE_AI_API_KEY)")
     # Check dataset
     if os.path.exists(Config.DATA_FILE):
         print(f"✅ Dataset: Found {Config.DATA_FILE}")
     else:
         print(f"⚠️ Dataset: {Config.DATA_FILE} not found")
     print("🎨 Creating Gradio interface...")
     app = create_interface()
     print("🌐 Launching app...")
     app.launch(
-        share=True,
         server_name="0.0.0.0",
         server_port=7860,
-        show_error=True
-    )

 #!/usr/bin/env python3
 """
 Vietnamese Receipt Classification App for Hugging Face Spaces
+Compatible with current Gradio version
 """
 import os
 import time
 import io
 from PIL import Image
 # Add paths for imports
 current_dir = os.path.dirname(os.path.abspath(__file__))
 label_encoder = None
 training_status = "Not started"
 training_log = []
+is_training = False
 # ====================================
 # GOOGLE AI VISION SETUP
     if not GOOGLE_AI_AVAILABLE:
         return None
     api_key = os.getenv('GOOGLE_AI_API_KEY') or os.getenv('GOOGLE_API_KEY')
     if not api_key:
     try:
         genai.configure(api_key=api_key)
         model = genai.GenerativeModel('gemini-1.5-flash')
         print("✅ Google AI Vision model initialized")
         return model
 # ====================================
 def train_model_background():
     """Train model in background thread"""
+    global trained_model, feature_type, vectorizers, label_encoder, training_status, training_log, is_training
     try:
+        is_training = True
         training_status = "Starting training..."
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] Starting training...")
         if not os.path.exists(Config.DATA_FILE):
             training_status = "Error: Dataset not found"
             training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ❌ Dataset {Config.DATA_FILE} not found")
+            is_training = False
             return
+        training_status = "Training in progress... (This may take 10-15 minutes)"
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] 🚀 Training started")
         # Initialize trainer
         label_encoder = trainer.data_loader.label_encoder
         accuracy = results.get('accuracy', 0)
+        training_status = f"✅ Training completed! Accuracy: {accuracy:.4f}"
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ✅ Training completed with {accuracy:.4f} accuracy")
     except Exception as e:
+        training_status = f"❌ Training failed: {str(e)}"
         training_log.append(f"[{datetime.now().strftime('%H:%M:%S')}] ❌ Training failed: {str(e)}")
+    finally:
+        is_training = False
 def get_training_status():
     """Get current training status"""
+    log_text = "\n".join(training_log[-15:])  # Last 15 messages
     return training_status, log_text
 def start_training():
     """Start training process"""
+    global is_training
+    if is_training:
+        return "⚠️ Training already in progress...", "\n".join(training_log[-15:])
     thread = threading.Thread(target=train_model_background)
     thread.daemon = True
     thread.start()
+    return "🚀 Training started in background...", "Training initiated..."
 # ====================================
 # VISION MODEL FUNCTIONS
 def extract_bill_description(image):
     """Extract bill description using Google Vision AI"""
     if not GOOGLE_AI_AVAILABLE or google_vision_model is None:
+        return "❌ Google AI Vision không khả dụng. Vui lòng thiết lập GOOGLE_AI_API_KEY hoặc nhập mô tả thủ công."
     try:
         if image is None:
     global trained_model, feature_type, vectorizers, label_encoder
     if trained_model is None:
+        return "❌ Model chưa được train. Vui lòng đợi quá trình training hoàn tất.", "", "Model not ready"
     if not description or description.strip() == "":
+        return "❌ Vui lòng nhập mô tả hóa đơn", "", "Empty description"
     try:
         # Predict
         result_text = f"🎯 Dự đoán: {predicted_class}\n📊 Độ tin cậy: {confidence:.3f}"
         top_3_text = "📊 Top 3 dự đoán:\n" + "\n".join(top_3_results)
+        status = f"✅ Đã phân loại thành công với độ tin cậy {confidence:.1%}"
+        return result_text, top_3_text, status
     except Exception as e:
+        return f"❌ Lỗi khi dự đoán: {str(e)}", "", f"Error: {str(e)}"
 def predict_from_image_and_text(image, manual_description):
     """Combined prediction from image and manual text"""
     # Use manual description if provided, otherwise extract from image
     if manual_description and manual_description.strip():
         description = manual_description.strip()
+        source_info = "📝 Sử dụng mô tả thủ công"
     elif image is not None:
         description = extract_bill_description(image)
+        source_info = "🖼️ Trích xuất từ ảnh"
         # Check if extraction failed
         if description.startswith("❌"):
+            return description, "", description, description
     else:
+        return "❌ Vui lòng upload ảnh hoặc nhập mô tả thủ công", "", "No input provided", ""
     # Make prediction
     result, top_3, status = predict_bill_class(description)
+    # Prepare full description info
+    full_description = f"{source_info}\n\n📄 Mô tả hóa đơn:\n{description}"
+    return result, top_3, status, full_description
 # ====================================
 # GRADIO INTERFACE
 def create_interface():
     """Create Gradio interface"""
+    # Custom CSS
+    css = """
+    .gradio-container {
+        max-width: 1200px !important;
+    }
+    .main-header {
+        text-align: center;
+        margin: 20px 0;
+        padding: 20px;
+        background: linear-gradient(90deg, #667eea 0%, #764ba2 100%);
+        color: white;
+        border-radius: 10px;
+    }
+    .tab-nav {
+        margin: 10px 0;
+    }
+    .status-box {
+        border: 2px solid #e1e5e9;
+        border-radius: 8px;
+        padding: 15px;
+        margin: 10px 0;
+    }
+    .success-status {
+        border-color: #28a745;
+        background-color: #f8fff9;
+    }
+    .error-status {
+        border-color: #dc3545;
+        background-color: #fff8f8;
+    }
+    .warning-status {
+        border-color: #ffc107;
+        background-color: #fffbf0;
+    }
+    """
+    with gr.Blocks(title="Vietnamese Receipt Classification", css=css, theme=gr.themes.Soft()) as interface:
+        # Header
         gr.HTML("""
+        <div class="main-header">
             <h1>🧾 Vietnamese Receipt Classification</h1>
+            <p>Ứng dụng phân loại hóa đơn Việt Nam sử dụng GA-optimized Ensemble + Google AI Vision</p>
         </div>
         """)
+        with gr.Tabs() as tabs:
             # ====================================
             # TAB 1: MODEL TRAINING
             # ====================================
+            with gr.Tab("🚀 Model Training", id="training"):
+                with gr.Row():
+                    gr.HTML("<h3>🏋️ Training Management</h3>")
                 with gr.Row():
                     with gr.Column(scale=1):
+                        train_btn = gr.Button(
+                            "🚀 Start Training",
+                            variant="primary",
+                            size="lg"
+                        )
                     with gr.Column(scale=1):
+                        refresh_btn = gr.Button(
+                            "🔄 Refresh Status",
+                            variant="secondary",
+                            size="lg"
+                        )
+                with gr.Row():
+                    status_display = gr.Textbox(
+                        label="📊 Training Status",
+                        value="Click 'Start Training' to begin",
+                        interactive=False,
+                        lines=2
+                    )
+                with gr.Row():
+                    log_display = gr.Textbox(
+                        label="📝 Training Log",
+                        lines=10,
+                        max_lines=15,
+                        interactive=False,
+                        placeholder="Training logs will appear here..."
+                    )
+                # Training info
                 gr.HTML("""
+                <div style="margin-top: 20px; padding: 20px; background-color: #f8f9fa; border-radius: 8px; border-left: 4px solid #007bff;">
+                    <h4>📋 Training Information</h4>
+                    <ul style="margin: 10px 0; padding-left: 20px;">
+                        <li><strong>Algorithm:</strong> GA-optimized Voting Ensemble (KNN + Decision Tree + Naive Bayes)</li>
+                        <li><strong>Features:</strong> BoW, TF-IDF, Sentence Embeddings (all-MiniLM-L6-v2)</li>
+                        <li><strong>Optimization:</strong> Genetic Algorithm (Population: 20, Generations: 10)</li>
+                        <li><strong>Evaluation:</strong> 3-fold Cross-Validation</li>
+                        <li><strong>Expected Time:</strong> 10-15 minutes on free tier</li>
+                        <li><strong>Expected Accuracy:</strong> 85-95% depending on dataset quality</li>
                     </ul>
                 </div>
                 """)
+                # Event handlers for training tab
+                train_btn.click(
+                    fn=start_training,
+                    outputs=[status_display, log_display]
+                )
+                refresh_btn.click(
+                    fn=get_training_status,
+                    outputs=[status_display, log_display]
+                )
             # ====================================
             # TAB 2: BILL CLASSIFICATION
             # ====================================
+            with gr.Tab("🔮 Bill Classification", id="classification"):
+                gr.HTML("<h3>🎯 Phân loại hóa đơn từ ảnh hoặc text</h3>")
                 with gr.Row():
+                    # Left column - Input
                     with gr.Column(scale=1):
                         gr.HTML("<h4>📸 Upload ảnh hóa đơn</h4>")
                         image_input = gr.Image(
                             label="Ảnh hóa đơn",
                             type="pil",
+                            height=250
                         )
+                        extract_btn = gr.Button(
+                            "🔍 Trích xuất mô tả từ ảnh",
+                            variant="secondary",
+                            size="sm"
+                        )
                         gr.HTML("<h4>📝 Hoặc nhập mô tả thủ công</h4>")
                         manual_input = gr.Textbox(
                             label="Mô tả hóa đơn",
                             placeholder="Ví dụ: Hóa đơn thanh toán tại cửa hàng cà phê Feel Coffee với món Yogurt Very Berry giá 22.000 VND",
+                            lines=4,
+                            max_lines=6
                         )
+                        predict_btn = gr.Button(
+                            "🎯 Dự đoán phân loại",
+                            variant="primary",
+                            size="lg"
+                        )
+                    # Right column - Output
                     with gr.Column(scale=1):
+                        gr.HTML("<h4>📄 Thông tin đã xử lý</h4>")
+                        processed_info = gr.Textbox(
+                            label="Nguồn và mô tả",
+                            lines=6,
                             interactive=False
                         )
                         gr.HTML("<h4>🎯 Kết quả phân loại</h4>")
+                        result_display = gr.Textbox(
+                            label="Dự đoán chính",
+                            lines=3,
                             interactive=False
                         )
+                        top3_display = gr.Textbox(
                             label="Top 3 dự đoán",
                             lines=4,
                             interactive=False
                         )
+                        status_output = gr.Textbox(
                             label="Trạng thái",
+                            lines=2,
                             interactive=False
                         )
+                # Examples section
+                with gr.Row():
+                    gr.HTML("""
+                    <div style="margin-top: 20px; padding: 15px; background-color: #e8f4fd; border-radius: 8px;">
+                        <h4>💡 Ví dụ các loại hóa đơn</h4>
+                        <div style="display: grid; grid-template-columns: 1fr 1fr; gap: 20px; margin-top: 10px;">
+                            <div>
+                                <ul style="margin: 0; padding-left: 20px;">
+                                    <li><strong>Ăn uống ngoài hàng:</strong> Nhà hàng, quán cà phê, fast food</li>
+                                    <li><strong>Siêu thị tổng hợp:</strong> VinMart, Co.opMart, Big C, Lotte</li>
+                                </ul>
+                            </div>
+                            <div>
+                                <ul style="margin: 0; padding-left: 20px;">
+                                    <li><strong>Sữa & Đồ uống:</strong> Sữa, nước ngọt, đồ uống các loại</li>
+                                    <li><strong>Tiện ích:</strong> Điện, nước, internet, di động</li>
+                                </ul>
+                            </div>
+                        </div>
+                    </div>
+                    """)
+                # Event handlers for classification tab
                 extract_btn.click(
+                    fn=process_image_and_extract,
                     inputs=[image_input],
                     outputs=[manual_input]
                 )
                 predict_btn.click(
+                    fn=predict_from_image_and_text,
                     inputs=[image_input, manual_input],
+                    outputs=[result_display, top3_display, status_output, processed_info]
                 )
             # ====================================
+            # TAB 3: ABOUT & HELP
             # ====================================
+            with gr.Tab("ℹ️ About & Help", id="about"):
                 gr.HTML("""
+                <div style="padding: 20px; max-width: 800px; margin: 0 auto;">
+                    <h2>🧾 Vietnamese Receipt Classification System</h2>
+                    <div style="margin: 20px 0; padding: 15px; background-color: #f8f9fa; border-radius: 8px;">
+                        <h3>🎯 Tính năng chính</h3>
+                        <ul>
+                            <li><strong>🤖 AI Vision:</strong> Trích xuất mô tả từ ảnh hóa đơn bằng Google Gemini Vision API</li>
+                            <li><strong>🧬 GA Optimization:</strong> Tối ưu hóa ensemble classifier bằng Genetic Algorithm</li>
+                            <li><strong>📊 Multi-feature:</strong> Kết hợp BoW, TF-IDF và Sentence Embeddings</li>
+                            <li><strong>🗳️ Voting Ensemble:</strong> KNN + Decision Tree + Naive Bayes với trọng số tối ưu</li>
+                            <li><strong>⚡ Real-time:</strong> Training và prediction trực tiếp trên web</li>
+                        </ul>
+                    </div>
+                    <div style="margin: 20px 0; padding: 15px; background-color: #e8f4fd; border-radius: 8px;">
+                        <h3>🔧 Công nghệ sử dụng</h3>
+                        <div style="display: grid; grid-template-columns: 1fr 1fr; gap: 15px;">
+                            <div>
+                                <h4>Machine Learning:</h4>
+                                <ul>
+                                    <li>scikit-learn</li>
+                                    <li>sentence-transformers</li>
+                                    <li>DEAP (Genetic Algorithm)</li>
+                                </ul>
+                            </div>
+                            <div>
+                                <h4>AI Vision:</h4>
+                                <ul>
+                                    <li>Google Gemini Vision</li>
+                                    <li>PIL (Image Processing)</li>
+                                    <li>Base64 Encoding</li>
+                                </ul>
+                            </div>
+                        </div>
+                    </div>
+                    <div style="margin: 20px 0; padding: 15px; background-color: #f0f8f0; border-radius: 8px;">
+                        <h3>📊 Performance Metrics</h3>
+                        <table style="width: 100%; border-collapse: collapse;">
+                            <tr>
+                                <td style="padding: 8px; border: 1px solid #ddd;"><strong>Accuracy</strong></td>
+                                <td style="padding: 8px; border: 1px solid #ddd;">85-95%</td>
+                            </tr>
+                            <tr>
+                                <td style="padding: 8px; border: 1px solid #ddd;"><strong>Training Time</strong></td>
+                                <td style="padding: 8px; border: 1px solid #ddd;">10-15 minutes</td>
+                            </tr>
+                            <tr>
+                                <td style="padding: 8px; border: 1px solid #ddd;"><strong>Prediction Time</strong></td>
+                                <td style="padding: 8px; border: 1px solid #ddd;">&lt; 2 seconds</td>
+                            </tr>
+                            <tr>
+                                <td style="padding: 8px; border: 1px solid #ddd;"><strong>Model Size</strong></td>
+                                <td style="padding: 8px; border: 1px solid #ddd;">~5MB (lightweight mode)</td>
+                            </tr>
+                        </table>
+                    </div>
+                    <div style="margin: 20px 0; padding: 15px; background-color: #fff8dc; border-radius: 8px;">
+                        <h3>🚀 Hướng dẫn sử dụng</h3>
                         <ol>
+                            <li><strong>Training:</strong> Bắt đầu với tab "🚀 Model Training", click "Start Training" và đợi 10-15 phút</li>
+                            <li><strong>Classification:</strong> Chuyển sang tab "🔮 Bill Classification"</li>
+                            <li><strong>Upload ảnh:</strong> Kéo thả ảnh hóa đơn vào khung "Upload ảnh hóa đơn"</li>
+                            <li><strong>Extract text:</strong> Click "🔍 Trích xuất mô tả từ ảnh" (cần Google AI API key)</li>
+                            <li><strong>Manual input:</strong> Hoặc nhập mô tả thủ công vào text box</li>
+                            <li><strong>Predict:</strong> Click "🎯 Dự đoán phân loại" để xem kết quả</li>
+                            <li><strong>Results:</strong> Xem dự đoán chính + top 3 alternatives với confidence scores</li>
                         </ol>
                     </div>
+                    <div style="margin: 20px 0; padding: 15px; background-color: #ffe6e6; border-radius: 8px;">
+                        <h3>⚠️ Lưu ý quan trọng</h3>
+                        <ul>
+                            <li><strong>Google AI API:</strong> Để sử dụng tính năng trích xuất từ ảnh, cần thiết lập GOOGLE_AI_API_KEY trong environment variables</li>
+                            <li><strong>Dataset:</strong> App cần file viet_receipt_categorized_label.xlsx để training</li>
+                            <li><strong>Memory:</strong> Training có thể tốn nhiều RAM, nên dùng trên máy có đủ bộ nhớ</li>
+                            <li><strong>Time:</strong> Quá trình training mất 10-15 phút, vui lòng kiên nhẫn</li>
+                        </ul>
+                    </div>
+                    <div style="text-align: center; margin-top: 30px; padding: 20px; background: linear-gradient(45deg, #667eea, #764ba2); color: white; border-radius: 8px;">
+                        <h3>🎉 Developed with ❤️ for Vietnamese NLP Community</h3>
+                        <p>Powered by Hugging Face 🤗 | Google AI Studio | Gradio</p>
                     </div>
                 </div>
                 """)
+        # Load initial status when interface starts
+        interface.load(
+            fn=get_training_status,
+            outputs=[status_display, log_display]
+        )
     return interface
 # ====================================
 if __name__ == "__main__":
     print("🚀 Starting Vietnamese Receipt Classification App...")
+    print("="*60)
     # Check dependencies
     print("📋 Checking dependencies...")
     if GOOGLE_AI_AVAILABLE and google_vision_model is not None:
         print("✅ Google AI Vision: Ready")
     else:
+        print("⚠️ Google AI Vision: Not available")
+        print("   💡 Set GOOGLE_AI_API_KEY environment variable to enable")
     # Check dataset
     if os.path.exists(Config.DATA_FILE):
         print(f"✅ Dataset: Found {Config.DATA_FILE}")
     else:
         print(f"⚠️ Dataset: {Config.DATA_FILE} not found")
+        print("   💡 Upload dataset file to enable training")
     print("🎨 Creating Gradio interface...")
     app = create_interface()
     print("🌐 Launching app...")
+    print("="*60)
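+    # Launch the Gradio server on all interfaces (0.0.0.0) at port 7860.
+    # NOTE(review): `show_tips` and `enable_queue` were removed from launch() in
+    # Gradio 4.x - confirm the pinned Gradio version still accepts them.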
     app.launch(
         server_name="0.0.0.0",
         server_port=7860,
+        share=False,  # Set to True for public sharing
+        show_error=True,
+        show_tips=True,
+        enable_queue=True