3v324v23 committed on
Commit 6f4e455 · 0 Parent(s)

Deploy backend to Hugging Face Spaces

Files changed (13)
  1. .gitignore +11 -0
  2. .hf/metadata.json +4 -0
  3. Dockerfile +22 -0
  4. Dockerfile.hf +15 -0
  5. README.md +45 -0
  6. api.py +442 -0
  7. app.py +8 -0
  8. deploy_to_huggingface.sh +119 -0
  9. docker-compose.yml +2 -0
  10. main.py +91 -0
  11. requirements.txt +16 -0
  12. routers/__init__.py +23 -0
  13. routers/model.py +78 -0
.gitignore ADDED
@@ -0,0 +1,11 @@
+ .env
+ __pycache__/
+ *.py[cod]
+ *.class
+ .pytest_cache/
+ .coverage
+ htmlcov/
+ .ipynb_checkpoints
+ *.ipynb
+ venv/
+ .venv/
.hf/metadata.json ADDED
@@ -0,0 +1,4 @@
+ {
+     "app_port": 7860,
+     "app_file": "api.py"
+ }
Dockerfile ADDED
@@ -0,0 +1,22 @@
+ # Base image with Python
+ FROM python:3.10-slim
+
+ # Set up a non-root user for security
+ RUN useradd -m -u 1000 user
+ USER user
+ ENV PATH="/home/user/.local/bin:$PATH"
+
+ WORKDIR /app
+
+ # Install dependencies
+ COPY --chown=user requirements.txt .
+ RUN pip install --no-cache-dir --upgrade -r requirements.txt
+
+ # Copy application files
+ COPY --chown=user . .
+
+ # Hugging Face Spaces uses port 7860
+ ENV PORT=7860
+
+ # Use the api.py file as the entry point
+ CMD ["uvicorn", "api:app", "--host", "0.0.0.0", "--port", "7860"]
Dockerfile.hf ADDED
@@ -0,0 +1,15 @@
+ FROM python:3.10-slim
+
+ WORKDIR /app
+
+ COPY requirements.txt .
+
+ RUN pip install --no-cache-dir -r requirements.txt
+
+ COPY . .
+
+ # For Hugging Face Spaces - it expects port 7860 by default
+ ENV PORT=7860
+
+ # Entry point used by Hugging Face Spaces (shell form so ${PORT} is expanded at runtime)
+ CMD uvicorn api:app --host 0.0.0.0 --port ${PORT}
README.md ADDED
@@ -0,0 +1,45 @@
+ ---
+ title: Serendip Experiential Backend
+ emoji: 🚀
+ colorFrom: blue
+ colorTo: indigo
+ sdk: docker
+ sdk_version: "3.10"
+ app_file: api.py
+ pinned: false
+ license: mit
+ ---
+
+ # Serendip Experiential Backend
+
+ This Space hosts the FastAPI backend for the Serendip Experiential Engine, which serves the j2damax/serendip-travel-classifier model.
+
+ ## API Endpoints
+
+ - `GET /`: Health check endpoint
+ - `POST /predict`: Analyzes a tourism review text and returns experiential dimension scores
+ - `POST /explain`: Provides explainability for prediction results using SHAP
+
+ ## Usage
+
+ This backend API is designed to be used with the [Serendip Experiential Frontend](https://huggingface.co/spaces/j2damax/serendip-experiential-frontend).
+
+ ## Technologies
+
+ - FastAPI
+ - Hugging Face Transformers
+ - SHAP for explainability
+ - PyTorch
+
+ ## Model
+
+ This application uses the `j2damax/serendip-travel-classifier` model, which was trained to identify four key experiential dimensions in Sri Lankan tourism reviews:
+
+ - 🌱 Regenerative & Eco-Tourism
+ - 🧘 Integrated Wellness
+ - 🍜 Immersive Culinary
+ - 🌄 Off-the-Beaten-Path Adventure
+
+ ---
+
+ <a href="https://github.com/j2damax/explainable-tourism-nlp" target="_blank">View on GitHub</a>
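
A minimal client sketch for the endpoints listed in this README. The base URL is an assumption (substitute the Space's actual URL, or http://localhost:7860 when the container runs locally); the request and response shapes follow api.py in this commit.

```python
import requests

# Assumed base URL; replace with the deployed Space URL or a local instance
BASE_URL = "http://localhost:7860"

review = "We loved the organic farm stay and the village cooking class."

# Health check
print(requests.get(f"{BASE_URL}/").json())

# Classify the review into the four experiential dimensions
response = requests.post(f"{BASE_URL}/predict", json={"review_text": review})
response.raise_for_status()
for item in response.json():
    print(f"{item['label']}: {item['score']:.3f}")
```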
api.py ADDED
@@ -0,0 +1,442 @@
+ """
+ API module for BertForSequenceClassification model loading and inference
+ with storage optimization for Hugging Face Spaces
+ """
+ import os
+ import shutil
+ import tempfile
+ import time
+ from typing import List, Dict, Any, Optional
+ import logging
+ from fastapi import FastAPI, HTTPException
+ from pydantic import BaseModel
+ import torch
+ import numpy as np
+ from transformers import (
+     AutoTokenizer,
+     AutoModelForSequenceClassification,
+     pipeline
+ )
+
+ # Configure logging - use stderr to avoid filling up disk with log files
+ logging.basicConfig(
+     level=logging.INFO,
+     format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
+     handlers=[logging.StreamHandler()]  # Log to stderr instead of files
+ )
+ logger = logging.getLogger(__name__)
+
+ # Model constants
+ MODEL_NAME = "j2damax/serendip-travel-classifier"
+ NUM_LABELS = 4
+ MAX_LENGTH = 512
+
+ # Dimension labels
+ DIMENSIONS = [
+     "Regenerative & Eco-Tourism",
+     "Integrated Wellness",
+     "Immersive Culinary",
+     "Off-the-Beaten-Path Adventure"
+ ]
+
+ # Set up a temporary cache directory for Hugging Face Transformers
+ # This prevents filling up the persistent storage on HF Spaces
+ os.environ['TRANSFORMERS_CACHE'] = os.path.join(tempfile.gettempdir(), 'hf_transformers_cache')
+ os.environ['HF_HOME'] = os.path.join(tempfile.gettempdir(), 'hf_home')
+ os.makedirs(os.environ['TRANSFORMERS_CACHE'], exist_ok=True)
+ os.makedirs(os.environ['HF_HOME'], exist_ok=True)
+
+ # Initialize FastAPI app
+ app = FastAPI(
+     title="Serendip Travel Classifier API",
+     description="API for classifying experiential dimensions in Sri Lankan tourism reviews using BERT",
+     version="0.1.0",
+ )
+
+ # Request and response models
+ class PredictRequest(BaseModel):
+     review_text: str
+
+ class PredictionResult(BaseModel):
+     label: str
+     score: float
+
+ class ExplainRequest(BaseModel):
+     review_text: str
+     top_n_words: int = 10
+
+ # Global variables for model, tokenizer, and classifier
+ model = None
+ tokenizer = None
+ classifier = None
+
+ def cleanup_unused_files():
+     """Clean up temporary files and caches to save space"""
+     try:
+         # Clear transformers cache
+         cache_dir = os.environ.get('TRANSFORMERS_CACHE')
+         if cache_dir and os.path.exists(cache_dir):
+             logger.info(f"Cleaning up transformers cache: {cache_dir}")
+             # Instead of deleting everything, just remove files older than 1 hour
+             for root, dirs, files in os.walk(cache_dir):
+                 for f in files:
+                     file_path = os.path.join(root, f)
+                     try:
+                         if time.time() - os.path.getmtime(file_path) > 3600:
+                             os.remove(file_path)
+                     except Exception as e:
+                         logger.warning(f"Error removing file {file_path}: {str(e)}")
+
+         # Remove other temp files
+         temp_dir = tempfile.gettempdir()
+         for f in os.listdir(temp_dir):
+             if f.startswith('tmp') and not f.endswith('.py'):
+                 try:
+                     file_path = os.path.join(temp_dir, f)
+                     if os.path.isfile(file_path) and time.time() - os.path.getmtime(file_path) > 3600:
+                         os.remove(file_path)
+                 except Exception:
+                     pass
+     except Exception as e:
+         logger.warning(f"Error during cleanup: {str(e)}")
+
+ def load_model_if_needed():
+     """Load the model and tokenizer if they're not already loaded"""
+     global model, tokenizer, classifier
+
+     if model is None or tokenizer is None or classifier is None:
+         try:
+             logger.info("Loading model and tokenizer...")
+
+             # Clean up any existing cache to prevent storage issues
+             cleanup_unused_files()
+
+             # Use device setting
+             device = "cuda" if torch.cuda.is_available() else "cpu"
+             logger.info(f"Using device: {device}")
+
+             # Load tokenizer
+             tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
+
+             # Load model with optimization settings
+             model = AutoModelForSequenceClassification.from_pretrained(
+                 MODEL_NAME,
+                 num_labels=NUM_LABELS,
+                 problem_type="multi_label_classification",
+                 low_cpu_mem_usage=True  # Lower memory usage
+             )
+
+             # Create classifier pipeline
+             classifier = pipeline(
+                 "text-classification",
+                 model=model,
+                 tokenizer=tokenizer,
+                 function_to_apply="sigmoid",
+                 top_k=None,
+                 device=-1 if device == "cpu" else 0
+             )
+
+             logger.info("Model loaded successfully!")
+             return True
+         except Exception as e:
+             logger.error(f"Failed to load model: {str(e)}")
+             raise HTTPException(status_code=500, detail=f"Failed to load model: {str(e)}")
+
+     return True
+
+ @app.on_event("startup")
+ async def startup_event():
+     """Run startup tasks"""
+     logger.info("Starting API server. Model will be loaded on first request.")
+
+     # Clean up unused files from previous runs
+     cleanup_unused_files()
+
+ @app.get("/")
+ def read_root():
+     """Health check endpoint"""
+     global model, tokenizer, classifier
+
+     model_status = "loaded" if model is not None else "not_loaded"
+     return {
+         "status": "active",
+         "model": MODEL_NAME,
+         "model_status": model_status
+     }
+
+ @app.post("/predict", response_model=List[PredictionResult])
+ async def predict(request: PredictRequest):
+     """
+     Classify a tourism review into experiential dimensions
+
+     This endpoint processes the review text and returns prediction scores for all dimensions.
+     """
+     # Load the model lazily on the first request
+     load_model_if_needed()
+
+     try:
+         logger.info(f"Processing review: {request.review_text[:50]}...")
+
+         # Run inference
+         result = classifier(request.review_text)
+
+         # Log the raw result for debugging
+         logger.debug(f"Raw prediction result: {result}")
+
+         # Extract predictions and format the response; every branch below fills
+         # formatted_results so that a single sorted list is always returned
+         formatted_results = []
+         if isinstance(result, list) and len(result) > 0:
+             if isinstance(result[0], list) and len(result[0]) > 0:
+                 # Handle nested list structure [[{...}, {...}, ...]]
+                 predictions = result[0]
+
+                 # Create a mapping from label names to scores
+                 label_scores = {item['label']: item['score'] for item in predictions}
+
+                 # Ensure we have results for all dimensions in the expected order
+                 for label in DIMENSIONS:
+                     score = label_scores.get(label, 0.0)
+                     if isinstance(score, torch.Tensor):
+                         score = score.item()
+                     formatted_results.append({
+                         "label": label,
+                         "score": float(score)
+                     })
+             elif isinstance(result[0], dict):
+                 # Handle the case where the pipeline returns a list with one dict
+                 scores = result[0]
+
+                 # Format output as a list of label-score pairs
+                 for idx, label in enumerate(DIMENSIONS):
+                     label_id = f"LABEL_{idx}"
+                     score = scores.get(label_id, 0.0)
+                     if isinstance(score, torch.Tensor):
+                         score = score.item()
+                     formatted_results.append({
+                         "label": label,
+                         "score": float(score)
+                     })
+             else:
+                 # If the pipeline returns something unexpected, try to convert it
+                 for i, label in enumerate(DIMENSIONS):
+                     score = 0.0
+                     if i < len(result):
+                         if isinstance(result[i], dict) and "score" in result[i]:
+                             score = result[i]["score"]
+                         elif isinstance(result[i], (int, float, np.number, torch.Tensor)):
+                             score = float(result[i])
+
+                     formatted_results.append({
+                         "label": label,
+                         "score": float(score)
+                     })
+
+         # Sort by score in descending order
+         formatted_results.sort(key=lambda x: x["score"], reverse=True)
+         return formatted_results
+
+     except Exception as e:
+         logger.error(f"Error during prediction: {str(e)}")
+         raise HTTPException(status_code=500, detail=f"Prediction error: {str(e)}")
+
+ @app.post("/explain")
+ async def explain(request: ExplainRequest):
+     """
+     Generate explanations for a review's classification
+
+     This endpoint returns both an HTML visualization and the top influencing words,
+     using a simple attribution method for reliability.
+     """
+     # Load the model lazily on the first request
+     load_model_if_needed()
+
+     try:
+         # Get the input text
+         review_text = request.review_text
+
+         # Tokenize the text by word (use simple space splitting for visualization)
+         # NOTE: This is not the same as model tokenization, it's just for display
+         words = review_text.split()
+         if len(words) < 2:
+             raise ValueError("Review text must contain at least 2 words for explanation")
+
+         # Generate word importance for all dimensions using a simple leave-one-out method
+         dimension_scores = {dimension: [] for dimension in DIMENSIONS}
+
+         # 1. Get the baseline prediction for the full text
+         with torch.no_grad():
+             inputs = tokenizer(
+                 review_text,
+                 return_tensors="pt",
+                 truncation=True,
+                 padding=True,
+                 max_length=MAX_LENGTH
+             )
+             outputs = model(**inputs)
+             predictions = torch.sigmoid(outputs.logits)
+             baseline_scores = predictions.detach().numpy()[0]
+
+         # 2. For each word, measure its importance by removing it
+         for i, word in enumerate(words):
+             if len(words) <= 1:  # Skip if only one word
+                 continue
+
+             # Create text with this word removed
+             words_without_i = words.copy()
+             words_without_i.pop(i)
+             modified_text = " ".join(words_without_i)
+
+             # Get prediction without the word
+             with torch.no_grad():
+                 mod_inputs = tokenizer(
+                     modified_text,
+                     return_tensors="pt",
+                     truncation=True,
+                     padding=True,
+                     max_length=MAX_LENGTH
+                 )
+                 mod_outputs = model(**mod_inputs)
+                 mod_predictions = torch.sigmoid(mod_outputs.logits)
+                 mod_scores = mod_predictions.detach().numpy()[0]
+
+             # For each dimension, calculate importance as the difference in scores
+             for dim_idx, dimension in enumerate(DIMENSIONS):
+                 importance = float(baseline_scores[dim_idx] - mod_scores[dim_idx])
+                 dimension_scores[dimension].append({
+                     "word": word,
+                     "value": importance,
+                     "is_positive": importance > 0
+                 })
+
+         # 3. For each dimension, sort words by absolute importance and take top N
+         top_words = {}
+         for dimension in DIMENSIONS:
+             if dimension_scores[dimension]:
+                 # Sort by absolute importance (largest effect first)
+                 sorted_words = sorted(
+                     dimension_scores[dimension],
+                     key=lambda x: abs(x["value"]),
+                     reverse=True
+                 )
+                 # Take top N words
+                 top_words[dimension] = sorted_words[:request.top_n_words]
+             else:
+                 top_words[dimension] = []
+
+         # 4. Create visualization using matplotlib
+         try:
+             import matplotlib
+             matplotlib.use('Agg')
+             import matplotlib.pyplot as plt
+             from io import BytesIO
+             import base64
+
+             # Create visualization for the top dimension
+             top_dim_idx = np.argmax(baseline_scores)
+             top_dimension = DIMENSIONS[top_dim_idx]
+
+             # Extract top words for visualization
+             top_words_for_viz = top_words[top_dimension]
+
+             # Configure matplotlib to use smaller sizes and lower quality to save memory
+             plt.rcParams['figure.dpi'] = 80  # Lower DPI
+             plt.rcParams['savefig.dpi'] = 100  # Lower save DPI
+
+             # Create figure with a smaller size to reduce memory usage
+             fig, ax = plt.subplots(figsize=(8, 5))
+
+             # Prepare data for visualization - limit to top 8 words to reduce image size
+             viz_words = [item["word"] for item in top_words_for_viz[:8]]
+             viz_values = [item["value"] for item in top_words_for_viz[:8]]
+
+             # Create horizontal bar chart with simplified styling
+             bars = ax.barh(
+                 viz_words,
+                 viz_values,
+                 color=['#FF4444' if v > 0 else '#3366CC' for v in viz_values],
+                 height=0.7,
+                 edgecolor='black',
+                 linewidth=0.5
+             )
+
+             # Add simple labels and title
+             ax.set_title(f"Words influencing '{top_dimension}'", fontsize=12)
+             ax.set_xlabel("Impact on score", fontsize=10)
+
+             # Add a vertical line at x=0 with simplified styling
+             ax.axvline(x=0, color='black', linestyle='-', linewidth=1)
+
+             # Add simple legend to explain colors
+             from matplotlib.patches import Patch
+             legend_elements = [
+                 Patch(facecolor='#FF4444', edgecolor='black', label='Increases score'),
+                 Patch(facecolor='#3366CC', edgecolor='black', label='Decreases score')
+             ]
+             ax.legend(handles=legend_elements, loc='lower right', fontsize=8)
+
+             # Convert plot to a base64-encoded PNG with lower resolution
+             buffer = BytesIO()
+             fig.tight_layout()
+             plt.savefig(buffer, format='png', dpi=80, bbox_inches='tight')
+             buffer.seek(0)
+             img_str = base64.b64encode(buffer.read()).decode()
+
+             # Create simplified HTML with inline image
+             html = f"""
+             <div style="text-align: center;">
+                 <h3>Words influencing '{top_dimension}'</h3>
+                 <img src="data:image/png;base64,{img_str}" style="width:100%; max-width:600px;" />
+                 <p>Red bars increase prediction score, blue bars decrease it.</p>
+             </div>
+             """
+
+             # Close the figure to free memory
+             plt.close(fig)
+
+         except Exception as viz_error:
+             logger.error(f"Error creating visualization: {str(viz_error)}")
+             html = f"<p>Could not generate visualization: {str(viz_error)}</p>"
+
+         # Return the HTML and top words in the format expected by the frontend
+         return {
+             "explanation": {
+                 "html": html,
+                 "top_words": top_words
+             }
+         }
+
+     except Exception as e:
+         logger.error(f"Error during explanation: {str(e)}")
+         raise HTTPException(status_code=500, detail=f"Explanation error: {str(e)}")
+
+ @app.on_event("shutdown")
+ async def shutdown_event():
+     """Clean up resources when shutting down"""
+     logger.info("Shutting down API server")
+     cleanup_unused_files()
+
+     # Clear global model references to help garbage collection
+     global model, tokenizer, classifier
+     model = None
+     tokenizer = None
+     classifier = None
+
+ if __name__ == "__main__":
+     import uvicorn
+
+     # Determine the host and port from environment variables or use defaults
+     host = os.environ.get("HOST", "0.0.0.0")
+     port = int(os.environ.get("PORT", 8000))
+
+     # Run the application - disable reload in production to save memory
+     uvicorn.run("api:app", host=host, port=port, reload=False)
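
For reference, a hedged sketch of how a client might consume the `/explain` response defined above. The field names come from the handler in api.py; the base URL is an assumption for a locally running instance.

```python
import requests

BASE_URL = "http://localhost:7860"  # assumption: API running locally on the Spaces port

payload = {
    "review_text": "Quiet eco lodge with farm-to-table meals and guided jungle hikes.",
    "top_n_words": 5,
}
resp = requests.post(f"{BASE_URL}/explain", json=payload)
resp.raise_for_status()

explanation = resp.json()["explanation"]
# "html" holds the base64-embedded bar chart; "top_words" holds per-dimension attributions
for dimension, words in explanation["top_words"].items():
    top = ", ".join(f"{w['word']} ({w['value']:+.3f})" for w in words)
    print(f"{dimension}: {top}")
```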
app.py ADDED
@@ -0,0 +1,8 @@
+ """
+ Entry point for Hugging Face Spaces deployment
+ """
+ # Import the FastAPI app so Spaces can discover it
+ from api import app
+
+ # This is the entry point for Hugging Face Spaces
+ # It will automatically be detected and run
deploy_to_huggingface.sh ADDED
@@ -0,0 +1,119 @@
+ #!/bin/bash
+
+ # Deployment script for Serendip Experiential Backend to Hugging Face Spaces
+
+ # Check if HF_TOKEN is set
+ if [ -z "$HF_TOKEN" ]; then
+     echo "Error: HF_TOKEN environment variable not set"
+     echo "Please set it with: export HF_TOKEN=your_hugging_face_token"
+     exit 1
+ fi
+
+ # Define variables
+ SPACE_NAME="j2damax/serendip-experiential-backend"
+ REPO_URL="https://huggingface.co/spaces/$SPACE_NAME"
+ LOCAL_DIR="$(pwd)"
+
+ echo "Deploying backend to Hugging Face Spaces: $SPACE_NAME"
+
+ # Create a temporary directory
+ TMP_DIR=$(mktemp -d)
+ cd "$TMP_DIR"
+
+ # Initialize git and set credentials
+ git init
+ git config --local user.email "you@example.com"
+ git config --local user.name "Your Name"
+
+ # Clone the space if it exists, otherwise create from scratch
+ if curl --fail --silent -H "Authorization: Bearer $HF_TOKEN" "$REPO_URL" > /dev/null; then
+     echo "Space exists, cloning repository..."
+     # Format for Hugging Face API token authentication
+     git clone "https://huggingface.co/spaces/$SPACE_NAME" .
+     git config --local credential.helper store
+     echo "https://oauth2:$HF_TOKEN@huggingface.co" > ~/.git-credentials
+     # Remove all files except .git to ensure a clean state
+     find . -mindepth 1 -not -path "./.git*" -delete
+ else
+     echo "Creating new space..."
+     # Will push later to create the repository
+ fi
+
+ # Copy all files from the backend directory
+ echo "Copying files from $LOCAL_DIR to temporary directory..."
+ cp -r "$LOCAL_DIR"/* .
+
+ # Remove any unnecessary files
+ echo "Cleaning up unnecessary files..."
+ rm -rf __pycache__ .ipynb_checkpoints .pytest_cache .venv
+
+ # Use the Hugging Face specific Dockerfile
+ if [ -f "Dockerfile.hf" ]; then
+     echo "Using Hugging Face specific Dockerfile..."
+     mv Dockerfile.hf Dockerfile
+ fi
+
+ # Copy the README.md file with proper YAML metadata
+ if [ -f "$LOCAL_DIR/README.md" ]; then
+     echo "Using existing README.md with YAML metadata..."
+     cp "$LOCAL_DIR/README.md" ./README.md
+ else
+     echo "Creating default README.md with YAML metadata..."
+     cat > README.md << EOL
+ ---
+ title: Serendip Experiential Backend
+ emoji: 🚀
+ colorFrom: blue
+ colorTo: indigo
+ sdk: docker
+ sdk_version: "3.10"
+ app_file: api.py
+ pinned: false
+ license: mit
+ ---
+
+ # Serendip Experiential Backend
+ FastAPI backend for the Serendip Experiential Engine
+ EOL
+ fi
+
+ # Create .gitignore
+ echo ".env
+ __pycache__/
+ *.py[cod]
+ *\$py.class
+ .pytest_cache/
+ .coverage
+ htmlcov/
+ .ipynb_checkpoints
+ *.ipynb
+ venv/
+ .venv/" > .gitignore
+
+ # Create Hugging Face Space metadata file
+ mkdir -p .hf
+ cat > .hf/metadata.json << EOL
+ {
+     "app_port": 7860,
+     "app_file": "api.py"
+ }
+ EOL
+
+ # Add all files to git
+ git add .
+
+ # Commit changes
+ git commit -m "Deploy backend to Hugging Face Spaces"
+
+ # Push to Hugging Face Spaces
+ echo "Pushing to Hugging Face Spaces..."
+ # Use the stored credential helper instead of embedding the token in the URL
+ git remote add origin "https://huggingface.co/spaces/$SPACE_NAME"
+ # Ensure the local branch is named main before pushing
+ git branch -M main
+ git push -f origin main
+
+ # Clean up
+ cd - > /dev/null
+ rm -rf "$TMP_DIR"
+
+ echo "Deployment complete! Your backend should be available at:"
+ echo "https://huggingface.co/spaces/$SPACE_NAME"
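
As a rough alternative to the git-based script above, the same upload can be sketched with the `huggingface_hub` Python API (already pinned in requirements.txt). This assumes the Space already exists and that HF_TOKEN is set in the environment; it is illustrative, not part of this commit.

```python
import os
from huggingface_hub import HfApi

api = HfApi(token=os.environ["HF_TOKEN"])

# If the Space does not exist yet, it could be created first with
# api.create_repo("j2damax/serendip-experiential-backend", repo_type="space", space_sdk="docker")

# Push the backend directory to the Space repository in one call
api.upload_folder(
    folder_path=".",                                  # backend directory
    repo_id="j2damax/serendip-experiential-backend",  # Space name used in the script above
    repo_type="space",
    commit_message="Deploy backend to Hugging Face Spaces",
    ignore_patterns=["__pycache__/*", ".venv/*", "*.ipynb"],
)
```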
docker-compose.yml ADDED
@@ -0,0 +1,2 @@
+ dockerfile: Dockerfile.hf
+ base_path: /app
main.py ADDED
@@ -0,0 +1,91 @@
+ from fastapi import FastAPI, HTTPException
+ from pydantic import BaseModel
+ import numpy as np
+ from typing import Dict, List
+ import logging
+ import os
+
+ # Configure logging
+ logging.basicConfig(
+     level=logging.INFO,
+     format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
+ )
+ logger = logging.getLogger(__name__)
+
+ # Initialize FastAPI app
+ app = FastAPI(
+     title="Serendip Experiential Engine API",
+     description="API for classifying experiential dimensions in Sri Lankan tourism reviews",
+     version="0.1.0"
+ )
+
+ class ReviewRequest(BaseModel):
+     text: str
+
+ class ExplanationItem(BaseModel):
+     word: str
+     value: float
+
+ class ClassificationResponse(BaseModel):
+     predictions: Dict[str, float]
+     explanation: Dict[str, List[ExplanationItem]]
+
+ # Define the experiential dimensions
+ DIMENSIONS = [
+     "Regenerative & Eco-Tourism",
+     "Integrated Wellness",
+     "Immersive Culinary",
+     "Off-the-Beaten-Path Adventure"
+ ]
+
+ @app.get("/")
+ def read_root():
+     """Root endpoint for health checking"""
+     return {"status": "active", "service": "Serendip Experiential Engine API"}
+
+ @app.get("/dimensions")
+ def get_dimensions():
+     """Get all available experiential dimensions"""
+     return {"dimensions": DIMENSIONS}
+
+ @app.post("/classify", response_model=ClassificationResponse)
+ async def classify_review(request: ReviewRequest):
+     """
+     Classify a tourism review into experiential dimensions
+     """
+     try:
+         logger.info(f"Processing review: {request.text[:50]}...")
+
+         # TODO: Replace this with actual model inference
+         # This is just placeholder logic that returns random values
+         mock_predictions = {
+             dim: float(np.random.random()) for dim in DIMENSIONS
+         }
+
+         # Mock explanation data (in a real app, this would come from SHAP or similar)
+         mock_explanation = {
+             dim: [
+                 {"word": "beautiful", "value": float(np.random.random())},
+                 {"word": "amazing", "value": float(np.random.random())},
+                 {"word": "sustainable", "value": float(np.random.random())}
+             ] for dim in DIMENSIONS
+         }
+
+         return {
+             "predictions": mock_predictions,
+             "explanation": mock_explanation
+         }
+
+     except Exception as e:
+         logger.error(f"Error processing review: {str(e)}")
+         raise HTTPException(status_code=500, detail=f"Error processing review: {str(e)}")
+
+ if __name__ == "__main__":
+     import uvicorn
+
+     # Determine the host and port from environment variables or use defaults
+     host = os.environ.get("HOST", "0.0.0.0")
+     port = int(os.environ.get("PORT", 8000))
+
+     # Run the application
+     uvicorn.run("main:app", host=host, port=port, reload=True)
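
A quick way to exercise the mock `/classify` endpoint above without starting a server is FastAPI's test client; this sketch assumes the test client's httpx dependency is installed alongside the pinned FastAPI version.

```python
from fastapi.testclient import TestClient

from main import app

client = TestClient(app)

# The placeholder endpoint returns random scores plus mock word attributions
response = client.post("/classify", json={"text": "A peaceful ayurvedic retreat near Ella."})
assert response.status_code == 200

body = response.json()
print(body["predictions"])         # {dimension: score, ...}
print(body["explanation"].keys())  # one entry per dimension
```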
requirements.txt ADDED
@@ -0,0 +1,16 @@
+ # Backend requirements
+ fastapi>=0.100.0
+ uvicorn>=0.23.0
+ pydantic>=2.0.0
+ numpy>=1.24.0
+ pandas>=2.0.0
+ python-dotenv>=1.0.0
+ loguru>=0.7.0
+ requests>=2.31.0
+
+ # ML/NLP requirements
+ torch>=2.0.0
+ transformers>=4.30.0
+ shap>=0.42.0
+ huggingface-hub>=0.16.0
+ matplotlib>=3.7.0
routers/__init__.py ADDED
@@ -0,0 +1,23 @@
+ from fastapi import APIRouter, HTTPException
+ from pydantic import BaseModel
+ from typing import Dict, List
+
+ router = APIRouter(
+     prefix="/api/v1",
+     tags=["model"],
+     responses={404: {"description": "Not found"}},
+ )
+
+ class ReviewRequest(BaseModel):
+     text: str
+
+ class ClassificationResponse(BaseModel):
+     predictions: Dict[str, float]
+     explanation: Dict[str, List[Dict[str, float]]]
+
+ @router.get("/health")
+ async def health_check():
+     """Check if the model is healthy and ready to serve predictions"""
+     return {"status": "ok", "model": "active"}
+
+ # Additional model-related endpoints can be added here
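
Neither api.py nor main.py in this commit includes this router; a hedged sketch of how it could be wired into an app (illustrative only, names taken from the files above):

```python
from fastapi import FastAPI

from routers import router as api_v1_router  # the APIRouter defined above

app = FastAPI(title="Serendip Experiential Engine API")
app.include_router(api_v1_router)

# The health check is then served at /api/v1/health
```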
routers/model.py ADDED
@@ -0,0 +1,78 @@
+ from fastapi import APIRouter, HTTPException, Depends
+ from pydantic import BaseModel
+ from typing import Dict, List
+ import numpy as np
+ import logging
+
+ logger = logging.getLogger(__name__)
+
+ router = APIRouter(
+     prefix="/api/v1",
+     tags=["model"],
+     responses={404: {"description": "Not found"}},
+ )
+
+ class ReviewRequest(BaseModel):
+     text: str
+
+ class ExplanationItem(BaseModel):
+     word: str
+     value: float
+
+ class ClassificationResponse(BaseModel):
+     predictions: Dict[str, float]
+     explanation: Dict[str, List[ExplanationItem]]
+
+ # Define the experiential dimensions
+ DIMENSIONS = [
+     "Regenerative & Eco-Tourism",
+     "Integrated Wellness",
+     "Immersive Culinary",
+     "Off-the-Beaten-Path Adventure"
+ ]
+
+ @router.get("/health")
+ async def health_check():
+     """Check if the model is healthy and ready to serve predictions"""
+     return {"status": "ok", "model": "active"}
+
+ @router.get("/dimensions")
+ async def get_dimensions():
+     """Get all available experiential dimensions"""
+     return {"dimensions": DIMENSIONS}
+
+ # NOTE: This endpoint was removed as it's not currently used by the frontend
+ # The frontend uses its own implementation with the OpenAI API directly
+ # If you need this endpoint in the future, uncomment the code below
+
+ # @router.post("/classify", response_model=ClassificationResponse)
+ # async def classify_review(request: ReviewRequest):
+ #     """
+ #     Classify a tourism review into experiential dimensions
+ #     """
+ #     try:
+ #         logger.info(f"Processing review: {request.text[:50]}...")
+ #
+ #         # TODO: Replace this with actual model inference
+ #         # This is just placeholder logic that returns random values
+ #         mock_predictions = {
+ #             dim: float(np.random.random()) for dim in DIMENSIONS
+ #         }
+ #
+ #         # Mock explanation data (in a real app, this would come from SHAP or similar)
+ #         mock_explanation = {
+ #             dim: [
+ #                 {"word": "beautiful", "value": float(np.random.random())},
+ #                 {"word": "amazing", "value": float(np.random.random())},
+ #                 {"word": "sustainable", "value": float(np.random.random())}
+ #             ] for dim in DIMENSIONS
+ #         }
+ #
+ #         return {
+ #             "predictions": mock_predictions,
+ #             "explanation": mock_explanation
+ #         }
+ #
+ #     except Exception as e:
+ #         logger.error(f"Error processing review: {str(e)}")
+ #         raise HTTPException(status_code=500, detail=f"Error processing review: {str(e)}")