PsalmsJava committed on
Commit
c6d98fa
·
1 Parent(s): 8c45515

Initial deployment of emotion detection API

Browse files
README.md CHANGED
@@ -1,12 +1,32 @@
1
  ---
2
- title: Emotion Detection Api
3
- emoji: 🏆
4
  colorFrom: blue
5
  colorTo: purple
6
  sdk: docker
 
7
  pinned: false
8
  license: mit
9
- short_description: Emotion Detection API for The MoodSync Project
10
  ---
11
 
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ title: Emotion Detection Ensemble API
3
+ emoji: 🎭
4
  colorFrom: blue
5
  colorTo: purple
6
  sdk: docker
7
+ app_port: 7860
8
  pinned: false
9
  license: mit
 
10
  ---
11
 
12
+ # 🎭 Emotion Detection Ensemble API
13
+
14
+ A production-ready emotion detection API that combines 5 state-of-the-art models for accurate emotion recognition from speech.
15
+
16
+ ## ✨ Features
17
+ - **Ensemble Learning**: Combines 5 models with weighted voting
18
+ - **Advanced Audio Processing**: VAD, noise reduction, format conversion
19
+ - **Multi-Emotion Output**: Returns probability distribution across 7 emotions
20
+ - **Secure Authentication**: Bearer token authentication
21
+ - **Interactive Docs**: Built-in Swagger UI
22
+
23
+ ## 🚀 Quick Start
24
+
25
+ ### API Endpoints
26
+ - `GET /health` - Health check
27
+ - `GET /models` - List all models
28
+ - `POST /analyze` - Analyze emotion from audio
29
+ - `POST /analyze-batch` - Analyze multiple files
30
+
31
+ ### Authentication
32
+ Include your API token in the header:
app/audio/preprocessor.py ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import tempfile
3
+ import subprocess
4
+ import numpy as np
5
+ import librosa
6
+ from fastapi import UploadFile, HTTPException
7
+ from typing import Tuple
8
+ import logging
9
+ from ..config import config
10
+
11
+ logger = logging.getLogger(__name__)
12
+
13
class AudioPreprocessor:
    """Simplified audio preprocessing for Hugging Face deployment."""

    def __init__(self):
        # Limits and target format come from the app-level config.
        self.target_sr = config.AUDIO_CONFIG["target_sample_rate"]
        self.max_duration = config.AUDIO_CONFIG["max_duration"]
        self.max_size_mb = config.AUDIO_CONFIG["max_file_size_mb"]

    async def validate_and_preprocess(self, file: UploadFile) -> Tuple[np.ndarray, int, dict]:
        """
        Validate and preprocess an uploaded audio file.

        Returns (audio, sample_rate, metadata) where audio is a mono,
        peak-normalized float array resampled to the target rate.

        Raises:
            HTTPException(400): file too large or FFmpeg conversion failed.
            HTTPException(500): unexpected processing error.
        """
        contents = await file.read()
        file_size_mb = len(contents) / (1024 * 1024)

        # Validate size before touching the filesystem.
        if file_size_mb > self.max_size_mb:
            raise HTTPException(
                status_code=400,
                detail=f"File too large: {file_size_mb:.1f}MB (max: {self.max_size_mb}MB)"
            )

        # Preserve the original extension so FFmpeg can sniff the container.
        # BUGFIX: the old f".{filename.split('.')[-1]}" produced a bogus suffix
        # for extension-less names; splitext handles that safely.
        ext = os.path.splitext(file.filename or "")[1] or ".bin"
        with tempfile.NamedTemporaryFile(delete=False, suffix=ext) as tmp_input:
            tmp_input.write(contents)
            input_path = tmp_input.name

        # BUGFIX: define output_path up-front so cleanup in `finally` cannot
        # hit a NameError when tempfile creation itself fails.
        output_path = None
        try:
            with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_output:
                output_path = tmp_output.name

            # Convert to mono 16-bit PCM WAV at the target sample rate.
            cmd = [
                "ffmpeg",
                "-i", input_path,
                "-ar", str(self.target_sr),
                "-ac", "1",
                "-acodec", "pcm_s16le",
                "-y",
                output_path
            ]
            result = subprocess.run(cmd, capture_output=True, text=True)
            if result.returncode != 0:
                raise HTTPException(status_code=400, detail="Audio conversion failed")

            # Load converted audio (librosa resamples to target_sr if needed).
            audio, sr = librosa.load(output_path, sr=self.target_sr)

            # Truncate over-long audio instead of rejecting it.
            duration = len(audio) / sr
            if duration > self.max_duration:
                audio = audio[:int(self.max_duration * sr)]

            # Peak-normalize; leave silent audio untouched (avoid divide-by-zero).
            peak = np.max(np.abs(audio))
            if peak > 0:
                audio = audio / peak

            metadata = {
                "filename": file.filename,
                "duration": round(len(audio) / sr, 2),
                "sample_rate": sr,
                "size_mb": round(file_size_mb, 2)
            }
            return audio, sr, metadata

        except HTTPException:
            # BUGFIX: previously the generic handler below converted the
            # deliberate 400 "Audio conversion failed" into an opaque 500.
            raise
        except Exception as e:
            logger.error(f"Audio processing failed: {str(e)}")
            raise HTTPException(status_code=500, detail="Audio processing failed")
        finally:
            # Always remove both temp files, whatever path we exited by.
            for path in (input_path, output_path):
                if path and os.path.exists(path):
                    os.unlink(path)

audio_preprocessor = AudioPreprocessor()
app/auth.py ADDED
File without changes
app/config.py ADDED
File without changes
app/main.py ADDED
@@ -0,0 +1,192 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI, File, UploadFile, Depends, HTTPException, Request
2
+ from fastapi.security import HTTPBearer
3
+ from fastapi.responses import JSONResponse
4
+ from fastapi.middleware.cors import CORSMiddleware
5
+ from fastapi.openapi.docs import get_swagger_ui_html
6
+ import aiohttp
7
+ import time
8
+ import hashlib
9
+ import logging
10
+ from datetime import datetime
11
+ from typing import Optional
12
+ import os
13
+
14
+ from .config import config
15
+ from .auth import auth_handler
16
+ from .audio.preprocessor import audio_preprocessor
17
+ from .models.ensemble import ensemble_fusion
18
+
19
# Setup logging: level name (e.g. "INFO") comes from config.LOG_LEVEL.
logging.basicConfig(level=getattr(logging, config.LOG_LEVEL))
logger = logging.getLogger(__name__)

# Initialize FastAPI. docs_url=None disables the built-in /docs so the
# custom Swagger route defined below can serve it instead.
app = FastAPI(
    title=config.API_TITLE,
    version=config.API_VERSION,
    docs_url=None  # We'll create custom docs
)

# CORS
# NOTE(review): allow_origins=["*"] together with allow_credentials=True is
# ineffective — Starlette will not send a wildcard origin on credentialed
# responses. Confirm whether credentialed cross-origin calls are needed.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# Simple in-memory, process-local cache: MD5(file bytes) -> analysis result.
# Size-capped in /analyze; no TTL or eviction.
prediction_cache = {}
# Shared aiohttp session, created on startup and closed on shutdown.
http_session = None
43
@app.on_event("startup")
async def startup():
    """Initialize on startup: create the shared aiohttp session and log config state."""
    # NOTE(review): @app.on_event is deprecated in newer FastAPI releases in
    # favor of lifespan handlers — consider migrating on upgrade.
    global http_session
    http_session = aiohttp.ClientSession()
    logger.info(f"🚀 API started with {len(config.MODELS)} models")
    logger.info(f"HF_TOKEN present: {bool(config.HF_TOKEN)}")
51
@app.on_event("shutdown")
async def shutdown():
    """Cleanup on shutdown: close the shared aiohttp session if it was created."""
    if http_session:
        await http_session.close()
57
@app.get("/", include_in_schema=False)
async def root():
    """Landing endpoint: service identity plus pointers to docs and health."""
    info = {
        "service": config.API_TITLE,
        "version": config.API_VERSION,
    }
    info["docs"] = "/docs"
    info["health"] = "/health"
    return info
67
@app.get("/health")
async def health_check():
    """Health check for Hugging Face.

    Reports status, a UTC timestamp, the configured model count, and
    whether an HF token is present (never the token itself).
    """
    # Local import: the file only imports `datetime` from the module.
    from datetime import timezone

    # datetime.utcnow() is deprecated (Python 3.12+). Use an aware now() and
    # strip tzinfo so the ISO string keeps the original naive-UTC format.
    now_utc = datetime.now(timezone.utc).replace(tzinfo=None)
    return {
        "status": "healthy",
        "timestamp": now_utc.isoformat(),
        "models": len(config.MODELS),
        "hf_token_configured": bool(config.HF_TOKEN)
    }
77
@app.get("/models")
async def list_models():
    """Return name, ensemble weight, and description for every model."""
    entries = []
    for model_name, spec in config.MODELS.items():
        entries.append({
            "name": model_name,
            "weight": spec["weight"],
            "description": spec.get("description", ""),
        })
    return {"models": entries}
91
@app.post("/analyze")
async def analyze_emotion(
    request: Request,
    file: UploadFile = File(...),
    token: str = Depends(auth_handler.verify_token)
):
    """
    Analyze emotion from an uploaded audio file.

    Pipeline: cache lookup -> audio validation/preprocessing -> query all
    ensemble models -> weighted fusion -> cache and return the result.

    Raises:
        HTTPException(503): too few ensemble models responded.
        HTTPException(500): any unexpected processing error.
    """
    start_time = time.time()

    try:
        # Read the upload once; these bytes serve both the cache key and
        # the downstream model queries.
        file_content = await file.read()

        cache_key = hashlib.md5(file_content).hexdigest()
        if cache_key in prediction_cache:
            logger.info(f"Cache hit for {cache_key}")
            return prediction_cache[cache_key]

        # Rewind so the preprocessor can read the upload from the start.
        await file.seek(0)
        logger.info(f"Processing: {file.filename}")
        audio, sr, metadata = await audio_preprocessor.validate_and_preprocess(file)

        # BUGFIX: no need to seek(0) and re-read the upload here — we already
        # hold the raw bytes from the cache-key read above.
        audio_bytes = file_content

        # Fan out to every model in the ensemble.
        logger.info("Querying models...")
        model_outputs = await ensemble_fusion.query_all_models(http_session, audio_bytes)

        # Require a quorum before trusting the fused prediction.
        if len(model_outputs) < config.ENSEMBLE_CONFIG["min_models_for_prediction"]:
            raise HTTPException(
                status_code=503,
                detail=f"Only {len(model_outputs)}/{len(config.MODELS)} models responded"
            )

        # Fuse per-model outputs with weighted voting.
        result = ensemble_fusion.fuse_predictions(model_outputs)

        # Attach request-level metadata.
        result["processing_time"] = round(time.time() - start_time, 2)
        result["audio_metadata"] = metadata
        result["timestamp"] = datetime.utcnow().isoformat()

        # Cache the result (size-capped; no eviction policy).
        if len(prediction_cache) < config.CACHE_CONFIG["max_size"]:
            prediction_cache[cache_key] = result

        logger.info(f"Analysis complete: {result['primary_emotion']} ({result['processing_time']}s)")
        return result

    except HTTPException:
        raise
    except Exception as e:
        logger.error(f"Error: {str(e)}", exc_info=True)
        raise HTTPException(status_code=500, detail=str(e))
151
@app.get("/docs", include_in_schema=False)
async def custom_docs():
    """Render Swagger UI against this app's OpenAPI schema (pinned CDN assets)."""
    page_title = f"{config.API_TITLE} - Docs"
    return get_swagger_ui_html(
        openapi_url="/openapi.json",
        title=page_title,
        swagger_js_url="https://cdn.jsdelivr.net/npm/swagger-ui-dist@5/swagger-ui-bundle.js",
        swagger_css_url="https://cdn.jsdelivr.net/npm/swagger-ui-dist@5/swagger-ui.css",
    )
161
@app.get("/openapi.json", include_in_schema=False)
async def get_openapi():
    """Build (once, then cached on the app) the OpenAPI schema with bearer auth."""
    # Aliased local import so it no longer shadows this route function's name.
    from fastapi.openapi.utils import get_openapi as build_openapi

    if app.openapi_schema:
        return app.openapi_schema

    openapi_schema = build_openapi(
        title=config.API_TITLE,
        version=config.API_VERSION,
        description="Emotion detection API using ensemble of 5 models",
        routes=app.routes,
    )

    # BUGFIX: "components" is absent when the schema has no component
    # definitions; create it instead of assuming the key exists.
    openapi_schema.setdefault("components", {})["securitySchemes"] = {
        "bearerAuth": {
            "type": "http",
            "scheme": "bearer",
            "description": "Enter your API token"
        }
    }
    # Apply bearer auth globally to all operations.
    openapi_schema["security"] = [{"bearerAuth": []}]

    app.openapi_schema = openapi_schema
    return app.openapi_schema
189
if __name__ == "__main__":
    # Local dev entry point; Hugging Face runs the app via Docker instead.
    import uvicorn

    server_port = int(os.getenv("PORT", 8000))
    uvicorn.run(app, host="0.0.0.0", port=server_port)
app/models/ensemble.py ADDED
File without changes
app/utils/logger.py ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import logging
2
+ import sys
3
+
4
def setup_logging():
    """Simple logging setup: INFO-level messages, timestamped, to stdout."""
    stdout_handler = logging.StreamHandler(sys.stdout)
    logging.basicConfig(
        level=logging.INFO,
        format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
        handlers=[stdout_handler],
    )
requirements.txt ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Core Framework
2
+ fastapi==0.104.1
3
+ uvicorn[standard]==0.24.0
4
+ pydantic==2.5.0
5
+ python-dotenv==1.0.0
6
+
7
+ # Authentication
8
+ python-jose[cryptography]==3.3.0
9
+ passlib[bcrypt]==1.7.4
10
+ python-multipart==0.0.6
11
+
12
+ # HTTP & Async
13
+ aiohttp==3.9.1
14
+ httpx==0.25.1
15
+
16
+ # Audio Processing
17
+ librosa==0.10.1
18
+ soundfile==0.12.1
19
+ pydub==0.25.1
20
+ ffmpeg-python==0.2.0
21
+
22
+ # Scientific Computing
23
+ numpy==1.24.3
24
+ scipy==1.11.4
25
+ scikit-learn==1.3.2
26
+
27
+ # Rate Limiting
28
+ slowapi==0.1.8