Spaces:

rajendrakumarv
/

Anomaly-detection

Runtime error

App Files Files Community

rajendrakumarv

tejovk311 committed on May 28

Commit

ab3e631

verified ·

1 Parent(s): 73769bb

Upload 3 files (#2)

Browse files

- Upload 3 files (3ba492afdd98f2f37520efca605563be71e92e5a)

Co-authored-by: Kattamuri Tejo Vardhan <tejovk311@users.noreply.huggingface.co>

Files changed (3) hide show

Dockerfile.unknown +35 -0
app.py +167 -0
requirements.txt +15 -0

Dockerfile.unknown ADDED Viewed

	@@ -0,0 +1,35 @@

FROM python:3.9-slim
# Install system dependencies for video processing.
# libgl1 is used instead of libgl1-mesa-glx: the latter is only a transitional
# package and is no longer shipped by newer Debian releases, which makes
# `apt-get install` fail when the base image moves to one of them.
RUN apt-get update && apt-get install -y \
    ffmpeg \
    libsm6 \
    libxext6 \
    libxrender-dev \
    libgl1 \
    && rm -rf /var/lib/apt/lists/*
# Set working directory
WORKDIR /app
# Copy requirements file first so the dependency layer is cached across code changes
COPY requirements.txt .
# Install Python dependencies
RUN pip install --no-cache-dir -r requirements.txt
# Copy application code
COPY app.py .
# Create a world-writable directory for temporary files
RUN mkdir -p /tmp/video_processing && chmod 777 /tmp/video_processing
# Set environment variables
ENV PYTHONUNBUFFERED=1
# NOTE(review): app.py falls back to port 7860 when PORT is unset, and Hugging
# Face Docker Spaces route traffic to 7860 unless `app_port` is set in the
# Space README -- confirm that 5000 is really the intended port.
ENV PORT=5000
# Expose port (keep in sync with PORT above)
EXPOSE 5000
# Command to run the application
CMD ["python", "app.py"]

app.py ADDED Viewed

	@@ -0,0 +1,167 @@

+from flask import Flask, request, jsonify
+import os
+import numpy as np
+import torch
+import av
+import cv2
+import tempfile
+import shutil
+import logging
+from transformers import VideoMAEForVideoClassification, VideoMAEImageProcessor
+from PIL import Image
+from torchvision.transforms import Compose, Resize, ToTensor
app = Flask(__name__)

# Logging: INFO and above, emitted through a module-level logger.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Inference state shared by every request. The device is picked once at import
# time; the other three stay None until load_model() fills them in.
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"
model = None
processor = None
transform = None
def load_model():
    """Load the video classifier, its image processor and the frame transform.

    The three objects are cached in the module-level globals ``model``,
    ``processor`` and ``transform``; only a call that finds one of them
    missing does any loading, later calls return the cached objects.

    Returns:
        tuple: ``(model, processor, transform)``.

    Raises:
        Exception: whatever ``from_pretrained`` raises when the checkpoint
            cannot be loaded. In that case none of the globals is modified,
            so a later call retries from scratch.
    """
    global model, processor, transform
    # Check all three, not just `model`, so a partially initialised state can
    # never be handed back to a caller.
    if model is None or processor is None or transform is None:
        model_name = "OPear/videomae-large-finetuned-UCF-Crime"
        logger.info(f"Loading model {model_name} on {device}...")
        # Build everything in locals and publish in one step at the end: if the
        # processor load fails after the model succeeded, the globals must not
        # be left with `model` set and `processor`/`transform` still None.
        loaded_model = VideoMAEForVideoClassification.from_pretrained(model_name).to(device)
        loaded_processor = VideoMAEImageProcessor.from_pretrained(model_name)
        loaded_transform = Compose([
            Resize((224, 224)),
            ToTensor(),
        ])
        model, processor, transform = loaded_model, loaded_processor, loaded_transform
        logger.info("Model loaded successfully")
    return model, processor, transform
def sample_frame_indices(clip_len=16, frame_sample_rate=1, seg_len=0):
    """Choose ``clip_len`` frame indices from a video that has ``seg_len`` frames.

    The clip spans ``int(clip_len * frame_sample_rate)`` consecutive source
    frames. If the video is longer than that span, a window of that size is
    placed at a random position and ``clip_len`` indices are spread evenly
    across it. Otherwise the indices are spread evenly across the whole video,
    which repeats some indices when ``seg_len < clip_len``.

    Args:
        clip_len: Number of indices to return.
        frame_sample_rate: Stride between sampled frames; 1 means consecutive
            frames.
        seg_len: Total number of frames in the video.

    Returns:
        numpy.ndarray: ``clip_len`` non-decreasing integer indices, each in
        ``[0, seg_len - 1]``.

    Raises:
        ValueError: if ``clip_len`` or ``seg_len`` is smaller than 1, or
            ``frame_sample_rate`` is not positive.
    """
    if clip_len < 1:
        raise ValueError(f"clip_len must be at least 1, got {clip_len}")
    if frame_sample_rate <= 0:
        raise ValueError(f"frame_sample_rate must be positive, got {frame_sample_rate}")
    if seg_len < 1:
        # Previously this silently produced an array of -1 indices.
        raise ValueError(f"seg_len must be at least 1, got {seg_len}")

    # Number of source frames the clip covers once the stride is applied.
    window = max(1, int(clip_len * frame_sample_rate))
    if seg_len <= window:
        indices = np.linspace(0, seg_len - 1, num=clip_len, dtype=int)
    else:
        # randint's upper bound is exclusive; "+ 1" lets the window end on the
        # final frame, which was unreachable before.
        end_idx = np.random.randint(window, seg_len + 1)
        start_idx = end_idx - window
        indices = np.linspace(start_idx, end_idx - 1, num=clip_len, dtype=int)
    # Final safety net against any rounding outside the valid range.
    return np.clip(indices, 0, seg_len - 1)
def _opencv_frame_count(video_path):
    """Return OpenCV's frame-count estimate for ``video_path``."""
    cap = cv2.VideoCapture(video_path)
    try:
        return int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
    finally:
        # Always release the capture handle, even if the query raises.
        cap.release()


def _decode_with_pyav(container, wanted):
    """Decode the stream once with PyAV; return ``{index: RGB array}`` for ``wanted``."""
    last_wanted = max(wanted)
    found = {}
    container.seek(0)
    for i, frame in enumerate(container.decode(video=0)):
        if i > last_wanted:
            break  # nothing further is needed, stop decoding early
        if i in wanted:
            found[i] = frame.to_ndarray(format="rgb24")
    return found


def _decode_with_opencv(video_path, wanted):
    """Seek to each wanted index with OpenCV; return ``{index: RGB array}``."""
    found = {}
    cap = cv2.VideoCapture(video_path)
    try:
        for i in sorted(wanted):
            cap.set(cv2.CAP_PROP_POS_FRAMES, i)
            ret, frame = cap.read()
            if ret:
                # OpenCV yields BGR; convert so both decoders return RGB.
                found[i] = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    finally:
        cap.release()
    return found


def process_video(video_path, clip_len=16):
    """Extract ``clip_len`` RGB frames from the video at ``video_path``.

    The frame count is read from the container (falling back to OpenCV's
    estimate when the container reports none), indices are chosen with
    ``sample_frame_indices`` and the frames are decoded with PyAV. If PyAV
    does not deliver every requested frame, extraction is retried with OpenCV.

    Args:
        video_path: Path of the video file on disk.
        clip_len: Number of frames to extract.

    Returns:
        tuple: ``(frames, indices)`` where ``frames`` is the stacked array of
        the selected frames in index order and ``indices`` are the sampled
        frame indices, or ``(None, None)`` if the video cannot be opened or
        the requested number of frames cannot be extracted.
    """
    try:
        container = av.open(video_path)
    except Exception as e:
        logger.error(f"Error opening video: {str(e)}")
        return None, None

    # `with` closes the container on every exit path; it used to be leaked.
    with container:
        try:
            seg_len = container.streams.video[0].frames
            if seg_len <= 0:
                seg_len = _opencv_frame_count(video_path)
        except Exception as e:
            logger.error(f"Error opening video: {str(e)}")
            return None, None
        if seg_len <= 0:
            logger.error("Could not determine the number of frames in the video")
            return None, None

        indices = sample_frame_indices(clip_len=clip_len, seg_len=seg_len)
        # Short videos produce repeated indices; decode each distinct frame
        # once and repeat it when assembling the clip below.
        wanted = {int(i) for i in indices}
        try:
            found = _decode_with_pyav(container, wanted)
        except Exception as e:
            logger.error(f"Error decoding video with PyAV: {str(e)}")
            found = {}

    if wanted - found.keys():
        logger.info("Falling back to OpenCV for frame extraction")
        found = _decode_with_opencv(video_path, wanted)

    frames = [found[int(i)] for i in indices if int(i) in found]
    if len(frames) != clip_len:
        logger.error(f"Could not extract {clip_len} frames, got {len(frames)}")
        return None, None
    return np.stack(frames), indices
def predict_video(frames):
    """Classify a clip of RGB frames and return the predicted label.

    Each frame is converted to a PIL image and passed through the cached
    transform; the resulting tensors are handed to the image processor and the
    model is run without gradient tracking.

    Args:
        frames: Iterable of RGB frame arrays accepted by ``Image.fromarray``.

    Returns:
        The ``id2label`` entry for the highest-scoring class, or ``"Unknown"``
        when that class id has no entry.
    """
    net, image_processor, to_tensor = load_model()
    stacked = torch.stack([to_tensor(Image.fromarray(rgb)) for rgb in frames])
    # The transform has already produced float tensors, so the processor is
    # told not to rescale the pixel values again.
    batch = image_processor(list(stacked), return_tensors="pt", do_rescale=False)
    batch = {name: tensor.to(device) for name, tensor in batch.items()}
    with torch.no_grad():  # inference only
        logits = net(**batch).logits
    class_id = logits.argmax(-1).item()
    return net.config.id2label.get(class_id, "Unknown")
@app.route('/classify-video', methods=['POST'])
def classify_video():
    """Classify an uploaded video.

    Expects a multipart POST with the file in the ``video`` field.

    Returns:
        200 ``{"prediction": <label>}`` on success,
        400 ``{"error": ...}`` when no file is supplied or it cannot be processed,
        500 ``{"error": ...}`` on any unexpected failure.
    """
    if 'video' not in request.files:
        logger.warning("No video file in request")
        return jsonify({'error': 'No video file provided'}), 400
    video_file = request.files['video']
    # `not` also covers a missing (None) filename, not just the empty string.
    if not video_file.filename:
        logger.warning("Empty video filename")
        return jsonify({'error': 'No video selected'}), 400
    # SECURITY: never join the client-supplied filename into a path. A name
    # such as "../../x" or "/etc/x" would make os.path.join escape the
    # temporary directory. Keep only a plain alphanumeric extension, which is
    # all the decoders could use as a format hint.
    suffix = os.path.splitext(os.path.basename(video_file.filename))[1]
    if not suffix[1:].isalnum():
        suffix = ''
    # Create temporary directory
    temp_dir = tempfile.mkdtemp()
    video_path = os.path.join(temp_dir, f"upload{suffix}")
    try:
        # Save the uploaded video
        logger.info(f"Saving uploaded video to {video_path}")
        video_file.save(video_path)
        # Process the video
        logger.info("Processing video...")
        frames, indices = process_video(video_path)
        if frames is None:
            return jsonify({'error': 'Failed to process video file'}), 400
        # Get the prediction
        logger.info("Running prediction...")
        prediction = predict_video(frames)
        logger.info(f"Prediction result: {prediction}")
        return jsonify({'prediction': prediction})
    except Exception as e:
        logger.exception(f"Error processing video: {str(e)}")
        return jsonify({'error': f'Error processing video: {str(e)}'}), 500
    finally:
        # Clean up the temporary directory and its contents. ignore_errors
        # keeps a cleanup failure from replacing the response built above.
        if os.path.exists(temp_dir):
            logger.info(f"Cleaning up temporary directory: {temp_dir}")
            shutil.rmtree(temp_dir, ignore_errors=True)
@app.route('/health', methods=['GET'])
def health_check():
    """Liveness probe: always answers 200 with ``{"status": "healthy"}``."""
    payload = {"status": "healthy"}
    return jsonify(payload), 200
if __name__ == '__main__':
    logger.info("Initializing application...")
    # Load the model up front, before the server starts accepting requests.
    load_model()
    # The PORT environment variable wins; 7860 is the fallback when it is unset.
    port = int(os.getenv('PORT', 7860))
    logger.info(f"Starting Flask application on port {port}")
    app.run(host='0.0.0.0', port=port, debug=False)

requirements.txt ADDED Viewed

	@@ -0,0 +1,15 @@

+Flask==3.1.1
+av==14.4.0
+opencv-python==4.11.0.86
+numpy==2.0.2
+pillow==11.2.1
+torch==2.7.0
+torchvision==0.22.0
+transformers==4.52.3
+huggingface-hub==0.32.0
+requests==2.32.3
+pyyaml==6.0.2
+tqdm==4.67.1
+regex==2024.11.6
+filelock==3.18.0
+packaging==24.2