Abs6187 committed on
Commit 47ee765
1 Parent(s): f4defdf

Update app.py

Files changed (1)
  app.py +97 -38
app.py CHANGED
@@ -1,51 +1,110 @@
- # app.py
  import gradio as gr
  import cv2
  import numpy as np
- from model import SuspiciousActivityModel  # Import the model

- # Initialize the model paths
- lstm_model_path = 'suspicious_activity_model.h5'  # Path to your LSTM model
- yolo_model_path = 'yolov8n-pose.pt'  # Path to your YOLO model

- # Initialize the suspicious activity model
- model = SuspiciousActivityModel(lstm_model_path, yolo_model_path)

- # Function to process video frame
- def process_video(video_frame):
-     # Check if the input frame is a valid NumPy array
-     if isinstance(video_frame, np.ndarray):
-         print(f"Frame shape: {video_frame.shape}")  # Print the shape of the frame for debugging

-         # Convert frame from BGR to RGB (OpenCV uses BGR by default)
-         try:
-             frame_rgb = cv2.cvtColor(video_frame, cv2.COLOR_BGR2RGB)
-         except cv2.error as e:
-             print(f"Error in cvtColor: {e}")
-             return video_frame  # Return the original frame if error occurs
-
-         # Call model to detect activity in the frame
-         label = model.detect_activity(frame_rgb)

-         # Add label to the frame (Optional: you can also draw bounding boxes)
-         cv2.putText(frame_rgb, label, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 0), 2, cv2.LINE_AA)

-         # Convert back to BGR for Gradio (since it expects BGR format)
-         frame_bgr = cv2.cvtColor(frame_rgb, cv2.COLOR_RGB2BGR)
-         return frame_bgr
-     else:
-         print("Received invalid frame format")
-         return video_frame  # Return the original frame if it's not valid

- # Gradio interface
  iface = gr.Interface(
-     fn=process_video,  # Function that processes each frame
-     inputs=gr.Video(type="webcam", streaming=True),  # Use webcam as input
-     outputs=gr.Video(),  # Output is also a video
-     live=True,  # Stream the video in real time
-     title="Suspicious Activity Detection"  # Interface title
  )

- # Launch the app with public link
- if __name__ == "__main__":
-     iface.launch(share=True)  # Set share=True to create a public link

  import gradio as gr
  import cv2
  import numpy as np
+ from tensorflow.keras.models import load_model
+ from sklearn.preprocessing import StandardScaler
+ from ultralytics import YOLO

+ # Load models
+ lstm_model = load_model('suspicious_activity_model.h5')
+ yolo_model = YOLO('yolov8n-pose.pt')  # Ensure this model supports keypoint detection
+ scaler = StandardScaler()

+ def extract_keypoints(frame):
+     """
+     Extracts normalized keypoints from a frame using YOLO pose model.
+     """
+     results = yolo_model(frame, verbose=False)
+     for r in results:
+         if r.keypoints is not None and len(r.keypoints) > 0:
+             # Extract the first detected person's keypoints
+             keypoints = r.keypoints.xyn.tolist()[0]  # Use the first person's keypoints
+             flattened_keypoints = [kp for keypoint in keypoints for kp in keypoint[:2]]  # Flatten x, y values
+             return flattened_keypoints
+     return None  # Return None if no keypoints are detected

+ def process_frame(frame):
+     """
+     Process each frame for suspicious activity detection
+     """
+     # Perform YOLO detection
+     results = yolo_model(frame, verbose=False)
+     for box in results[0].boxes:
+         cls = int(box.cls[0])  # Class ID
+         confidence = float(box.conf[0])

+         # Detect persons only (class_id 0 for 'person')
+         if cls == 0 and confidence > 0.5:
+             x1, y1, x2, y2 = map(int, box.xyxy[0])  # Bounding box coordinates
+
+             # Extract ROI for classification
+             roi = frame[y1:y2, x1:x2]
+             if roi.size > 0:
+                 # Preprocess ROI to extract keypoints
+                 keypoints = extract_keypoints(roi)
+
+                 if keypoints is not None and len(keypoints) > 0:
+                     # Standardize and reshape keypoints for LSTM input
+                     keypoints_scaled = scaler.fit_transform([keypoints])  # Standardize features
+                     keypoints_reshaped = keypoints_scaled.reshape((1, 1, len(keypoints)))  # Reshape for LSTM
+
+                     # Predict with LSTM model
+                     prediction = (lstm_model.predict(keypoints_reshaped) > 0.5).astype(int)[0][0]
+
+                     # Draw bounding box and label
+                     color = (0, 0, 255) if prediction == 1 else (0, 255, 0)
+                     label = 'Suspicious' if prediction == 1 else 'Normal'
+                     cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2)
+                     cv2.putText(frame, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
+                 else:
+                     print("No valid keypoints detected for ROI. Skipping frame.")
+             else:
+                 print("ROI size is zero. Skipping frame.")
+
+     return frame
+
+ def detect_suspicious_activity(input_video):
+     """
+     Main function to process video for suspicious activity detection
+     """
+     # Open video capture
+     cap = cv2.VideoCapture(input_video)
+
+     # Prepare to save output video
+     width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+     height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+     fps = cap.get(cv2.CAP_PROP_FPS)
+
+     # Create VideoWriter object
+     fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+     out = cv2.VideoWriter('output_video.mp4', fourcc, fps, (width, height))
+
+     # Process each frame
+     while cap.isOpened():
+         ret, frame = cap.read()
+         if not ret:
+             break

+         # Process and annotate frame
+         processed_frame = process_frame(frame)

+         # Write processed frame to output video
+         out.write(processed_frame)
+
+     # Release resources
+     cap.release()
+     out.release()
+
+     return 'output_video.mp4'

+ # Create Gradio interface
  iface = gr.Interface(
+     fn=detect_suspicious_activity,
+     inputs=gr.Video(label="Upload Video"),
+     outputs=gr.Video(label="Processed Video"),
+     title="Suspicious Activity Detection",
+     description="Upload a video to detect suspicious activities using YOLO and LSTM models"
  )

+ # Launch the interface
+ iface.launch()
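
A note on the standardization step in the new version: scaler = StandardScaler() is created unfitted, and scaler.fit_transform([keypoints]) re-fits it on a single sample at every detection. With only one sample the per-feature variance is zero, so the transform returns an all-zero vector and the LSTM sees the same input regardless of the pose. The usual remedy is to fit the scaler once on the training data and call only transform() at inference. A minimal sketch, assuming the training-time scaler was saved with joblib; the filename 'scaler.pkl' and the helper name are hypothetical:

import joblib

# Assumed artifact: a StandardScaler fitted on the training keypoints
scaler = joblib.load('scaler.pkl')

def scale_keypoints(keypoints):
    # transform() applies the stored training mean/std without re-fitting,
    # so a single keypoint vector is not collapsed to zeros
    return scaler.transform([keypoints])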
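
Relatedly, the reshape to (1, 1, len(keypoints)) means the LSTM's input width silently follows whatever length extract_keypoints returns, so a detection with an unexpected keypoint count would change the input shape between frames and fail at predict time. A fixed-width guard avoids that; the sketch assumes the 17 COCO keypoints that yolov8n-pose emits (34 x/y values), and EXPECTED_FEATURES / prepare_for_lstm are illustrative names:

import numpy as np

EXPECTED_FEATURES = 34  # assumption: 17 COCO keypoints x 2 normalized coordinates

def prepare_for_lstm(keypoints):
    # Pad with zeros or truncate so every frame presents the same feature width
    padded = (list(keypoints) + [0.0] * EXPECTED_FEATURES)[:EXPECTED_FEATURES]
    return np.asarray(padded, dtype=np.float32).reshape(1, 1, EXPECTED_FEATURES)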
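
Finally, cv2.CAP_PROP_FPS can report 0 for some containers, which would make the VideoWriter produce an unplayable output_video.mp4. A small fallback before constructing the writer (the 25.0 default is an arbitrary assumption):

fps = cap.get(cv2.CAP_PROP_FPS)
if not fps or fps <= 0:
    fps = 25.0  # assumed default when the container does not report a frame rate

Note also that the new version drops share=True from iface.launch(): run locally, Gradio prints a local URL, and share=True can be re-added for a temporary public link as in the previous version.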