# -*- coding: utf-8 -*-
"""app.ipynb

Automatically generated by Colaboratory.

Original file is located at
    https://colab.research.google.com/drive/1WeNkl1pYnT0qeOTsUFooLFLJ1arRHC00
"""

# %pip install ultralytics -q
# %pip install gradio -q

import os

import cv2
import gradio as gr
import numpy as np
import PIL.Image as Image
from ultralytics import YOLO

# load trained model
model = YOLO("best.onnx")


# image inference function
def predict_image(img, conf_threshold, iou_threshold):
    results = model.predict(
        source=img,
        conf=conf_threshold,
        iou=iou_threshold,
        show_labels=True,
        show_conf=True,
        imgsz=640,
    )
    for r in results:
        im_array = r.plot()  # annotated frame as a BGR numpy array
        im = Image.fromarray(im_array[..., ::-1])  # BGR -> RGB for PIL
    return im


# directories for example files
image_directory = "/home/user/app/image"
video_directory = "/home/user/app/video"

# gradio interface settings for image inference
image_iface = gr.Interface(
    fn=predict_image,
    inputs=[
        gr.Image(type="pil", label="Upload Image"),
        gr.Slider(minimum=0, maximum=1, value=0.25, label="Confidence threshold"),
        gr.Slider(minimum=0, maximum=1, value=0.45, label="IoU threshold"),
    ],
    outputs=gr.Image(type="pil", label="Result"),
    title="Fire Detection using YOLOv8n on Gradio",
    description="Upload an image for inference with a trained Ultralytics YOLOv8n model.",
    examples=[
        [os.path.join(image_directory, "fire_image_1.jpg"), 0.25, 0.45],
        [os.path.join(image_directory, "fire_image_3.jpg"), 0.25, 0.45],
    ],
)


# convert a PIL image to an OpenCV BGR array (helper; not called by the interfaces)
def pil_to_cv2(pil_image):
    return cv2.cvtColor(np.array(pil_image), cv2.COLOR_RGB2BGR)


# process a video frame by frame, yielding each annotated frame as a PIL image
def process_video(video_path):
    cap = cv2.VideoCapture(video_path)
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            break
        pil_img = Image.fromarray(frame[..., ::-1])  # OpenCV frame is BGR; convert to RGB
        result = model.predict(source=pil_img)
        for r in result:
            im_array = r.plot()  # annotated frame as a BGR numpy array
            processed_frame = Image.fromarray(im_array[..., ::-1])  # BGR -> RGB for PIL
            yield processed_frame  # yield frames one by one so Gradio streams them
    cap.release()
    # To compile the annotated frames into a video file instead of streaming them,
    # see the save_processed_video sketch at the bottom of this file.


# gradio interface settings for video inference
video_iface = gr.Interface(
    fn=process_video,  # generator function, so the output image updates per frame
    inputs=[
        gr.Video(label="Upload Video", interactive=True),
    ],
    outputs=gr.Image(type="pil", label="Result"),
    title="Fire Detection using YOLOv8n on Gradio",
    description="Upload a video for inference with a trained Ultralytics YOLOv8n model.",
    examples=[
        [os.path.join(video_directory, "video_fire_1.mp4")],
        [os.path.join(video_directory, "video_fire_2.mp4")],
    ],
)

demo = gr.TabbedInterface(
    [image_iface, video_iface], ["Image Inference", "Video Inference"]
)

if __name__ == "__main__":
    demo.launch()
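

# Optional helper: a minimal sketch (not wired into the Gradio app) showing how
# to compile the annotated frames back into a video file with cv2.VideoWriter,
# as the comment in process_video suggests. The output path and the "mp4v"
# fourcc are assumptions; adjust them for your environment. In practice, define
# this above the __main__ guard, since demo.launch() blocks when run as a script.
def save_processed_video(video_path, output_path="processed_output.mp4"):
    cap = cv2.VideoCapture(video_path)
    fps = cap.get(cv2.CAP_PROP_FPS) or 25.0  # fall back to 25 fps if unreported
    writer = None
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            break
        pil_img = Image.fromarray(frame[..., ::-1])  # BGR -> RGB for inference
        result = model.predict(source=pil_img)
        annotated = result[0].plot()  # annotated frame as a BGR numpy array
        if writer is None:  # lazily create the writer once the frame size is known
            h, w = annotated.shape[:2]
            writer = cv2.VideoWriter(
                output_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h)
            )
        writer.write(annotated)  # VideoWriter expects BGR, so no conversion needed
    cap.release()
    if writer is not None:
        writer.release()
    return output_path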