Spaces:

kios
/

yolo_vessel_weights

Runtime error

App Files Files Community

yolo_vessel_weights / app.py

kios

Fixed a bug in app.py where an error was raised when no objects were detected

254290f almost 3 years ago

raw

history blame contribute delete

8.09 kB

	# Imports
	import cv2
	from detector import Detector
	from pathlib import Path
	import gradio as gr
	import os
	import numpy as np
	import csv
	import matplotlib.pyplot as plt
	import pandas as pd

	# Weights, config and class-names files that are handed to the detector
	chosen_names = "cfg/vessel.names"
	chosen_config_file = "cfg/vessels_tyv4.cfg"
	chosen_weights = "cfg/vessels_tyv4.weights"

	# Read one class label per line; detected class ids are used as indices into labels
	with open(chosen_names) as f:
	    classes = [entry.strip() for entry in f]
	labels = np.array(classes, dtype=str)

	# Function for analyzing images
	def analyze_image(selected_image, chosen_conf_thresh, chosen_nms_thresh):
	    """Run the detector on a single image and export the detections.

	    Args:
	        selected_image: Image coming from the Gradio image input. It is
	            passed unchanged to ``Detector.detect``.
	        chosen_conf_thresh: Confidence threshold forwarded to the detector.
	        chosen_nms_thresh: Non-maxima-suppression threshold forwarded to
	            the detector.

	    Returns:
	        A tuple ``(img_det, csv_path, preview)`` where ``img_det`` is the
	        first value returned by ``Detector.detect`` (presumably the
	        annotated image - confirm against detector.py), ``csv_path`` is
	        ``"Classes.csv"`` holding every detection, and ``preview`` is a
	        DataFrame with at most the first ten detections.

	    Raises:
	        RuntimeError: If no image was supplied.
	    """
	    columns = ["Class", "X", "Y", "Width", "Height", "Score"]

	    # Delete the output file of a previous run
	    if os.path.exists("Classes.csv"):
	        os.remove("Classes.csv")

	    if selected_image is None:
	        raise RuntimeError("No image found!")

	    print("Starting image scan")

	    # Initialize the detector
	    detector = Detector(
	        weights=str(chosen_weights),
	        config_file=str(chosen_config_file),
	        classes_file=chosen_names,
	        conf_thresh=chosen_conf_thresh,
	        nms_thresh=chosen_nms_thresh,
	    )

	    # Detect the image
	    img_det, classes_id, scores, boxes = detector.detect(selected_image)

	    # An image without detections simply yields no rows
	    class_names = [labels[class_id] for class_id in classes_id]
	    tags = [
	        [str(name), str(box[0]), str(box[1]), str(box[2]), str(box[3]), str(score)]
	        for name, box, score in zip(class_names, boxes, scores)
	    ]

	    print("Image scan finished succefully.")

	    # Save tags in a csv file. newline="" lets the csv module control the
	    # line endings, and the with-statement closes the file on exit.
	    with open("Classes.csv", "w", newline="") as f:
	        writer = csv.writer(f)
	        writer.writerow(columns)
	        writer.writerows(tags)

	    df = pd.DataFrame(tags, columns=columns)

	    return img_det, "Classes.csv", df.head(10)

	# Function for analyzing video
	def analyze_video(selected_video, chosen_conf_thresh, chosen_nms_thresh, start_sec, duration):
	    """Run the detector on a time window of a video and export the results.

	    Frames are numbered from 0, starting with the first frame of the video.
	    Every frame from ``round(start_sec * fps)`` up to and including
	    ``round(start_frame + duration * fps)`` is passed to the detector and
	    written to the output video.

	    Args:
	        selected_video: Video source handed to ``cv2.VideoCapture``.
	        chosen_conf_thresh: Confidence threshold forwarded to the detector.
	        chosen_nms_thresh: Non-maxima-suppression threshold forwarded to
	            the detector.
	        start_sec: Second of the video at which the scan starts.
	        duration: Length of the scanned window in seconds.

	    Returns:
	        A tuple ``(video_path, fig, csv_path, preview)``: ``"output.mp4"``
	        (the ffmpeg re-encoded result), a matplotlib figure plotting the
	        number of detections per class for every scanned frame,
	        ``"Classes.csv"`` holding every detection, and a DataFrame with at
	        most the first ten detections.

	    Raises:
	        RuntimeError: If no video was supplied, the stream cannot be read,
	            the start second lies beyond the available frames, or the
	            ffmpeg conversion fails.
	    """
	    columns = ["Class", "X", "Y", "Width", "Height", "Score", "Frame"]

	    # Delete the output files of a previous run
	    for stale_file in ("demo_film.mp4", "output.mp4", "Classes.csv"):
	        if os.path.exists(stale_file):
	            os.remove(stale_file)

	    if selected_video is None:
	        raise RuntimeError("No video found!")

	    print("Starting video scan")

	    save_file_name = "demo_film.mp4"
	    tags = []
	    # class name -> {frame id -> detections in that frame}; insertion order
	    # keeps the classes in the order in which they were first seen
	    objects_per_frame = {}
	    vid_out = None
	    frame_id = 0

	    # Capture the video input
	    video = cv2.VideoCapture(selected_video)
	    try:
	        ret, frame = video.read()
	        if not ret:  # Checking
	            raise RuntimeError("Cannot read video stream!")

	        # Calculate start and end frame
	        total_frames = round(video.get(cv2.CAP_PROP_FRAME_COUNT))
	        fps = video.get(cv2.CAP_PROP_FPS)
	        start_frame = round(start_sec * fps)
	        end_frame = round(start_frame + (duration * fps))

	        if start_frame > total_frames:
	            raise RuntimeError("Start second is out of bounds!")

	        # Initialize the detector
	        detector = Detector(
	            weights=str(chosen_weights),
	            config_file=str(chosen_config_file),
	            classes_file=chosen_names,
	            conf_thresh=chosen_conf_thresh,
	            nms_thresh=chosen_nms_thresh,
	        )

	        # The frame read for the stream check above is frame 0, so it is
	        # processed here instead of being thrown away.
	        while ret and frame_id <= end_frame:
	            if frame is not None:
	                if frame_id >= start_frame:
	                    # Detect the image
	                    img_det, classes_id, scores, boxes = detector.detect(frame)

	                    class_names = [labels[class_id] for class_id in classes_id]
	                    for name, box, score in zip(class_names, boxes, scores):
	                        class_name = str(name)
	                        tags.append([class_name, str(box[0]), str(box[1]), str(box[2]), str(box[3]), str(score), str(frame_id)])
	                        per_frame = objects_per_frame.setdefault(class_name, {})
	                        per_frame[frame_id] = per_frame.get(frame_id, 0) + 1

	                    # video writer, created once the size of the first
	                    # processed frame is known
	                    if vid_out is None:
	                        height, width = img_det.shape[:2]
	                        out_fps = fps if 15 < fps <= 30 else 15
	                        vid_out = cv2.VideoWriter(save_file_name, cv2.VideoWriter_fourcc(*"MP4V"), out_fps, (width, height))
	                    vid_out.write(img_det)

	                frame_id += 1

	            # Read the next image; ret turns False on error or end of stream
	            ret, frame = video.read()
	    finally:
	        # Release videos, also when an error interrupts the scan
	        video.release()
	        if vid_out is not None:
	            vid_out.release()

	    # No writer means the stream ended before the start frame was reached
	    if vid_out is None:
	        raise RuntimeError("Start second is out of bounds!")

	    # Save tags in a csv file. newline="" lets the csv module control the
	    # line endings, and the with-statement closes the file on exit.
	    with open("Classes.csv", "w", newline="") as f:
	        writer = csv.writer(f)
	        writer.writerow(columns)
	        writer.writerows(tags)

	    # The stream may end before the requested end frame; plot only the
	    # frames that were actually read (frame_id - 1 is the last one).
	    end_frame = min(end_frame, frame_id - 1)

	    # Create graph
	    plt.switch_backend("agg")
	    fig = plt.figure()

	    df = pd.DataFrame(tags, columns=columns)

	    # Plot one line per class: how many times it appears in each frame
	    frame_range = list(range(start_frame, end_frame + 1))
	    for object_name, per_frame in objects_per_frame.items():
	        obj_per_frame = [per_frame.get(i, 0) for i in frame_range]
	        plt.plot(frame_range, obj_per_frame, label=object_name)

	    plt.title("Objects per frame")
	    plt.ylabel("Objects")
	    plt.xlabel("Frame")
	    if objects_per_frame:
	        # Without detections there is no labelled line to put in a legend
	        plt.legend()

	    print("Video scan finished succefully.")

	    # Changes video fourcc to h264 so that it can be displayed in the browser
	    if os.system("ffmpeg -i demo_film.mp4 -vcodec libx264 -f mp4 output.mp4") != 0:
	        raise RuntimeError("Could not convert the video with ffmpeg!")

	    return "output.mp4", fig, "Classes.csv", df.head(10)


	# Gradio interfaces take as mandatory parameters an input function, the input type(s) and the output type(s)
	# Demo is hosted on http://localhost:7860/

	# Examples: one row per example, one value per input component of the interface
	image_examples = [
	    ["examples/vessels.png", 0.20, 0.40],
	    ["examples/boat.png", 0.25, 0.40],
	]
	video_examples = [["examples/vessels.mp4", 0.25, 0.40, 0, 10]]

	# Image interface
	# allow_flagging takes the string "never" here; the boolean form is deprecated in Gradio
	image_interface = gr.Interface(
	    fn=analyze_image,
	    inputs=[
	        gr.Image(label="Image"),
	        gr.Slider(0, 1, value=0.25, label="Confidence Threshold"),
	        gr.Slider(0, 1, value=0.40, label="Non Maxima Supression threshold"),
	    ],
	    outputs=[
	        gr.Image(label="Image"),
	        gr.File(label="All classes"),
	        gr.Dataframe(label="Ten first classes", headers=["Class", "X", "Y", "Width", "Height", "Score"]),
	    ],
	    allow_flagging="never",
	    cache_examples=False,
	    examples=image_examples,
	)

	# Video interface
	# allow_flagging takes the string "never" here; the boolean form is deprecated in Gradio
	video_interface = gr.Interface(
	    fn=analyze_video,
	    inputs=[
	        gr.Video(label="Video"),
	        gr.Slider(0, 1, value=0.25, label="Confidence Threshold"),
	        gr.Slider(0, 1, value=0.40, label="Non Maxima Supression threshold"),
	        gr.Slider(0, 60, value=0, label="Start Second", step=1),
	        gr.Slider(1, 10, value=4, label="Duration", step=1),
	    ],
	    outputs=[
	        gr.Video(label="Video"),
	        gr.Plot(label="Objects per frame"),
	        gr.File(label="All classes"),
	        gr.Dataframe(label=" Ten first classes", headers=["Class", "X", "Y", "Width", "Height", "Score", "Frame"]),
	    ],
	    allow_flagging="never",
	    cache_examples=False,
	    examples=video_examples,
	)

	# Show both interfaces as tabs of one app and start the server
	gr.TabbedInterface(
	    [video_interface, image_interface],
	    ["Scan Videos", "Scan Images"],
	).launch()