Spaces:

caltech-fish-counting
/

fisheye-experimental

Runtime error

App Files Files Community

fisheye-experimental / annotation_handler.py

oskarastrom

Upload old results

592e4db 11 months ago

raw

history blame

No virus

2.32 kB

	from dataloader import create_dataloader_aris
	from aris import BEAM_WIDTH_DIR
	import json
	import cv2
	import base64

	VIDEO_HEIGHT = 700

	def load_frames(video_path, preds):
	"""Load frames for annotation editing
	"""

	dataloader, dataset = create_dataloader_aris(video_path, BEAM_WIDTH_DIR, None)

	didson = dataset.didson

	frames = didson.load_frames(start_frame=0)
	frame_info, h, w = get_frame_info(frames, preds)

	return frame_info

	def get_frame_info(frames, preds):
	"""Get visualized video frames ready for output, given raw ARIS/DIDSON frames.
	Warning: all frames in frames will be stored in memory - careful of OOM errors. Consider processing large files
	in batches, such as in generate_video_batches()

	Returns:
	list(np.ndarray), height (int), width (int)
	"""
	color_map = { fish['id'] : fish['color'] for fish in preds['fish'] }

	frame_info = []
	if len(frames):
	# assumes all frames the same size
	h, w = frames[0].shape

	# enforce a standard size so that text/box thickness is consistent
	scale_factor = VIDEO_HEIGHT / h
	h = VIDEO_HEIGHT
	w = int(scale_factor*w)

	num_frames = min(len(frames), len(preds['frames']))

	for i, frame_raw in enumerate(frames[:num_frames]):
	image = cv2.resize(cv2.cvtColor(frame_raw, cv2.COLOR_GRAY2BGR), (w,h))
	retval, buffer = cv2.imencode('.jpg', image)
	jpg_as_text = base64.b64encode(buffer).decode("utf-8")

	frame = {
	'annotations': [],
	'frame': jpg_as_text
	}
	for fish in preds['frames'][i]['fish']:
	xmin, ymin, xmax, ymax = fish['bbox']
	hexx = color_map[fish['fish_id']].lstrip('#')
	frame['annotations'].append({
	'bbox': {
	'left': int(round(xmin * w)),
	'right': int(round(xmax * w)),
	'top': int(round(ymin * h)),
	'bottom': int(round(ymax * h)),
	},
	'id': str(fish['fish_id']),
	'conf': fish['conf']
	})
	frame_info.append(frame)

	return frame_info, h, w