Spaces:

stevengrove
/

YOLO-World

Running on T4

YOLO-World / yolo_world /easydeploy /examples /main_onnxruntime.py

stevengrove

initial commit

186701e 9 months ago

3.74 kB

	import math
	import sys
	from argparse import ArgumentParser
	from pathlib import Path

	import cv2
	import onnxruntime
	from config import (CLASS_COLORS, CLASS_NAMES, ModelType, YOLOv5_ANCHORS,
	YOLOv7_ANCHORS)
	from cv2_nms import non_max_suppression
	from numpy_coder import Decoder
	from preprocess import Preprocess
	from tqdm import tqdm

	# Add __FILE__ to sys.path
	sys.path.append(str(Path(__file__).resolve().parents[0]))

	IMG_EXTENSIONS = ('.jpg', '.jpeg', '.png', '.ppm', '.bmp', '.pgm', '.tif',
	'.tiff', '.webp')


	def path_to_list(path: str):
	path = Path(path)
	if path.is_file() and path.suffix in IMG_EXTENSIONS:
	res_list = [str(path.absolute())]
	elif path.is_dir():
	res_list = [
	str(p.absolute()) for p in path.iterdir()
	if p.suffix in IMG_EXTENSIONS
	]
	else:
	raise RuntimeError
	return res_list


	def parse_args():
	parser = ArgumentParser()
	parser.add_argument(
	'img', help='Image path, include image file, dir and URL.')
	parser.add_argument('onnx', type=str, help='Onnx file')
	parser.add_argument('--type', type=str, help='Model type')
	parser.add_argument(
	'--img-size',
	nargs='+',
	type=int,
	default=[640, 640],
	help='Image size of height and width')
	parser.add_argument(
	'--out-dir', default='./output', type=str, help='Path to output file')
	parser.add_argument(
	'--show', action='store_true', help='Show the detection results')
	parser.add_argument(
	'--score-thr', type=float, default=0.3, help='Bbox score threshold')
	parser.add_argument(
	'--iou-thr', type=float, default=0.7, help='Bbox iou threshold')
	args = parser.parse_args()
	return args


	def main():
	args = parse_args()
	out_dir = Path(args.out_dir)
	model_type = ModelType(args.type.lower())

	if not args.show:
	out_dir.mkdir(parents=True, exist_ok=True)

	files = path_to_list(args.img)
	session = onnxruntime.InferenceSession(
	args.onnx, providers=['CPUExecutionProvider'])
	preprocessor = Preprocess(model_type)
	decoder = Decoder(model_type, model_only=True)
	if model_type == ModelType.YOLOV5:
	anchors = YOLOv5_ANCHORS
	elif model_type == ModelType.YOLOV7:
	anchors = YOLOv7_ANCHORS
	else:
	anchors = None

	for file in tqdm(files):
	image = cv2.imread(file)
	image_h, image_w = image.shape[:2]
	img, (ratio_w, ratio_h) = preprocessor(image, args.img_size)
	features = session.run(None, {'images': img})
	decoder_outputs = decoder(
	features,
	args.score_thr,
	num_labels=len(CLASS_NAMES),
	anchors=anchors)
	nmsd_boxes, nmsd_scores, nmsd_labels = non_max_suppression(
	*decoder_outputs, args.score_thr, args.iou_thr)
	for box, score, label in zip(nmsd_boxes, nmsd_scores, nmsd_labels):
	x0, y0, x1, y1 = box
	x0 = math.floor(min(max(x0 / ratio_w, 1), image_w - 1))
	y0 = math.floor(min(max(y0 / ratio_h, 1), image_h - 1))
	x1 = math.ceil(min(max(x1 / ratio_w, 1), image_w - 1))
	y1 = math.ceil(min(max(y1 / ratio_h, 1), image_h - 1))
	cv2.rectangle(image, (x0, y0), (x1, y1), CLASS_COLORS[label], 2)
	cv2.putText(image, f'{CLASS_NAMES[label]}: {score:.2f}',
	(x0, y0 - 5), cv2.FONT_HERSHEY_SIMPLEX, 0.5,
	(0, 255, 255), 2)
	if args.show:
	cv2.imshow('result', image)
	cv2.waitKey(0)
	else:
	cv2.imwrite(f'{out_dir / Path(file).name}', image)


	if __name__ == '__main__':
	main()