Spaces:

hantech
/

EasyOCR-VietOCR

Runtime error

App Files Files Community

EasyOCR-VietOCR / app.py

hantech

Update app.py

1527fb7 about 1 year ago

raw

history blame

3.95 kB

	import pandas as pd
	import PIL
	from PIL import Image
	from PIL import ImageDraw
	import gradio as gr
	import torch
	import easyocr
	import omegaconf

	from vietocr.model.transformerocr import VietOCR
	from vietocr.model.vocab import Vocab
	from vietocr.translate import translate, process_input

	config = omegaconf.OmegaConf.load("vgg-seq2seq.yaml")
	config = omegaconf.OmegaConf.to_container(config, resolve=True)

	vocab = Vocab(config['vocab'])
	model = VietOCR(len(vocab),
	config['backbone'],
	config['cnn'],
	config['transformer'],
	config['seq_modeling'])
	model.load_state_dict(torch.load('train_old.pth', map_location=torch.device('cpu')))

	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/english.png', 'english.png')
	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/thai.jpg', 'thai.jpg')
	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/french.jpg', 'french.jpg')
	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/chinese.jpg', 'chinese.jpg')
	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/japanese.jpg', 'japanese.jpg')
	torch.hub.download_url_to_file('https://github.com/JaidedAI/EasyOCR/raw/master/examples/korean.png', 'korean.png')
	torch.hub.download_url_to_file('https://i.imgur.com/mwQFd7G.jpeg', 'Hindi.jpeg')

	def draw_boxes(image, bounds, color='yellow', width=2):
	draw = ImageDraw.Draw(image)
	for bound in bounds:
	p0, p1, p2, p3 = bound[0]
	draw.line([p0, p1, p2, p3, *p0], fill=color, width=width)
	return image

	def inference(filepath, lang):
	reader = easyocr.Reader(lang)
	bounds = reader.readtext(filepath)
	new_bounds=[]
	for (bbox, text, prob) in bounds:
	x1,y1 = bbox[0]
	x2,y2 = bbox[1]
	x3,y3 = bbox[2]
	x4,y4 = bbox[3]

	# crop the region of interest (ROI)
	img = Image.open(filepath)
	#img = img[y0:y1, x0:x1]
	width, height =img.size
	img = img.crop((max(0,x1-5), max(0,y1-5), min(x3+5,width), min(y3+5, height))) # crop the image
	img = process_input(img, config['dataset']['image_height'],
	config['dataset']['image_min_width'], config['dataset']['image_max_width'])
	out = translate(img, model)[0].tolist()
	out = vocab.decode(out)
	new_bounds.append((bbox,text, out, prob))
	im = PIL.Image.open(filepath)
	draw_boxes(im, bounds)
	im.save('result.jpg')
	return ['result.jpg', pd.DataFrame(new_bounds).iloc[: , 1:]]

	title = 'EasyOCR'
	description = 'Gradio demo for EasyOCR. EasyOCR demo supports 80+ languages.To use it, simply upload your image and choose a language from the dropdown menu, or click one of the examples to load them. Read more at the links below.'
	article = "<p style='text-align: center'><a href='https://www.jaided.ai/easyocr/'>Ready-to-use OCR with 80+ supported languages and all popular writing scripts including Latin, Chinese, Arabic, Devanagari, Cyrillic and etc.</a> \| <a href='https://github.com/JaidedAI/EasyOCR'>Github Repo</a></p>"
	examples = [['english.png',['en']],['thai.jpg',['th']],['french.jpg',['fr', 'en']],['chinese.jpg',['ch_sim', 'en']],['japanese.jpg',['ja', 'en']],['korean.png',['ko', 'en']],['Hindi.jpeg',['hi', 'en']]]
	css = ".output_image, .input_image {height: 40rem !important; width: 100% !important;}"
	choices = [
	"vi"
	]
	gr.Interface(
	inference,
	[gr.inputs.Image(type='filepath', label='Input'),gr.inputs.CheckboxGroup(choices, type="value", default=['vi'], label='language')],
	[gr.outputs.Image(type='pil', label='Output'), gr.outputs.Dataframe(type='pandas', headers=['easyOCR','vietOCR', 'confidence'])],
	title=title,
	description=description,
	article=article,
	examples=examples,
	css=css,
	enable_queue=True
	).launch(debug=True)