Spaces:

phyloforfun
/

VoucherVision

Running

App Files Files Community

VoucherVision / vouchervision /OCR_google_cloud_vision.py

phyloforfun

update api prices, openai dev day

e9f4039 9 months ago

raw

history blame

No virus

3.21 kB

	import os, io, sys, inspect
	from google.cloud import vision, storage
	from PIL import Image, ImageDraw

	currentdir = os.path.dirname(os.path.abspath(
	inspect.getfile(inspect.currentframe())))
	parentdir = os.path.dirname(currentdir)
	sys.path.append(parentdir)

	def draw_boxes(image, bounds, color):
	if bounds:
	draw = ImageDraw.Draw(image)
	width, height = image.size
	line_width = int((width + height) / 2 * 0.001) # This sets the line width as 0.5% of the average dimension

	for bound in bounds:
	draw.polygon(
	[
	bound["vertices"][0]["x"], bound["vertices"][0]["y"],
	bound["vertices"][1]["x"], bound["vertices"][1]["y"],
	bound["vertices"][2]["x"], bound["vertices"][2]["y"],
	bound["vertices"][3]["x"], bound["vertices"][3]["y"],
	],
	outline=color,
	width=line_width
	)
	return image

	def detect_text(path, client):
	# client = vision.ImageAnnotatorClient()
	with io.open(path, 'rb') as image_file:
	content = image_file.read()
	image = vision.Image(content=content)
	response = client.document_text_detection(image=image)
	texts = response.text_annotations

	if response.error.message:
	raise Exception(
	'{}\nFor more info on error messages, check: '
	'https://cloud.google.com/apis/design/errors'.format(
	response.error.message))

	# Extract bounding boxes
	bounds = []
	text_to_box_mapping = {}
	for text in texts[1:]: # Skip the first entry, as it represents the entire detected text
	# Convert BoundingPoly to dictionary
	bound_dict = {
	"vertices": [
	{"x": vertex.x, "y": vertex.y} for vertex in text.bounding_poly.vertices
	]
	}
	bounds.append(bound_dict)
	text_to_box_mapping[str(bound_dict)] = text.description

	if texts:
	# cleaned_text = texts[0].description.replace("\n", " ").replace("\t", " ").replace("\|", " ")
	cleaned_text = texts[0].description
	return cleaned_text, bounds, text_to_box_mapping
	else:
	return '', None, None

	def overlay_boxes_on_image(path, bounds,do_create_OCR_helper_image):
	if do_create_OCR_helper_image:
	image = Image.open(path)
	draw_boxes(image, bounds, "green")
	return image
	else:
	image = Image.open(path)
	return image





















	# ''' Google Vision'''
	# def detect_text(path):
	# """Detects text in the file located in the local filesystem."""
	# client = vision.ImageAnnotatorClient()

	# with io.open(path, 'rb') as image_file:
	# content = image_file.read()

	# image = vision.Image(content=content)

	# response = client.document_text_detection(image=image)
	# texts = response.text_annotations

	# if response.error.message:
	# raise Exception(
	# '{}\nFor more info on error messages, check: '
	# 'https://cloud.google.com/apis/design/errors'.format(
	# response.error.message))

	# return texts[0].description if texts else ''