ScreenCoder

Paused

App Files Files Community

ScreenCoder / screencoder /UIED /detect_text /ocr.py

Jimmyzheng-10

Add app.py and the screencoder repo

a383d0e 4 months ago

raw

history blame

2.17 kB

	import cv2
	import os
	import requests
	import json
	from base64 import b64encode
	import time


	def Google_OCR_makeImageData(imgpath):
	    """Build the JSON request body for a Google Vision ``images:annotate`` call.

	    The file at *imgpath* is read as raw bytes and embedded base64-encoded,
	    and a single ``DOCUMENT_TEXT_DETECTION`` feature is requested for it.

	    Args:
	        imgpath: Path of the image file to send for OCR.

	    Returns:
	        The encoded JSON payload (``bytes``) to use as the POST body.

	    Raises:
	        OSError: If the image file cannot be opened or read.
	    """
	    with open(imgpath, 'rb') as f:
	        ctxt = b64encode(f.read()).decode()
	    img_req = {
	        'image': {
	            'content': ctxt
	        },
	        'features': [{
	            # Alternative feature type: 'TEXT_DETECTION'.
	            'type': 'DOCUMENT_TEXT_DETECTION',
	            'maxResults': 1
	        }]
	    }
	    # The API schema defines "requests" as an array of per-image requests,
	    # so the single request is wrapped in a list rather than sent bare.
	    return json.dumps({"requests": [img_req]}).encode()


	def ocr_detection_google(imgpath, api_key=None, timeout=60):
	    """Run Google Cloud Vision OCR on an image and return the detected text.

	    Args:
	        imgpath: Path of the image file to analyse.
	        api_key: Google Cloud Vision API key. When omitted, the
	            ``GOOGLE_VISION_API_KEY`` environment variable is used, and the
	            key embedded in this function only as a last resort.
	        timeout: Seconds to wait for the HTTP request, so that a stalled
	            connection cannot block the caller indefinitely.

	    Returns:
	        ``None`` when the reply contains no text annotations for the image;
	        otherwise the list of ``textAnnotations`` entries without the first
	        one.

	    Raises:
	        Exception: If the API reports an error (for the whole request or for
	            the image itself) or the reply has no ``responses`` field.
	    """
	    url = 'https://vision.googleapis.com/v1/images:annotate'

	    # Resolve the key: explicit argument, then environment, then the key
	    # shipped with the source.
	    using_embedded_key = False
	    if api_key is None:
	        api_key = os.environ.get('GOOGLE_VISION_API_KEY')
	    if not api_key:
	        # NOTE(review): credentials should not live in source control; this
	        # fallback is kept only so existing callers keep working.
	        api_key = 'AIzaSyDUc4iOUASJQYkVwSomIArTKhE2C6bHK8U'  # * Replace with your own Key *
	        using_embedded_key = True

	    imgdata = Google_OCR_makeImageData(imgpath)
	    response = requests.post(url,
	                             data=imgdata,
	                             params={'key': api_key},
	                             # The header name takes a hyphen; 'Content_Type'
	                             # is a different header and does not declare the
	                             # body type.
	                             headers={'Content-Type': 'application/json'},
	                             timeout=timeout)
	    if using_embedded_key:
	        print("* Please replace the Google OCR key at detect_text/ocr.py line 28 with your own (apply in https://cloud.google.com/vision) *")

	    response_json = response.json()
	    if 'error' in response_json:
	        error_msg = response_json['error']
	        if 'BILLING_DISABLED' in str(error_msg):
	            raise Exception("Google Vision API requires billing to be enabled. Please:\n"
	                            "1. Visit https://console.developers.google.com/billing/enable?project=718250946490\n"
	                            "2. Enable billing for your project\n"
	                            "3. Wait a few minutes for changes to propagate\n"
	                            "4. Or use PaddleOCR instead by setting method='paddle'")
	        raise Exception(f"Google Vision API error: {error_msg}")

	    if 'responses' not in response_json:
	        raise Exception(response_json)

	    responses = response_json['responses']
	    if not responses:
	        # No per-image result at all: treat like "no text".
	        return None

	    result = responses[0]
	    if 'error' in result:
	        # A failure for this image is reported inside the response entry
	        # rather than at the top level of the reply.
	        raise Exception(f"Google Vision API error: {result['error']}")

	    annotations = result.get('textAnnotations')
	    if annotations is None:
	        # No Text (covers the empty ``{}`` entry and entries that carry
	        # other fields but no text annotations).
	        return None
	    # Skip the first annotation (per the Vision API docs it spans the whole
	    # detected text); the remaining entries are the individual pieces.
	    return annotations[1:]