Spaces:

sageco214
/

Axon_OCR

Sleeping

Axon_OCR / ocr_functions.py

Sage

added verifier

ca92e41 about 2 years ago

2.96 kB

	from azure.core.credentials import AzureKeyCredential
	from azure.ai.formrecognizer import DocumentAnalysisClient
	from io import BytesIO
	from helpers import format_polygon, Logger
	import logging
	import os
	import sys

	# Route log records of level INFO and above to app.log, formatted as
	# "<timestamp> - <level> - <message>".
	logging.basicConfig(filename='app.log', level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
	# Replace the process-wide stdout with the project's Logger built on "output.log".
	# NOTE(review): presumably this captures print() output into that file — confirm against helpers.Logger.
	sys.stdout = Logger("output.log")

	# Azure endpoint and key are read from the environment when the module is imported;
	# a missing variable raises KeyError at that point. Both values are passed to
	# DocumentAnalysisClient by the functions below.
	endpoint = os.environ['AZURE_API_ENDPOINT']
	key = os.environ['AZURE_API_KEY']

	def detect_document(content):
	    """Analyse a file with the "prebuilt-document" model and build text reports.

	    Each report is written to the log and printed as soon as it is built.

	    Args:
	        content: Object whose ``name`` attribute is the path of the file to
	            analyse (presumably an uploaded/temporary file wrapper —
	            confirm against the caller).

	    Returns:
	        A 5-tuple ``(text, key_value_report, line_report, table_report, stem)``:
	        the ``content`` of the analysis result, a report of key-value pairs
	        that have both a key and a value, a per-page report of lines with
	        their bounding polygons, a report of tables and their cells, and
	        the file name with any directory part (backslash or forward slash
	        separated) and everything from the first "." onward removed.
	    """
	    client = DocumentAnalysisClient(
	        endpoint=endpoint, credential=AzureKeyCredential(key)
	    )

	    with open(content.name, "rb") as handle:
	        poller = client.begin_analyze_document(
	            "prebuilt-document", document=handle
	        )
	    analysis = poller.result()

	    full_text = analysis.content
	    logging.info(full_text)
	    print(full_text)

	    # Only pairs that carry both a key and a value are reported.
	    pairs_report = "----Key-value pairs found in document----\n" + "".join(
	        "Key '{}' with Value '{}' \n".format(pair.key.content, pair.value.content)
	        for pair in analysis.key_value_pairs
	        if pair.key and pair.value
	    )
	    logging.info(pairs_report)
	    print(pairs_report)

	    # Line numbering restarts at 0 on every page.
	    lines_report = "----Lines found in document----\n" + "".join(
	        "...Line # {} text '{}' within bounding polygon '{}' \n".format(
	            index, entry.content, format_polygon(entry.polygon)
	        )
	        for page in analysis.pages
	        for index, entry in enumerate(page.lines)
	    )
	    logging.info(lines_report)
	    print(lines_report)

	    # One summary row per table, followed by one row per cell of that table.
	    table_parts = ["----Tables found in document----\n"]
	    for number, table in enumerate(analysis.tables):
	        table_parts.append(
	            "Table # {} has {} rows and {} columns\n".format(
	                number, table.row_count, table.column_count
	            )
	        )
	        table_parts.extend(
	            "...Cell[{}][{}] has content '{}'\n".format(
	                cell.row_index, cell.column_index, cell.content
	            )
	            for cell in table.cells
	        )
	    tables_report = "".join(table_parts)
	    logging.info(tables_report)
	    print(tables_report)

	    # Keep what follows the last path separator of either kind, then cut at
	    # the first dot.
	    stem = content.name.replace('\\', "/").rsplit("/", 1)[-1].partition('.')[0]
	    return (full_text, pairs_report, lines_report, tables_report, stem)

	def detect_image(content):
	    """Analyse an in-memory image with the "prebuilt-read" model and return its text.

	    Args:
	        content: Image object providing ``save(stream, format=...)``
	            (presumably a PIL image — confirm against the caller).

	    Returns:
	        The ``content`` attribute of the analysis result. The same value is
	        also written to the log and printed.
	    """
	    client = DocumentAnalysisClient(
	        endpoint=endpoint, credential=AzureKeyCredential(key)
	    )

	    # Serialise the image as PNG into memory, then rewind so the stream is
	    # read from its first byte.
	    png_buffer = BytesIO()
	    content.save(png_buffer, format='PNG')
	    png_buffer.seek(0)

	    poller = client.begin_analyze_document("prebuilt-read", document=png_buffer)
	    recognised_text = poller.result().content
	    logging.info(recognised_text)
	    print(recognised_text)
	    return recognised_text