# EasyOCR-VietOCR / vietocr/vietocr/tool/create_dataset.py
# (uploaded by hantech, "Upload 38 files", commit bd22b5e)
import sys
import os
import lmdb # install lmdb by "pip install lmdb"
import cv2
import numpy as np
from tqdm import tqdm
def checkImageIsValid(imageBin):
    """Decode an image byte string and report whether it is usable.

    Args:
        imageBin: raw image file bytes as read from disk.

    Returns:
        (isvalid, imgH, imgW): ``isvalid`` is False when the bytes cannot
        be decoded or decode to an empty image; ``imgH``/``imgW`` are the
        decoded height/width, or None on failure.
    """
    isvalid = True
    imgH = None
    imgW = None
    # np.frombuffer replaces the deprecated np.fromstring (removed for
    # binary input in recent NumPy releases) and avoids an extra copy.
    imageBuf = np.frombuffer(imageBin, dtype=np.uint8)
    try:
        img = cv2.imdecode(imageBuf, cv2.IMREAD_GRAYSCALE)
        # cv2.imdecode does not raise on bad data -- it returns None.
        if img is None:
            return False, None, None
        imgH, imgW = img.shape[0], img.shape[1]
        if imgH * imgW == 0:
            isvalid = False
    except Exception:
        # Defensive: treat any decode-time failure as an invalid image.
        isvalid = False
    return isvalid, imgH, imgW
def writeCache(env, cache):
    """Flush *cache* into the LMDB environment in one write transaction.

    Keys are str and are UTF-8 encoded before storage; values are written
    as-is (they are expected to already be bytes).
    """
    with env.begin(write=True) as txn:
        for key in cache:
            txn.put(key.encode(), cache[key])
def createDataset(outputPath, root_dir, annotation_path):
    """
    Create an LMDB dataset for CRNN/VietOCR training.

    ARGS:
        outputPath      : LMDB output path
        root_dir        : directory that the annotation file and the image
                          paths it lists are relative to
        annotation_path : tab-separated annotation file (relative to
                          root_dir), one "image_path<TAB>label" per line
    """
    annotation_path = os.path.join(root_dir, annotation_path)
    with open(annotation_path, 'r', encoding='utf-8') as ann_file:
        lines = ann_file.readlines()

    annotations = [l.strip().split('\t') for l in lines]

    nSamples = len(annotations)
    env = lmdb.open(outputPath, map_size=1099511627776)
    cache = {}
    cnt = 0
    error = 0

    pbar = tqdm(range(nSamples), ncols=100, desc='Create {}'.format(outputPath))
    for i in pbar:
        # Skip malformed lines instead of falling through and reusing a
        # stale imageFile/label from a previous iteration (or hitting a
        # NameError on the very first one).
        if len(annotations[i]) < 2:
            print("Error: Not enough values to unpack")
            error += 1
            continue
        # Take only the first two fields so a label that itself contains a
        # tab does not raise "too many values to unpack".
        imageFile, label = annotations[i][0], annotations[i][1]

        imagePath = os.path.join(root_dir, imageFile)
        if not os.path.exists(imagePath):
            error += 1
            continue

        with open(imagePath, 'rb') as f:
            imageBin = f.read()
        isvalid, imgH, imgW = checkImageIsValid(imageBin)
        if not isvalid:
            error += 1
            continue

        imageKey = 'image-%09d' % cnt
        labelKey = 'label-%09d' % cnt
        pathKey = 'path-%09d' % cnt
        dimKey = 'dim-%09d' % cnt

        cache[imageKey] = imageBin
        cache[labelKey] = label.encode()
        cache[pathKey] = imageFile.encode()
        cache[dimKey] = np.array([imgH, imgW], dtype=np.int32).tobytes()
        cnt += 1

        # Flush to LMDB in batches to bound memory use.
        if cnt % 1000 == 0:
            writeCache(env, cache)
            cache = {}

    # cnt starts at 0 and is incremented once per stored sample, so it
    # already equals the sample count; the original "cnt - 1" undercounted
    # by one (that idiom came from upstream CRNN code where cnt began at 1).
    nSamples = cnt
    cache['num-samples'] = str(nSamples).encode()
    writeCache(env, cache)

    if error > 0:
        print('Remove {} invalid images'.format(error))
    print('Created dataset with %d samples' % nSamples)
    sys.stdout.flush()