Spaces:

hantech
/

EasyOCR-VietOCR

Runtime error

App Files Files Community

EasyOCR-VietOCR / vietocr /config /base.yml

hantech

Upload 38 files

bd22b5e 10 months ago

raw history blame contribute delete

No virus

1.81 kB

	# change to list chars of your dataset or use default vietnamese chars
	vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{\|}~ '

	# cpu, cuda, cuda:0
	device: cuda:0

	seq_modeling: transformer
	transformer:
	d_model: 256
	nhead: 8
	num_encoder_layers: 6
	num_decoder_layers: 6
	dim_feedforward: 2048
	max_seq_length: 1024
	pos_dropout: 0.1
	trans_dropout: 0.1

	optimizer:
	max_lr: 0.0003
	pct_start: 0.1

	trainer:
	batch_size: 32
	print_every: 200
	valid_every: 4000
	iters: 100000
	# where to save our model for prediction
	export: ./weights/transformerocr.pth
	checkpoint: ./checkpoint/transformerocr_checkpoint.pth
	log: ./train.log
	# null to disable compuate accuracy, or change to number of sample to enable validiation while training
	metrics: null

	dataset:
	# name of your dataset
	name: data
	# path to annotation and image
	data_root: ./img/
	train_annotation: annotation_train.txt
	valid_annotation: annotation_val_small.txt
	# resize image to 32 height, larger height will increase accuracy
	image_height: 32
	image_min_width: 32
	image_max_width: 512

	dataloader:
	num_workers: 3
	pin_memory: True

	aug:
	image_aug: true
	masked_language_model: true

	predictor:
	# disable or enable beamsearch while prediction, use beamsearch will be slower
	beamsearch: False

	quiet: False