# Run identification.
# NOTE(review): these look like experiment-tracker project / run names;
# confirm against the code that reads them.
project: vietocr_new
name: Train

# Device string handed to the training code.
# NOTE(review): presumably selects GPU index 0 - confirm.
device: cuda:0

# Character set: Vietnamese letters with diacritics in both cases, the digits
# 0-9, ASCII punctuation and a trailing space. Kept single-quoted on purpose:
# the backslash stays literal and '' is the escaped single quote.
vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~ '
# Sequence-model selection and its hyper-parameters. The parameter section is
# keyed `transformer` even though `seq_modeling` is set to `seq2seq`.
# NOTE(review): the five keys below were flush-left in the reviewed text, which
# leaves `transformer` null; they are nested here on the assumption that they
# are its children - confirm against the config loader.
seq_modeling: seq2seq
transformer:
  encoder_hidden: 256
  decoder_hidden: 256
  img_channel: 256
  decoder_embedded: 256
  dropout: 0.1
# Optimizer / learning-rate settings.
# NOTE(review): the key names suggest a one-cycle style schedule (peak learning
# rate and warm-up fraction) - confirm against the trainer code. Both keys were
# flush-left in the reviewed text and are nested here as children of
# `optimizer`.
optimizer:
  max_lr: 0.001
  pct_start: 0.1
# Training-loop settings.
# NOTE(review): every key below was flush-left in the reviewed text, which
# leaves `trainer` null. They are nested here based on their grouping; in
# particular confirm that `metrics`, `test_metrics` and `pretrained` belong to
# `trainer` rather than the top level.
trainer:
  batch_size: 128
  # NOTE(review): the intervals and `iters` are presumably counted in training
  # iterations - confirm.
  print_every: 100
  valid_every: 500
  test_every: 500
  iters: 10000

  # Output paths: exported weights, checkpoint file and training log.
  export: weights/train_model.pth
  checkpoint: ./checkpoint/checkpoint_model.pth
  log: ./train.log

  # NOTE(review): presumably the number of validation / test samples used when
  # computing metrics - confirm.
  metrics: 49228
  test_metrics: 28918
  pretrained: false
# Dataset locations and image geometry.
# NOTE(review): the keys below were flush-left in the reviewed text, which
# leaves `dataset` null; nested here as its children - confirm.
dataset:
  # Absolute, machine-specific root directory.
  data_root: /mnt/disk3/CGGANv2

  # Label files, one per split.
  # NOTE(review): relative paths - presumably resolved against `data_root`.
  train_annotation: datasets/labels/train.txt
  valid_annotation: datasets/labels/valid.txt
  test_annotation: datasets/labels/test.txt

  # LMDB locations, one per split (relative paths as well).
  train_lmdb: datasets/lmdb/train
  valid_lmdb: datasets/lmdb/valid
  test_lmdb: datasets/lmdb/test

  # Image height and the minimum / maximum width (presumably in pixels).
  image_height: 32
  image_min_width: 32
  image_max_width: 512
# Data-loading settings.
# NOTE(review): the key names match PyTorch DataLoader arguments - confirm they
# are forwarded unchanged. Both keys were flush-left in the reviewed text and
# are nested here as children of `dataloader`.
dataloader:
  num_workers: 12
  pin_memory: true
# Augmentation switches; both are disabled in this configuration.
# NOTE(review): both keys were flush-left in the reviewed text, which leaves
# `aug` null; nested here as its children - confirm.
aug:
  image_aug: false
  masked_language_model: false
# Prediction-time settings; beam search is turned off.
# NOTE(review): `beamsearch` was flush-left in the reviewed text, which leaves
# `predictor` null; nested here as its child - confirm.
predictor:
  beamsearch: false
# Top-level flag, disabled here.
# NOTE(review): presumably suppresses console output when true - confirm.
quiet: false

# Model weight sources; both entries currently point at the same URL.
# NOTE(review): presumably `pretrain` is read when training starts and
# `weights` when predicting - confirm against the loader.
pretrain: https://vocr.vn/data/vietocr/vgg_seq2seq.pth
weights: https://vocr.vn/data/vietocr/vgg_seq2seq.pth
# CNN feature extractor selection and its parameters.
# NOTE(review): `ss`, `ks` and `hidden` were flush-left in the reviewed text,
# which leaves `cnn` null; nested here as its children - confirm.
backbone: vgg19_bn
cnn:
  # Five [a, b] pairs.
  # NOTE(review): presumably per-stage pooling strides - confirm.
  ss:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]

  # Five [a, b] pairs, identical to `ss`.
  # NOTE(review): presumably per-stage pooling kernel sizes - confirm.
  ks:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]

  # NOTE(review): presumably the channel count of the output feature map.
  hidden: 256