|
project: vietocr_new |
|
name: Train |
|
|
|
device: cuda:0 |
|
|
|
|
|
vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~ ' |
|
|
|
seq_modeling: seq2seq |
|
transformer: |
|
encoder_hidden: 256 |
|
decoder_hidden: 256 |
|
img_channel: 256 |
|
decoder_embedded: 256 |
|
dropout: 0.1 |
|
|
|
optimizer: |
|
max_lr: 0.001 |
|
pct_start: 0.1 |
|
|
|
trainer: |
|
batch_size: 128 |
|
print_every: 100 |
|
valid_every: 500 |
|
test_every: 500 |
|
iters: 10000 |
|
|
|
export: weights/train_model.pth |
|
checkpoint: ./checkpoint/checkpoint_model.pth |
|
log: ./train.log |
|
|
|
metrics: 49228 |
|
test_metrics: 28918 |
|
pretrained: false |
|
|
|
dataset: |
|
|
|
data_root: /mnt/disk3/CGGANv2 |
|
|
|
train_annotation: datasets/labels/train.txt |
|
valid_annotation: datasets/labels/valid.txt |
|
test_annotation: datasets/labels/test.txt |
|
|
|
train_lmdb: datasets/lmdb/train |
|
valid_lmdb: datasets/lmdb/valid |
|
test_lmdb: datasets/lmdb/test |
|
|
|
|
|
image_height: 32 |
|
image_min_width: 32 |
|
image_max_width: 512 |
|
|
|
dataloader: |
|
num_workers: 12 |
|
pin_memory: true |
|
|
|
aug: |
|
image_aug: false |
|
masked_language_model: false |
|
|
|
predictor: |
|
|
|
beamsearch: false |
|
|
|
quiet: false |
|
|
|
|
|
pretrain: https://vocr.vn/data/vietocr/vgg_seq2seq.pth |
|
|
|
|
|
weights: https://vocr.vn/data/vietocr/vgg_seq2seq.pth |
|
|
|
backbone: vgg19_bn |
|
cnn: |
|
|
|
ss: |
|
- [2, 2] |
|
- [2, 2] |
|
- [2, 1] |
|
- [2, 1] |
|
- [1, 1] |
|
|
|
ks: |
|
- [2, 2] |
|
- [2, 2] |
|
- [2, 1] |
|
- [2, 1] |
|
- [1, 1] |
|
|
|
hidden: 256 |
|
|