File size: 1,648 Bytes
bd22b5e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
# Augmentation switches; both are enabled in this configuration.
aug:
  image_aug: true
  masked_language_model: true

# Identifier of the CNN feature extractor.
# NOTE(review): presumably VGG-19 with batch normalisation, going by the
# name - confirm against the code that resolves this identifier.
backbone: 'vgg19_bn'
# Settings for the CNN part of the model.
cnn:
  # Same value as `transformer.d_model` (256).
  hidden: 256
  pretrained: true
  # Five [a, b] integer pairs, one list entry per pair.
  # NOTE(review): `ks` presumably holds per-stage kernel sizes - confirm
  # against the backbone implementation.
  ks:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]
  # Five pairs carrying exactly the same values as `ks`.
  # NOTE(review): `ss` presumably holds per-stage strides - confirm.
  ss:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]
# Data-loading options.
# NOTE(review): presumably forwarded as keyword arguments to
# torch.utils.data.DataLoader - confirm against the trainer code.
dataloader:
  # 0 = no worker processes requested.
  num_workers: 0
  # Disabled because this file selects `device: mps`. PyTorch only pins host
  # memory for CUDA transfers; on MPS the flag has no effect and merely emits
  # a "not supported on MPS" warning. Re-enable when switching to a CUDA
  # device.
  pin_memory: false
# Dataset location, annotation files and image sizing.
dataset:
  name: 'hw'

  # Absolute path inside one user's Desktop directory.
  # NOTE(review): this will not resolve on another machine - adjust before
  # running elsewhere.
  data_root: '/Users/bmd1905/Desktop/dataset/data_line'

  # Annotation file names. Note that validation points at the file named
  # "test_line_annotation.txt".
  # NOTE(review): presumably resolved relative to `data_root` - confirm.
  train_annotation: 'train_line_annotation.txt'
  valid_annotation: 'test_line_annotation.txt'

  # Image sizing: fixed height with a lower and an upper bound on width.
  # NOTE(review): units are presumably pixels - confirm.
  image_height: 32
  image_min_width: 32
  image_max_width: 512
# Compute device identifier.
# NOTE(review): "mps" is presumably the PyTorch Apple-GPU backend name -
# confirm how the consumer interprets this string.
device: 'mps'

# Learning-rate settings.
# NOTE(review): `max_lr` / `pct_start` look like one-cycle scheduler
# arguments - confirm against the trainer code.
optimizer:
  max_lr: 0.0003
  pct_start: 0.1

predictor:
  # Beam search is switched off.
  beamsearch: false

# Checkpoint URL; identical to the `weights` URL at the end of this file.
pretrain: 'https://vocr.vn/data/vietocr/vgg_transformer.pth'

quiet: false

# Selects the sequence model; the matching hyper-parameters live under the
# top-level `transformer` key.
seq_modeling: 'transformer'
# Training-loop settings. The values are small (batch of 1, 100 iterations).
trainer:
  batch_size: 1
  iters: 100

  # Reporting / validation cadence.
  # NOTE(review): presumably counted in iterations - confirm.
  print_every: 1
  valid_every: 10
  metrics: 100

  # Output locations, all relative to the working directory.
  # NOTE(review): the export file name says "seq2seq" while `seq_modeling`
  # is set to "transformer" - naming only, but confirm it is intended.
  checkpoint: './checkpoint/transformerocr_checkpoint.pth'
  export: './weights/seq2seq_test_local.pth'
  log: './train.log'
# Hyper-parameters for the transformer sequence model.
transformer:
  # Model width; same value as `cnn.hidden` (256). With 8 heads this gives
  # 256 / 8 = 32 per head.
  d_model: 256
  nhead: 8
  dim_feedforward: 2048

  # Encoder and decoder depth are equal.
  num_encoder_layers: 6
  num_decoder_layers: 6

  max_seq_length: 1024

  # Dropout rates.
  # NOTE(review): `pos_dropout` presumably applies to the positional
  # encoding and `trans_dropout` to the transformer layers - confirm.
  pos_dropout: 0.1
  trans_dropout: 0.1
# Character set: Latin letters with every Vietnamese diacritic/tone form in
# lower and upper case, the digits 0-9, ASCII punctuation, and a trailing
# space. Kept single-quoted so the backslash stays literal; the doubled ''
# encodes one apostrophe. This file must be stored and read as UTF-8 -
# decoding it with a single-byte code page corrupts every accented letter.
# NOTE(review): the set presumably has to match the one the pretrained
# checkpoint was built with - confirm before adding or removing characters.
vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~ '
# Checkpoint URL; the same address as the `pretrain` key in this file.
# NOTE(review): presumably the weights loaded for prediction - confirm.
weights: 'https://vocr.vn/data/vietocr/vgg_transformer.pth'