Spaces:
Runtime error
Runtime error
# change to list chars of your dataset or use default vietnamese chars | |
vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~ ' | |
# cpu, cuda, cuda:0 | |
device: cuda:0 | |
seq_modeling: transformer | |
transformer: | |
d_model: 256 | |
nhead: 8 | |
num_encoder_layers: 6 | |
num_decoder_layers: 6 | |
dim_feedforward: 2048 | |
max_seq_length: 1024 | |
pos_dropout: 0.1 | |
trans_dropout: 0.1 | |
optimizer: | |
max_lr: 0.0003 | |
pct_start: 0.1 | |
trainer: | |
batch_size: 32 | |
print_every: 200 | |
valid_every: 4000 | |
iters: 100000 | |
# where to save our model for prediction | |
export: ./weights/transformerocr.pth | |
checkpoint: ./checkpoint/transformerocr_checkpoint.pth | |
log: ./train.log | |
# null to disable compuate accuracy, or change to number of sample to enable validiation while training | |
metrics: null | |
dataset: | |
# name of your dataset | |
name: data | |
# path to annotation and image | |
data_root: ./img/ | |
train_annotation: annotation_train.txt | |
valid_annotation: annotation_val_small.txt | |
# resize image to 32 height, larger height will increase accuracy | |
image_height: 32 | |
image_min_width: 32 | |
image_max_width: 512 | |
dataloader: | |
num_workers: 3 | |
pin_memory: True | |
aug: | |
image_aug: true | |
masked_language_model: true | |
predictor: | |
# disable or enable beamsearch while prediction, use beamsearch will be slower | |
beamsearch: False | |
quiet: False | |