batch_size: 32 | |
clip_grad: 5 | |
data_strategy: shuffle_batches | |
dev_datasets: | |
pos_ours: | |
dir: data | |
mode: BMES | |
name: pos_ours | |
repeat_times: 1 | |
samples_num: 1000 | |
split: test | |
seg_ours: | |
dir: data | |
mode: BMES | |
name: seg_ours | |
repeat_times: 1 | |
samples_num: 1000 | |
split: test | |
epoch_num: 1 | |
head_config: | |
dropout: 0.1 | |
layers_num: 1 | |
use_crf: false | |
heads: | |
- seg | |
- pos | |
learning_rate: 1.0e-05 | |
part_data: false | |
pos_labels: | |
- w | |
- e | |
- g | |
- o | |
- mq | |
- f | |
- h | |
- a | |
- j | |
- id | |
- k | |
- v | |
- c | |
- u | |
- nz | |
- r | |
- q | |
- s | |
- x | |
- m | |
- np | |
- p | |
- d | |
- ns | |
- t | |
- n | |
- ni | |
pretrained_bert_model: /data03/private/chengzhili/pretrain/output/2023-06-09_21-23-00/save | |
saved_path: output/pos | |
seg_labels: | |
- B | |
- M | |
- E | |
- S | |
train_datasets: | |
pos_ours: | |
dir: data | |
mode: BMES | |
name: pos_ours | |
repeat_times: 1 | |
samples_num: 0 | |
split: train | |
seg_ours: | |
dir: data | |
mode: BMES | |
name: seg_ours | |
repeat_times: 1 | |
samples_num: 0 | |
split: train | |
warmup_steps: 0.1 | |
weight_decay: 0.01 | |