|
['run_entity.py', '--do_train', '--do_eval', '--eval_test', '--learning_rate=1e-5', '--task_learning_rate=5e-4', '--train_batch_size=32', '--context_window', '0', '--task', 'ko', '--data_dir', 'sh_aug+klue', '--model', 'monologg/kobert', '--output_dir', 'sh_aug+klue_dir']
|
|
Namespace(bert_model_dir=None, bertadam=False, context_window=0, data_dir='sh_aug+klue', dev_data='sh_aug+klue\\dev.json', dev_pred_filename='ent_pred_dev.json', do_eval=True, do_train=True, eval_batch_size=32, eval_per_epoch=1, eval_test=True, learning_rate=1e-05, max_span_length=8, model='monologg/kobert', num_epoch=20, output_dir='sh_aug+klue_dir', print_loss_step=100, seed=0, task='ko', task_learning_rate=0.0005, test_data='sh_aug+klue\\test.json', test_pred_filename='ent_pred_test.json', train_batch_size=32, train_data='sh_aug+klue\\train.json', train_shuffle=False, use_albert=False, warmup_proportion=0.1)
|
|
Moving to CUDA...
|
|
|
|
|
|
Extracted 5574 samples from 5574 documents, with 16074 NER labels, 30.600 avg input length, 93 max length
|
|
Max Length: 93, max NER: 16
|
|
|
|
Extracted 22849 samples from 22849 documents, with 57142 NER labels, 28.977 avg input length, 111 max length
|
|
Max Length: 111, max NER: 23
|
|
Epoch=0, iter=99, loss=382.98039
|
|
Epoch=0, iter=199, loss=92.19124
|
|
Epoch=0, iter=299, loss=18.17063
|
|
Epoch=0, iter=399, loss=17.86108
|
|
Epoch=0, iter=499, loss=17.41379
|
|
Epoch=0, iter=599, loss=17.11055
|
|
Epoch=0, iter=699, loss=14.89083
|
|
Evaluating...
|
|
Accuracy: 0.986949
|
|
Cor: 0, Pred TOT: 0, Gold TOT: 16074
|
|
P: 0.00000, R: 0.00000, F1: 0.00000
|
|
Used time: 43.244831
|
|
Epoch=1, iter=84, loss=12.58960
|
|
Epoch=1, iter=184, loss=10.30858
|
|
Epoch=1, iter=284, loss=8.34273
|
|
Epoch=1, iter=384, loss=6.43022
|
|
Epoch=1, iter=484, loss=5.32054
|
|
Epoch=1, iter=584, loss=4.63362
|
|
Epoch=1, iter=684, loss=4.06674
|
|
Evaluating...
|
|
Accuracy: 0.994374
|
|
Cor: 11197, Pred TOT: 13860, Gold TOT: 16074
|
|
P: 0.80786, R: 0.69659, F1: 0.74811
|
|
Used time: 44.417693
|
|
!!! Best valid (epoch=1): 74.81
|
|
Saving model to sh_aug+klue_dir...
|
|
Epoch=2, iter=69, loss=3.59020
|
|
Epoch=2, iter=169, loss=3.38379
|
|
Epoch=2, iter=269, loss=3.14521
|
|
Epoch=2, iter=369, loss=2.92039
|
|
Epoch=2, iter=469, loss=2.76133
|
|
Epoch=2, iter=569, loss=2.57549
|
|
Epoch=2, iter=669, loss=2.55223
|
|
Evaluating...
|
|
Accuracy: 0.995934
|
|
Cor: 13018, Pred TOT: 15461, Gold TOT: 16074
|
|
P: 0.84199, R: 0.80988, F1: 0.82562
|
|
Used time: 40.365823
|
|
!!! Best valid (epoch=2): 82.56
|
|
Saving model to sh_aug+klue_dir...
|
|
Epoch=3, iter=54, loss=2.32016
|
|
Epoch=3, iter=154, loss=2.18908
|
|
Epoch=3, iter=254, loss=2.26152
|
|
Epoch=3, iter=354, loss=2.06879
|
|
Epoch=3, iter=454, loss=2.03323
|
|
Epoch=3, iter=554, loss=1.93354
|
|
Epoch=3, iter=654, loss=1.86967
|
|
Evaluating...
|
|
Accuracy: 0.996433
|
|
Cor: 13478, Pred TOT: 15757, Gold TOT: 16074
|
|
P: 0.85537, R: 0.83850, F1: 0.84685
|
|
Used time: 41.699907
|
|
!!! Best valid (epoch=3): 84.68
|
|
Saving model to sh_aug+klue_dir...
|
|
Epoch=4, iter=39, loss=1.74192
|
|
Epoch=4, iter=139, loss=1.66635
|
|
Epoch=4, iter=239, loss=1.71463
|
|
Epoch=4, iter=339, loss=1.59322
|
|
Epoch=4, iter=439, loss=1.62414
|
|
Epoch=4, iter=539, loss=1.52524
|
|
Epoch=4, iter=639, loss=1.55066
|
|
Evaluating...
|
|
Accuracy: 0.996524
|
|
Cor: 13755, Pred TOT: 16223, Gold TOT: 16074
|
|
P: 0.84787, R: 0.85573, F1: 0.85178
|
|
Used time: 40.325464
|
|
!!! Best valid (epoch=4): 85.18
|
|
Saving model to sh_aug+klue_dir...
|
|
Epoch=5, iter=24, loss=1.37847
|
|
Epoch=5, iter=124, loss=1.37336
|
|
Epoch=5, iter=224, loss=1.39704
|
|
Epoch=5, iter=324, loss=1.28449
|
|
Epoch=5, iter=424, loss=1.41600
|
|
Epoch=5, iter=524, loss=1.20445
|
|
Epoch=5, iter=624, loss=1.30613
|
|
Evaluating...
|
|
Accuracy: 0.996762
|
|
Cor: 13890, Pred TOT: 16181, Gold TOT: 16074
|
|
P: 0.85841, R: 0.86413, F1: 0.86126
|
|
Used time: 67.691342
|
|
!!! Best valid (epoch=5): 86.13
|
|
Saving model to sh_aug+klue_dir...
|
|
Epoch=6, iter=9, loss=1.21428
|
|
Epoch=6, iter=109, loss=1.10397
|
|
|