m2_joint_label_ref_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
e4211ec
{
"best_metric": 0.9680589680589681,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/211-camembert-ner-joint-labelling-io/checkpoint-600",
"epoch": 1.574803149606299,
"global_step": 600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.9012229539040452,
"number": 519,
"precision": 0.8805147058823529,
"recall": 0.9229287090558767
},
"eval_ACT_L1": {
"f1": 0.9149952244508118,
"number": 503,
"precision": 0.8805147058823529,
"recall": 0.952286282306163
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9911764705882352,
"number": 678,
"precision": 0.9882697947214076,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9370179948586118,
"number": 761,
"precision": 0.9169811320754717,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9478324761204997,
"number": 676,
"precision": 0.9416058394160584,
"recall": 0.9541420118343196
},
"eval_SPAT": {
"f1": 0.9201680672268908,
"number": 694,
"precision": 0.8950953678474114,
"recall": 0.946685878962536
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.939051638530288,
"eval_accuracy-all": 0.9571747765640516,
"eval_accuracy-das": 0.9535749751737835,
"eval_accuracy-l1": 0.945506454816286,
"eval_accuracy-l2": 0.9688430983118173,
"eval_f1": 0.9351139497750036,
"eval_f1-all": 0.9303140978816655,
"eval_f1-das": 0.9332096474953618,
"eval_f1-l1": 0.920889348500517,
"eval_f1-l2": 0.9425596237823312,
"eval_loss": 0.34274226427078247,
"eval_precision": 0.9374272409778812,
"eval_precision-all": 0.9255813953488372,
"eval_precision-das": 0.9294161123429416,
"eval_precision-l1": 0.9072847682119205,
"eval_precision-l2": 0.949898442789438,
"eval_recall": 0.932812047494932,
"eval_recall-all": 0.9350954478707783,
"eval_recall-das": 0.9370342771982116,
"eval_recall-l1": 0.9349081364829396,
"eval_recall-l2": 0.9353333333333333,
"eval_runtime": 5.3519,
"eval_samples_per_second": 126.31,
"eval_steps_per_second": 8.034,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.9210526315789475,
"number": 519,
"precision": 0.8990825688073395,
"recall": 0.9441233140655106
},
"eval_ACT_L1": {
"f1": 0.9351145038167938,
"number": 503,
"precision": 0.8990825688073395,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9911764705882352,
"number": 678,
"precision": 0.9882697947214076,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9466840052015604,
"number": 761,
"precision": 0.9369369369369369,
"recall": 0.9566360052562418
},
"eval_PER": {
"f1": 0.9691176470588235,
"number": 676,
"precision": 0.9634502923976608,
"recall": 0.9748520710059172
},
"eval_SPAT": {
"f1": 0.9319971367215462,
"number": 694,
"precision": 0.9260312944523471,
"recall": 0.9380403458213257
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.5454545454545454,
"number": 33,
"precision": 0.5454545454545454,
"recall": 0.5454545454545454
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9461271102284012,
"eval_accuracy-all": 0.9623882820258193,
"eval_accuracy-das": 0.9620158887785502,
"eval_accuracy-l1": 0.952085402184707,
"eval_accuracy-l2": 0.9726911618669315,
"eval_f1": 0.9448275862068966,
"eval_f1-all": 0.9415204678362573,
"eval_f1-das": 0.9487511563367254,
"eval_f1-l1": 0.9355509355509356,
"eval_f1-l2": 0.9491978609625668,
"eval_loss": 0.25068724155426025,
"eval_precision": 0.9375534644995723,
"eval_precision-all": 0.9374090247452693,
"eval_precision-das": 0.9423006247703051,
"eval_precision-l1": 0.9264024704065877,
"eval_precision-l2": 0.9517426273458445,
"eval_recall": 0.952215464813206,
"eval_recall-all": 0.9456681350954479,
"eval_recall-das": 0.9552906110283159,
"eval_recall-l1": 0.9448818897637795,
"eval_recall-l2": 0.9466666666666667,
"eval_runtime": 5.4759,
"eval_samples_per_second": 123.45,
"eval_steps_per_second": 7.853,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9352380952380951,
"number": 519,
"precision": 0.9246704331450094,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9497098646034816,
"number": 503,
"precision": 0.9246704331450094,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9926470588235294,
"number": 678,
"precision": 0.9897360703812317,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.28571428571428575,
"number": 30,
"precision": 0.25,
"recall": 0.3333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9646133682830931,
"number": 761,
"precision": 0.9620915032679739,
"recall": 0.9671484888304862
},
"eval_PER": {
"f1": 0.980825958702065,
"number": 676,
"precision": 0.9779411764705882,
"recall": 0.9837278106508875
},
"eval_SPAT": {
"f1": 0.9634931997136722,
"number": 694,
"precision": 0.957325746799431,
"recall": 0.9697406340057637
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.927536231884058,
"number": 33,
"precision": 0.8888888888888888,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.961519364448858,
"eval_accuracy-all": 0.972877358490566,
"eval_accuracy-das": 0.9733118172790467,
"eval_accuracy-l1": 0.9668570009930486,
"eval_accuracy-l2": 0.9788977159880834,
"eval_f1": 0.9649198787353834,
"eval_f1-all": 0.9593686056708564,
"eval_f1-das": 0.9698884758364312,
"eval_f1-l1": 0.9530966571650686,
"eval_f1-l2": 0.9674824002681863,
"eval_loss": 0.16728797554969788,
"eval_precision": 0.9620034542314335,
"eval_precision-all": 0.9549025312772766,
"eval_precision-das": 0.9677299703264095,
"eval_precision-l1": 0.9411463664278403,
"eval_precision-l2": 0.9730276466621712,
"eval_recall": 0.9678540399652477,
"eval_recall-all": 0.9638766519823788,
"eval_recall-das": 0.9720566318926974,
"eval_recall-l1": 0.9653543307086614,
"eval_recall-l2": 0.962,
"eval_runtime": 5.9254,
"eval_samples_per_second": 114.086,
"eval_steps_per_second": 7.257,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9230769230769231,
"number": 519,
"precision": 0.9101123595505618,
"recall": 0.9364161849710982
},
"eval_ACT_L1": {
"f1": 0.9373191899710704,
"number": 503,
"precision": 0.9101123595505618,
"recall": 0.9662027833001988
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.17142857142857143,
"number": 30,
"precision": 0.15,
"recall": 0.2
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9620418848167539,
"number": 761,
"precision": 0.9582790091264668,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9779086892488954,
"number": 676,
"precision": 0.9736070381231672,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9557142857142857,
"number": 694,
"precision": 0.9475920679886686,
"recall": 0.9639769452449568
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8732394366197183,
"number": 33,
"precision": 0.8157894736842105,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9606504468718967,
"eval_accuracy-all": 0.9717601787487586,
"eval_accuracy-das": 0.9735600794438928,
"eval_accuracy-l1": 0.9641261171797418,
"eval_accuracy-l2": 0.9793942403177756,
"eval_f1": 0.9591571655361523,
"eval_f1-all": 0.9531592003502116,
"eval_f1-das": 0.9647364513734225,
"eval_f1-l1": 0.9438841479182829,
"eval_f1-l2": 0.9651707970529135,
"eval_loss": 0.15428000688552856,
"eval_precision": 0.9559838895281934,
"eval_precision-all": 0.947215777262181,
"eval_precision-das": 0.9611686390532544,
"eval_precision-l1": 0.9301732925586137,
"eval_precision-l2": 0.9697173620457604,
"eval_recall": 0.9623515783376774,
"eval_recall-all": 0.9591776798825257,
"eval_recall-das": 0.9683308494783904,
"eval_recall-l1": 0.958005249343832,
"eval_recall-l2": 0.9606666666666667,
"eval_runtime": 6.235,
"eval_samples_per_second": 108.42,
"eval_steps_per_second": 6.897,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.3421,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9407265774378585,
"number": 519,
"precision": 0.9335863377609108,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9590643274853801,
"number": 503,
"precision": 0.9407265774378585,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.3555555555555555,
"number": 30,
"precision": 0.5333333333333333,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9546044098573281,
"number": 761,
"precision": 0.942381562099872,
"recall": 0.9671484888304862
},
"eval_PER": {
"f1": 0.9786921381337252,
"number": 676,
"precision": 0.9722627737226277,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9524485450674237,
"number": 694,
"precision": 0.9384615384615385,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8888888888888888,
"number": 33,
"precision": 0.8205128205128205,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9608987090367428,
"eval_accuracy-all": 0.9716981132075472,
"eval_accuracy-das": 0.9724428997020854,
"eval_accuracy-l1": 0.9652432969215492,
"eval_accuracy-l2": 0.9781529294935452,
"eval_f1": 0.9627705627705628,
"eval_f1-all": 0.9579439252336449,
"eval_f1-das": 0.9659259259259259,
"eval_f1-l1": 0.9560239396304969,
"eval_f1-l2": 0.9603993344425957,
"eval_loss": 0.16323766112327576,
"eval_precision": 0.9594477998274374,
"eval_precision-all": 0.9526575660760964,
"eval_precision-das": 0.9602356406480118,
"eval_precision-l1": 0.9478844169246646,
"eval_precision-l2": 0.9588039867109635,
"eval_recall": 0.9661164205039097,
"eval_recall-all": 0.9632892804698973,
"eval_recall-das": 0.9716840536512668,
"eval_recall-l1": 0.9643044619422572,
"eval_recall-l2": 0.962,
"eval_runtime": 6.0867,
"eval_samples_per_second": 111.062,
"eval_steps_per_second": 7.065,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9512893982808023,
"number": 519,
"precision": 0.9431818181818182,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9669260700389105,
"number": 503,
"precision": 0.9466666666666667,
"recall": 0.9880715705765407
},
"eval_ACT_L2": {
"f1": 0.10526315789473684,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9926470588235294,
"number": 678,
"precision": 0.9897360703812317,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.3928571428571428,
"number": 30,
"precision": 0.4230769230769231,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9647058823529412,
"number": 761,
"precision": 0.9596879063719116,
"recall": 0.9697766097240473
},
"eval_PER": {
"f1": 0.9852289512555391,
"number": 676,
"precision": 0.9837758112094396,
"recall": 0.9866863905325444
},
"eval_SPAT": {
"f1": 0.9590811198851399,
"number": 694,
"precision": 0.9556509298998569,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8985507246376813,
"number": 33,
"precision": 0.8611111111111112,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9640019860973188,
"eval_accuracy-all": 0.9731256206554121,
"eval_accuracy-das": 0.9754220456802384,
"eval_accuracy-l1": 0.9687189672293942,
"eval_accuracy-l2": 0.97753227408143,
"eval_f1": 0.9680589680589681,
"eval_f1-all": 0.9637989154330939,
"eval_f1-das": 0.9730332899386276,
"eval_f1-l1": 0.9616488390294807,
"eval_f1-l2": 0.9665551839464883,
"eval_loss": 0.15035659074783325,
"eval_precision": 0.9662435083669937,
"eval_precision-all": 0.9619660620245758,
"eval_precision-das": 0.9714073523950985,
"eval_precision-l1": 0.9559128630705395,
"eval_precision-l2": 0.9697986577181208,
"eval_recall": 0.9698812626701419,
"eval_recall-all": 0.9656387665198238,
"eval_recall-das": 0.9746646795827124,
"eval_recall-l1": 0.9674540682414698,
"eval_recall-l2": 0.9633333333333334,
"eval_runtime": 6.3141,
"eval_samples_per_second": 107.061,
"eval_steps_per_second": 6.81,
"step": 600
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 241578442301760.0,
"trial_name": null,
"trial_params": null
}