m2_joint_label_ocr_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
305673d
{
"best_metric": 0.9654571843251089,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/221-camembert-ner-joint-labelling-io/checkpoint-2000",
"epoch": 5.2493438320209975,
"global_step": 2000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8818604651162791,
"number": 519,
"precision": 0.8525179856115108,
"recall": 0.9132947976878613
},
"eval_ACT_L1": {
"f1": 0.8951841359773371,
"number": 503,
"precision": 0.8525179856115108,
"recall": 0.9423459244532804
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9765739385065886,
"number": 678,
"precision": 0.9694767441860465,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9248704663212436,
"number": 761,
"precision": 0.9118773946360154,
"recall": 0.938239159001314
},
"eval_PER": {
"f1": 0.9236417033773863,
"number": 676,
"precision": 0.9169096209912536,
"recall": 0.9304733727810651
},
"eval_SPAT": {
"f1": 0.9313304721030043,
"number": 694,
"precision": 0.9247159090909091,
"recall": 0.9380403458213257
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.931030118957226,
"eval_accuracy-all": 0.9533029612756264,
"eval_accuracy-das": 0.9460895975702354,
"eval_accuracy-l1": 0.9406479372310808,
"eval_accuracy-l2": 0.9659579853201721,
"eval_f1": 0.9194107452339687,
"eval_f1-all": 0.9189506082368459,
"eval_f1-das": 0.9173768062245277,
"eval_f1-l1": 0.910932225396001,
"eval_f1-l2": 0.9293405114401078,
"eval_loss": 0.3786505162715912,
"eval_precision": 0.9136050516647531,
"eval_precision-all": 0.9174714661984197,
"eval_precision-das": 0.9126428308145964,
"eval_precision-l1": 0.9013360739979445,
"eval_precision-l2": 0.938817131203263,
"eval_recall": 0.9252906976744186,
"eval_recall-all": 0.9204345273047563,
"eval_recall-das": 0.9221601489757915,
"eval_recall-l1": 0.920734908136483,
"eval_recall-l2": 0.9200532978014657,
"eval_runtime": 5.4791,
"eval_samples_per_second": 123.379,
"eval_steps_per_second": 7.848,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.8797061524334251,
"number": 519,
"precision": 0.8403508771929824,
"recall": 0.9229287090558767
},
"eval_ACT_L1": {
"f1": 0.8928238583410996,
"number": 503,
"precision": 0.8403508771929824,
"recall": 0.952286282306163
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9773557341124909,
"number": 678,
"precision": 0.9681620839363242,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.09523809523809522,
"number": 30,
"precision": 0.16666666666666666,
"recall": 0.06666666666666667
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9347123464770524,
"number": 761,
"precision": 0.9198473282442748,
"recall": 0.9500657030223391
},
"eval_PER": {
"f1": 0.9285187914517319,
"number": 676,
"precision": 0.9251101321585903,
"recall": 0.9319526627218935
},
"eval_SPAT": {
"f1": 0.9212207239176721,
"number": 694,
"precision": 0.9076923076923077,
"recall": 0.9351585014409222
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9339407744874715,
"eval_accuracy-all": 0.9529865856745128,
"eval_accuracy-das": 0.9482409516578082,
"eval_accuracy-l1": 0.9407744874715261,
"eval_accuracy-l2": 0.9651986838774994,
"eval_f1": 0.9257654534950897,
"eval_f1-all": 0.9188164990526161,
"eval_f1-das": 0.9222242748937742,
"eval_f1-l1": 0.9065155807365439,
"eval_f1-l2": 0.9348556077904635,
"eval_loss": 0.2861093580722809,
"eval_precision": 0.9199196326061998,
"eval_precision-all": 0.912301013024602,
"eval_precision-das": 0.9149560117302052,
"eval_precision-l1": 0.8897876643073812,
"eval_precision-l2": 0.942450914014895,
"eval_recall": 0.9316860465116279,
"eval_recall-all": 0.9254257193188491,
"eval_recall-das": 0.929608938547486,
"eval_recall-l1": 0.9238845144356955,
"eval_recall-l2": 0.927381745502998,
"eval_runtime": 5.893,
"eval_samples_per_second": 114.712,
"eval_steps_per_second": 7.297,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9220532319391636,
"number": 519,
"precision": 0.9099437148217636,
"recall": 0.9344894026974951
},
"eval_ACT_L1": {
"f1": 0.9362934362934364,
"number": 503,
"precision": 0.9099437148217636,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9860396767083027,
"number": 678,
"precision": 0.9824304538799414,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.27450980392156865,
"number": 30,
"precision": 0.3333333333333333,
"recall": 0.23333333333333334
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9346405228758171,
"number": 761,
"precision": 0.929778933680104,
"recall": 0.9395532194480947
},
"eval_PER": {
"f1": 0.9381443298969072,
"number": 676,
"precision": 0.9340175953079178,
"recall": 0.9423076923076923
},
"eval_SPAT": {
"f1": 0.9430199430199431,
"number": 694,
"precision": 0.9323943661971831,
"recall": 0.9538904899135446
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.17777777777777776,
"number": 33,
"precision": 0.3333333333333333,
"recall": 0.12121212121212122
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9472285497342445,
"eval_accuracy-all": 0.9614654517843584,
"eval_accuracy-das": 0.9639331814730449,
"eval_accuracy-l1": 0.9538091622374083,
"eval_accuracy-l2": 0.9691217413313086,
"eval_f1": 0.9426157879405767,
"eval_f1-all": 0.9333920187793427,
"eval_f1-das": 0.9416153702667412,
"eval_f1-l1": 0.9301480135029863,
"eval_f1-l2": 0.9376053962900506,
"eval_loss": 0.22815603017807007,
"eval_precision": 0.9445417396380619,
"eval_precision-all": 0.9328445747800587,
"eval_precision-das": 0.9431988041853513,
"eval_precision-l1": 0.920349434737924,
"eval_precision-l2": 0.9494535519125683,
"eval_recall": 0.9406976744186046,
"eval_recall-all": 0.9339401056958309,
"eval_recall-das": 0.9400372439478585,
"eval_recall-l1": 0.9401574803149606,
"eval_recall-l2": 0.9260493004663558,
"eval_runtime": 6.5502,
"eval_samples_per_second": 103.203,
"eval_steps_per_second": 6.565,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9244019138755981,
"number": 519,
"precision": 0.9182509505703422,
"recall": 0.930635838150289
},
"eval_ACT_L1": {
"f1": 0.9448818897637794,
"number": 503,
"precision": 0.935672514619883,
"recall": 0.9542743538767395
},
"eval_ACT_L2": {
"f1": 0.20689655172413793,
"number": 16,
"precision": 0.23076923076923078,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9874723655121592,
"number": 678,
"precision": 0.9867452135493373,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.28235294117647064,
"number": 30,
"precision": 0.21818181818181817,
"recall": 0.4
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9488859764089123,
"number": 761,
"precision": 0.9464052287581699,
"recall": 0.9513797634691196
},
"eval_PER": {
"f1": 0.951683748169839,
"number": 676,
"precision": 0.9420289855072463,
"recall": 0.9615384615384616
},
"eval_SPAT": {
"f1": 0.9491768074445239,
"number": 694,
"precision": 0.9431009957325747,
"recall": 0.9553314121037464
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.5263157894736842,
"number": 33,
"precision": 0.625,
"recall": 0.45454545454545453
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9395089850670716,
"eval_accuracy-all": 0.9572892938496583,
"eval_accuracy-das": 0.9578587699316629,
"eval_accuracy-l1": 0.9484940521386991,
"eval_accuracy-l2": 0.9660845355606176,
"eval_f1": 0.9442109839153746,
"eval_f1-all": 0.9395443925233645,
"eval_f1-das": 0.9498415066194295,
"eval_f1-l1": 0.933781686497672,
"eval_f1-l2": 0.9470154258886653,
"eval_loss": 0.19686226546764374,
"eval_precision": 0.9413464316671483,
"eval_precision-all": 0.9346310284718187,
"eval_precision-das": 0.9510828976848394,
"eval_precision-l1": 0.9204487506374299,
"eval_precision-l2": 0.9534098582039163,
"eval_recall": 0.9470930232558139,
"eval_recall-all": 0.9445096887844979,
"eval_recall-das": 0.9486033519553073,
"eval_recall-l1": 0.94750656167979,
"eval_recall-l2": 0.9407061958694204,
"eval_runtime": 6.1906,
"eval_samples_per_second": 109.198,
"eval_steps_per_second": 6.946,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.3718,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9380362249761677,
"number": 519,
"precision": 0.9283018867924528,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.952565343659245,
"number": 503,
"precision": 0.9283018867924528,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.986019131714496,
"number": 678,
"precision": 0.9838472834067548,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.23809523809523808,
"number": 30,
"precision": 0.4166666666666667,
"recall": 0.16666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.945645055664702,
"number": 761,
"precision": 0.9425587467362925,
"recall": 0.9487516425755584
},
"eval_PER": {
"f1": 0.9683124539425203,
"number": 676,
"precision": 0.9647577092511013,
"recall": 0.9718934911242604
},
"eval_SPAT": {
"f1": 0.9472182596291013,
"number": 694,
"precision": 0.9378531073446328,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8181818181818182,
"number": 33,
"precision": 0.8181818181818182,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.25,
"number": 6,
"precision": 0.5,
"recall": 0.16666666666666666
},
"eval_accuracy": 0.9534295115160719,
"eval_accuracy-all": 0.9654517843583903,
"eval_accuracy-das": 0.9665907365223994,
"eval_accuracy-l1": 0.958744621614781,
"eval_accuracy-l2": 0.9721589471019995,
"eval_f1": 0.9550021843599825,
"eval_f1-all": 0.9496993694090042,
"eval_f1-das": 0.9570552147239264,
"eval_f1-l1": 0.9478623566214807,
"eval_f1-l2": 0.9520616828695944,
"eval_loss": 0.18782156705856323,
"eval_precision": 0.9568135395389553,
"eval_precision-all": 0.9487254614708468,
"eval_precision-das": 0.955456570155902,
"eval_precision-l1": 0.9414810978767478,
"eval_precision-l2": 0.9581646423751687,
"eval_recall": 0.9531976744186047,
"eval_recall-all": 0.9506752789195537,
"eval_recall-das": 0.958659217877095,
"eval_recall-l1": 0.9543307086614173,
"eval_recall-l2": 0.9460359760159893,
"eval_runtime": 6.174,
"eval_samples_per_second": 109.491,
"eval_steps_per_second": 6.965,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9334600760456274,
"number": 519,
"precision": 0.9212007504690432,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9468599033816425,
"number": 503,
"precision": 0.9210526315789473,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.11764705882352941,
"number": 16,
"precision": 1.0,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9867452135493373,
"number": 678,
"precision": 0.9852941176470589,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.3333333333333333,
"number": 30,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9490403706154864,
"number": 761,
"precision": 0.956,
"recall": 0.9421813403416557
},
"eval_PER": {
"f1": 0.9572271386430679,
"number": 676,
"precision": 0.9544117647058824,
"recall": 0.9600591715976331
},
"eval_SPAT": {
"f1": 0.9538904899135446,
"number": 694,
"precision": 0.9538904899135446,
"recall": 0.9538904899135446
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.6153846153846154,
"number": 33,
"precision": 0.625,
"recall": 0.6060606060606061
},
"eval_TITREP": {
"f1": 0.4444444444444444,
"number": 6,
"precision": 0.6666666666666666,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9544419134396356,
"eval_accuracy-all": 0.9670969374841812,
"eval_accuracy-das": 0.9669703872437357,
"eval_accuracy-l1": 0.960642875221463,
"eval_accuracy-l2": 0.9735509997468995,
"eval_f1": 0.9518265172463979,
"eval_f1-all": 0.9462397179788484,
"eval_f1-das": 0.952807312068644,
"eval_f1-l1": 0.9429835980213485,
"eval_f1-l2": 0.9504550050556118,
"eval_loss": 0.1709740161895752,
"eval_precision": 0.9530749052754299,
"eval_precision-all": 0.9467960023515579,
"eval_precision-das": 0.9544095665171899,
"eval_precision-l1": 0.9354338842975206,
"eval_precision-l2": 0.9618008185538881,
"eval_recall": 0.9505813953488372,
"eval_recall-all": 0.9456840869054609,
"eval_recall-das": 0.9512104283054004,
"eval_recall-l1": 0.9506561679790027,
"eval_recall-l2": 0.9393737508327782,
"eval_runtime": 6.1402,
"eval_samples_per_second": 110.094,
"eval_steps_per_second": 7.003,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9339712918660287,
"number": 519,
"precision": 0.9277566539923955,
"recall": 0.9402697495183044
},
"eval_ACT_L1": {
"f1": 0.9536031589338598,
"number": 503,
"precision": 0.9470588235294117,
"recall": 0.9602385685884692
},
"eval_ACT_L2": {
"f1": 0.3125,
"number": 16,
"precision": 0.3125,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9867647058823529,
"number": 678,
"precision": 0.9838709677419355,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.5,
"number": 30,
"precision": 0.47058823529411764,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9457161543492479,
"number": 761,
"precision": 0.94140625,
"recall": 0.9500657030223391
},
"eval_PER": {
"f1": 0.9711324944485566,
"number": 676,
"precision": 0.9718518518518519,
"recall": 0.9704142011834319
},
"eval_SPAT": {
"f1": 0.9611510791366907,
"number": 694,
"precision": 0.9597701149425287,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9032258064516129,
"number": 33,
"precision": 0.9655172413793104,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.2857142857142857,
"number": 6,
"precision": 1.0,
"recall": 0.16666666666666666
},
"eval_accuracy": 0.95292331055429,
"eval_accuracy-all": 0.9641862819539357,
"eval_accuracy-das": 0.9721589471019995,
"eval_accuracy-l1": 0.9586180713743356,
"eval_accuracy-l2": 0.9697544925335359,
"eval_f1": 0.9564586357039186,
"eval_f1-all": 0.9537919906117059,
"eval_f1-das": 0.9595827900912646,
"eval_f1-l1": 0.9544502617801047,
"eval_f1-l2": 0.9529529529529529,
"eval_loss": 0.16730760037899017,
"eval_precision": 0.9550724637681159,
"eval_precision-all": 0.9530929346232776,
"eval_precision-das": 0.9597615499254843,
"eval_precision-l1": 0.951958224543081,
"eval_precision-l2": 0.9545454545454546,
"eval_recall": 0.9578488372093024,
"eval_recall-all": 0.9544920728126834,
"eval_recall-das": 0.9594040968342644,
"eval_recall-l1": 0.9569553805774278,
"eval_recall-l2": 0.9513657561625583,
"eval_runtime": 6.0205,
"eval_samples_per_second": 112.283,
"eval_steps_per_second": 7.142,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9249762583095916,
"number": 519,
"precision": 0.9119850187265918,
"recall": 0.9383429672447013
},
"eval_ACT_L1": {
"f1": 0.9545454545454545,
"number": 503,
"precision": 0.9489194499017681,
"recall": 0.9602385685884692
},
"eval_ACT_L2": {
"f1": 0.19512195121951217,
"number": 16,
"precision": 0.16,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.9851851851851852,
"number": 678,
"precision": 0.9895833333333334,
"recall": 0.9808259587020649
},
"eval_DESC": {
"f1": 0.4347826086956522,
"number": 30,
"precision": 0.38461538461538464,
"recall": 0.5
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9516971279373369,
"number": 761,
"precision": 0.9455252918287937,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9748892171344165,
"number": 676,
"precision": 0.9734513274336283,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9342857142857142,
"number": 694,
"precision": 0.9263456090651558,
"recall": 0.9423631123919308
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8656716417910447,
"number": 33,
"precision": 0.8529411764705882,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.5,
"number": 6,
"precision": 1.0,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9510250569476082,
"eval_accuracy-all": 0.9619083776259175,
"eval_accuracy-das": 0.9702606934953176,
"eval_accuracy-l1": 0.9567198177676538,
"eval_accuracy-l2": 0.9670969374841812,
"eval_f1": 0.955323469683783,
"eval_f1-all": 0.9473838059047063,
"eval_f1-das": 0.9587053571428571,
"eval_f1-l1": 0.9444878811571541,
"eval_f1-l2": 0.95108153078203,
"eval_loss": 0.1715497374534607,
"eval_precision": 0.9533873769542559,
"eval_precision-all": 0.9432479627473807,
"eval_precision-das": 0.9576365663322185,
"eval_precision-l1": 0.937888198757764,
"eval_precision-l2": 0.9501329787234043,
"eval_recall": 0.9572674418604651,
"eval_recall-all": 0.9515560775102759,
"eval_recall-das": 0.9597765363128492,
"eval_recall-l1": 0.9511811023622048,
"eval_recall-l2": 0.9520319786808794,
"eval_runtime": 6.0149,
"eval_samples_per_second": 112.387,
"eval_steps_per_second": 7.149,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9271523178807947,
"number": 519,
"precision": 0.9107806691449815,
"recall": 0.9441233140655106
},
"eval_ACT_L1": {
"f1": 0.9500489715964741,
"number": 503,
"precision": 0.9362934362934363,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.2777777777777778,
"number": 16,
"precision": 0.25,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9816581071166545,
"number": 678,
"precision": 0.9766423357664233,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.39473684210526316,
"number": 30,
"precision": 0.32608695652173914,
"recall": 0.5
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9455022980958635,
"number": 761,
"precision": 0.9448818897637795,
"recall": 0.9461235216819974
},
"eval_PER": {
"f1": 0.9763663220088628,
"number": 676,
"precision": 0.9749262536873157,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9526542324246772,
"number": 694,
"precision": 0.9485714285714286,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.823529411764706,
"number": 33,
"precision": 0.8,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9524171095925082,
"eval_accuracy-all": 0.9633637053910402,
"eval_accuracy-das": 0.9712730954188813,
"eval_accuracy-l1": 0.9593773728170083,
"eval_accuracy-l2": 0.9673500379650721,
"eval_f1": 0.9529599073672022,
"eval_f1-all": 0.9477829638273045,
"eval_f1-das": 0.9574902543159458,
"eval_f1-l1": 0.9487912659214973,
"eval_f1-l2": 0.9464938517779994,
"eval_loss": 0.15614591538906097,
"eval_precision": 0.9489766503315077,
"eval_precision-all": 0.9417391304347826,
"eval_precision-das": 0.9544781643227239,
"eval_precision-l1": 0.9397528321318228,
"eval_precision-l2": 0.9442970822281167,
"eval_recall": 0.9569767441860465,
"eval_recall-all": 0.953904873752202,
"eval_recall-das": 0.9605214152700187,
"eval_recall-l1": 0.958005249343832,
"eval_recall-l2": 0.9487008660892738,
"eval_runtime": 6.5502,
"eval_samples_per_second": 103.202,
"eval_steps_per_second": 6.565,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1448,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9319470699432891,
"number": 519,
"precision": 0.9146567717996289,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9547244094488189,
"number": 503,
"precision": 0.9454191033138402,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.380952380952381,
"number": 16,
"precision": 0.3076923076923077,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9852941176470589,
"number": 678,
"precision": 0.9824046920821115,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.45569620253164556,
"number": 30,
"precision": 0.3673469387755102,
"recall": 0.6
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9586342744583061,
"number": 761,
"precision": 0.958005249343832,
"recall": 0.9592641261498029
},
"eval_PER": {
"f1": 0.9719350073855243,
"number": 676,
"precision": 0.9705014749262537,
"recall": 0.9733727810650887
},
"eval_SPAT": {
"f1": 0.9469914040114613,
"number": 694,
"precision": 0.9415954415954416,
"recall": 0.952449567723343
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7692307692307692,
"number": 33,
"precision": 0.78125,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.4444444444444444,
"number": 6,
"precision": 0.6666666666666666,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9536826119969628,
"eval_accuracy-all": 0.9634902556314857,
"eval_accuracy-das": 0.9735509997468995,
"eval_accuracy-l1": 0.9593773728170083,
"eval_accuracy-l2": 0.967603138445963,
"eval_f1": 0.958689665168865,
"eval_f1-all": 0.9505326134539618,
"eval_f1-das": 0.9622466059140785,
"eval_f1-l1": 0.9472316090460099,
"eval_f1-l2": 0.9547571523619428,
"eval_loss": 0.16222244501113892,
"eval_precision": 0.9560566637756577,
"eval_precision-all": 0.944879605454018,
"eval_precision-das": 0.9609955423476969,
"eval_precision-l1": 0.9382080329557158,
"eval_precision-l2": 0.9534883720930233,
"eval_recall": 0.9613372093023256,
"eval_recall-all": 0.956253669994128,
"eval_recall-das": 0.9635009310986965,
"eval_recall-l1": 0.9564304461942257,
"eval_recall-l2": 0.9560293137908061,
"eval_runtime": 5.8166,
"eval_samples_per_second": 116.219,
"eval_steps_per_second": 7.393,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9426386233269598,
"number": 519,
"precision": 0.9354838709677419,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9614243323442137,
"number": 503,
"precision": 0.9566929133858267,
"recall": 0.9662027833001988
},
"eval_ACT_L2": {
"f1": 0.39999999999999997,
"number": 16,
"precision": 0.3684210526315789,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9882179675994109,
"number": 678,
"precision": 0.986764705882353,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.5217391304347826,
"number": 30,
"precision": 0.46153846153846156,
"recall": 0.6
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9420949902407288,
"number": 761,
"precision": 0.9329896907216495,
"recall": 0.9513797634691196
},
"eval_PER": {
"f1": 0.9770879526977089,
"number": 676,
"precision": 0.9763663220088626,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9577060931899642,
"number": 694,
"precision": 0.9529243937232525,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8,
"number": 33,
"precision": 0.8125,
"recall": 0.7878787878787878
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.5
},
"eval_accuracy": 0.9539357124778537,
"eval_accuracy-all": 0.9638699063528221,
"eval_accuracy-das": 0.9727916983042267,
"eval_accuracy-l1": 0.9610225259427992,
"eval_accuracy-l2": 0.9667172867628449,
"eval_f1": 0.9571883135666762,
"eval_f1-all": 0.9534102526654009,
"eval_f1-das": 0.9606533036377134,
"eval_f1-l1": 0.9571801566579634,
"eval_f1-l2": 0.9486244613854822,
"eval_loss": 0.17501647770404816,
"eval_precision": 0.9525043177892919,
"eval_precision-all": 0.948561464690497,
"eval_precision-das": 0.9574546799852016,
"eval_precision-l1": 0.9522077922077922,
"eval_precision-l2": 0.9439313984168866,
"eval_recall": 0.9619186046511627,
"eval_recall-all": 0.9583088667058133,
"eval_recall-das": 0.9638733705772812,
"eval_recall-l1": 0.9622047244094488,
"eval_recall-l2": 0.9533644237175216,
"eval_runtime": 6.2615,
"eval_samples_per_second": 107.961,
"eval_steps_per_second": 6.867,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9417382999044891,
"number": 519,
"precision": 0.9337121212121212,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9594460929772503,
"number": 503,
"precision": 0.9547244094488189,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.4444444444444445,
"number": 16,
"precision": 0.4,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9867647058823529,
"number": 678,
"precision": 0.9838709677419355,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.45454545454545453,
"number": 30,
"precision": 0.4166666666666667,
"recall": 0.5
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9510763209393347,
"number": 761,
"precision": 0.944300518134715,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9785661492978566,
"number": 676,
"precision": 0.9778434268833087,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9562096195262024,
"number": 694,
"precision": 0.9527896995708155,
"recall": 0.9596541786743515
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8055555555555556,
"number": 33,
"precision": 0.7435897435897436,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.5454545454545454,
"number": 6,
"precision": 0.6,
"recall": 0.5
},
"eval_accuracy": 0.9538091622374083,
"eval_accuracy-all": 0.9638066312325994,
"eval_accuracy-das": 0.9724120475828905,
"eval_accuracy-l1": 0.9598835737787902,
"eval_accuracy-l2": 0.9677296886864085,
"eval_f1": 0.9574775817182528,
"eval_f1-all": 0.9549970777323202,
"eval_f1-das": 0.9612172944887734,
"eval_f1-l1": 0.9558169934640522,
"eval_f1-l2": 0.9539582643259357,
"eval_loss": 0.17843317985534668,
"eval_precision": 0.9527921704087507,
"eval_precision-all": 0.9505526468877254,
"eval_precision-das": 0.9578402366863905,
"eval_precision-l1": 0.9520833333333333,
"eval_precision-l2": 0.9486166007905138,
"eval_recall": 0.9622093023255814,
"eval_recall-all": 0.9594832648267763,
"eval_recall-das": 0.9646182495344506,
"eval_recall-l1": 0.9595800524934384,
"eval_recall-l2": 0.9593604263824117,
"eval_runtime": 6.7294,
"eval_samples_per_second": 100.455,
"eval_steps_per_second": 6.39,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.939047619047619,
"number": 519,
"precision": 0.928436911487759,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9576354679802955,
"number": 503,
"precision": 0.94921875,
"recall": 0.9662027833001988
},
"eval_ACT_L2": {
"f1": 0.39999999999999997,
"number": 16,
"precision": 0.3684210526315789,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9852724594992636,
"number": 678,
"precision": 0.9838235294117647,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.5161290322580646,
"number": 30,
"precision": 0.5,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.4444444444444445,
"number": 7,
"precision": 1.0,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9546946815495732,
"number": 761,
"precision": 0.9540682414698163,
"recall": 0.9553219448094612
},
"eval_PER": {
"f1": 0.9785661492978566,
"number": 676,
"precision": 0.9778434268833087,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9569583931133429,
"number": 694,
"precision": 0.9528571428571428,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7096774193548386,
"number": 33,
"precision": 0.7586206896551724,
"recall": 0.6666666666666666
},
"eval_TITREP": {
"f1": 0.5,
"number": 6,
"precision": 0.5,
"recall": 0.5
},
"eval_accuracy": 0.960642875221463,
"eval_accuracy-all": 0.9691217413313086,
"eval_accuracy-das": 0.9778537079220451,
"eval_accuracy-l1": 0.9653252341179448,
"eval_accuracy-l2": 0.9729182485446722,
"eval_f1": 0.9602562236133353,
"eval_f1-all": 0.9556043956043958,
"eval_f1-das": 0.9622044312046174,
"eval_f1-l1": 0.9571353894406691,
"eval_f1-l2": 0.9536512170723576,
"eval_loss": 0.16250379383563995,
"eval_precision": 0.9617964421114027,
"eval_precision-all": 0.9537876572097105,
"eval_precision-das": 0.9620253164556962,
"eval_precision-l1": 0.9531494013534617,
"eval_precision-l2": 0.9546061415220294,
"eval_recall": 0.9587209302325581,
"eval_recall-all": 0.9574280681150911,
"eval_recall-das": 0.9623836126629423,
"eval_recall-l1": 0.9611548556430446,
"eval_recall-l2": 0.9526982011992006,
"eval_runtime": 5.7506,
"eval_samples_per_second": 117.554,
"eval_steps_per_second": 7.478,
"step": 1300
},
{
"epoch": 3.67,
"eval_ACT": {
"f1": 0.9439696106362773,
"number": 519,
"precision": 0.9307116104868914,
"recall": 0.9576107899807321
},
"eval_ACT_L1": {
"f1": 0.9616519174041297,
"number": 503,
"precision": 0.9513618677042801,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.4444444444444445,
"number": 16,
"precision": 0.4,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9830757910228108,
"number": 678,
"precision": 0.9809104258443465,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.4927536231884058,
"number": 30,
"precision": 0.4358974358974359,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9560655737704917,
"number": 761,
"precision": 0.9541884816753927,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9807692307692307,
"number": 676,
"precision": 0.9807692307692307,
"recall": 0.9807692307692307
},
"eval_SPAT": {
"f1": 0.9590222861250898,
"number": 694,
"precision": 0.9569583931133429,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.875,
"number": 33,
"precision": 0.9032258064516129,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9583649708934447,
"eval_accuracy-all": 0.9695646671728676,
"eval_accuracy-das": 0.9716527461402177,
"eval_accuracy-l1": 0.9645659326752721,
"eval_accuracy-l2": 0.9745634016704632,
"eval_f1": 0.9603128621089224,
"eval_f1-all": 0.957284961966062,
"eval_f1-das": 0.9644783336432956,
"eval_f1-l1": 0.9584964761158966,
"eval_f1-l2": 0.9557404326123128,
"eval_loss": 0.17416799068450928,
"eval_precision": 0.956986143187067,
"eval_precision-all": 0.953935860058309,
"eval_precision-das": 0.9632243684992571,
"eval_precision-l1": 0.9532710280373832,
"eval_precision-l2": 0.9547872340425532,
"eval_recall": 0.9636627906976745,
"eval_recall-all": 0.9606576629477392,
"eval_recall-das": 0.9657355679702049,
"eval_recall-l1": 0.9637795275590552,
"eval_recall-l2": 0.9566955363091273,
"eval_runtime": 6.3107,
"eval_samples_per_second": 107.119,
"eval_steps_per_second": 6.814,
"step": 1400
},
{
"epoch": 3.94,
"learning_rate": 7e-05,
"loss": 0.0854,
"step": 1500
},
{
"epoch": 3.94,
"eval_ACT": {
"f1": 0.9382716049382717,
"number": 519,
"precision": 0.9250936329588015,
"recall": 0.9518304431599229
},
"eval_ACT_L1": {
"f1": 0.9614243323442137,
"number": 503,
"precision": 0.9566929133858267,
"recall": 0.9662027833001988
},
"eval_ACT_L2": {
"f1": 0.380952380952381,
"number": 16,
"precision": 0.3076923076923077,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9874538745387453,
"number": 678,
"precision": 0.9881831610044313,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.5142857142857143,
"number": 30,
"precision": 0.45,
"recall": 0.6
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9559500328731098,
"number": 761,
"precision": 0.9565789473684211,
"recall": 0.9553219448094612
},
"eval_PER": {
"f1": 0.9763313609467456,
"number": 676,
"precision": 0.9763313609467456,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9577060931899642,
"number": 694,
"precision": 0.9529243937232525,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8529411764705883,
"number": 33,
"precision": 0.8285714285714286,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.5454545454545454,
"number": 6,
"precision": 0.6,
"recall": 0.5
},
"eval_accuracy": 0.9515312579093901,
"eval_accuracy-all": 0.9630473297899266,
"eval_accuracy-das": 0.9717792963806631,
"eval_accuracy-l1": 0.9570994684889901,
"eval_accuracy-l2": 0.9689951910908631,
"eval_f1": 0.9592576482528636,
"eval_f1-all": 0.9562673687289747,
"eval_f1-das": 0.9624395686128672,
"eval_f1-l1": 0.9566579634464752,
"eval_f1-l2": 0.9557698703026272,
"eval_loss": 0.18355852365493774,
"eval_precision": 0.9568990454150998,
"eval_precision-all": 0.9527834450597493,
"eval_precision-das": 0.961010025993316,
"eval_precision-l1": 0.9516883116883117,
"eval_precision-l2": 0.954183266932271,
"eval_recall": 0.9616279069767442,
"eval_recall-all": 0.959776864357017,
"eval_recall-das": 0.9638733705772812,
"eval_recall-l1": 0.9616797900262467,
"eval_recall-l2": 0.9573617588274483,
"eval_runtime": 6.1311,
"eval_samples_per_second": 110.258,
"eval_steps_per_second": 7.013,
"step": 1500
},
{
"epoch": 4.2,
"eval_ACT": {
"f1": 0.9375,
"number": 519,
"precision": 0.9217877094972067,
"recall": 0.953757225433526
},
"eval_ACT_L1": {
"f1": 0.9577187807276303,
"number": 503,
"precision": 0.9474708171206225,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.41025641025641024,
"number": 16,
"precision": 0.34782608695652173,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9874908020603386,
"number": 678,
"precision": 0.9853157121879589,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.5217391304347826,
"number": 30,
"precision": 0.46153846153846156,
"recall": 0.6
},
"eval_FT": {
"f1": 0.4615384615384615,
"number": 7,
"precision": 0.5,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.953063885267275,
"number": 761,
"precision": 0.9456662354463131,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.9792899408284024,
"number": 676,
"precision": 0.9792899408284024,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9592566118656183,
"number": 694,
"precision": 0.9517730496453901,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.5,
"number": 2,
"precision": 0.5,
"recall": 0.5
},
"eval_TITREH": {
"f1": 0.84375,
"number": 33,
"precision": 0.8709677419354839,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.5
},
"eval_accuracy": 0.9557074158440901,
"eval_accuracy-all": 0.9666540116426221,
"eval_accuracy-das": 0.9732978992660086,
"eval_accuracy-l1": 0.9629207795494812,
"eval_accuracy-l2": 0.9703872437357631,
"eval_f1": 0.959525874530211,
"eval_f1-all": 0.9561544064093226,
"eval_f1-das": 0.9638286032276017,
"eval_f1-l1": 0.9575631346003645,
"eval_f1-l2": 0.9543650793650794,
"eval_loss": 0.1747445911169052,
"eval_precision": 0.9542840713053479,
"eval_precision-all": 0.9488291413703382,
"eval_precision-das": 0.9600886917960089,
"eval_precision-l1": 0.949896694214876,
"eval_precision-l2": 0.9474720945502298,
"eval_recall": 0.9648255813953488,
"eval_recall-all": 0.9635936582501468,
"eval_recall-das": 0.9675977653631285,
"eval_recall-l1": 0.9653543307086614,
"eval_recall-l2": 0.9613590939373751,
"eval_runtime": 6.3526,
"eval_samples_per_second": 106.414,
"eval_steps_per_second": 6.769,
"step": 1600
},
{
"epoch": 4.46,
"eval_ACT": {
"f1": 0.9438629876308278,
"number": 519,
"precision": 0.9323308270676691,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9663366336633663,
"number": 503,
"precision": 0.9625246548323472,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.39024390243902435,
"number": 16,
"precision": 0.32,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9867452135493373,
"number": 678,
"precision": 0.9852941176470589,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.5373134328358209,
"number": 30,
"precision": 0.4864864864864865,
"recall": 0.6
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9619921363040629,
"number": 761,
"precision": 0.9594771241830066,
"recall": 0.9645203679369251
},
"eval_PER": {
"f1": 0.9792899408284024,
"number": 676,
"precision": 0.9792899408284024,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9627507163323783,
"number": 694,
"precision": 0.9572649572649573,
"recall": 0.968299711815562
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8484848484848486,
"number": 33,
"precision": 0.8484848484848485,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.5454545454545454,
"number": 6,
"precision": 0.6,
"recall": 0.5
},
"eval_accuracy": 0.9554543153631991,
"eval_accuracy-all": 0.9662743609212857,
"eval_accuracy-das": 0.975069602632245,
"eval_accuracy-l1": 0.9619083776259175,
"eval_accuracy-l2": 0.970640344216654,
"eval_f1": 0.9615552009284782,
"eval_f1-all": 0.9603627321924821,
"eval_f1-das": 0.9665178571428571,
"eval_f1-l1": 0.9615887117846877,
"eval_f1-l2": 0.9588039867109635,
"eval_loss": 0.17034310102462769,
"eval_precision": 0.9597451491456704,
"eval_precision-all": 0.9568638880792771,
"eval_precision-das": 0.9654403567447045,
"eval_precision-l1": 0.9573361082206036,
"eval_precision-l2": 0.9562624254473161,
"eval_recall": 0.9633720930232558,
"eval_recall-all": 0.9638872577803875,
"eval_recall-das": 0.9675977653631285,
"eval_recall-l1": 0.9658792650918635,
"eval_recall-l2": 0.9613590939373751,
"eval_runtime": 6.4585,
"eval_samples_per_second": 104.669,
"eval_steps_per_second": 6.658,
"step": 1700
},
{
"epoch": 4.72,
"eval_ACT": {
"f1": 0.9551098376313275,
"number": 519,
"precision": 0.946969696969697,
"recall": 0.9633911368015414
},
"eval_ACT_L1": {
"f1": 0.971540726202159,
"number": 503,
"precision": 0.9593023255813954,
"recall": 0.9840954274353877
},
"eval_ACT_L2": {
"f1": 0.35714285714285715,
"number": 16,
"precision": 0.4166666666666667,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9867452135493373,
"number": 678,
"precision": 0.9852941176470589,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.523076923076923,
"number": 30,
"precision": 0.4857142857142857,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.42857142857142855,
"number": 7,
"precision": 0.42857142857142855,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.945645055664702,
"number": 761,
"precision": 0.9425587467362925,
"recall": 0.9487516425755584
},
"eval_PER": {
"f1": 0.9800148038490007,
"number": 676,
"precision": 0.9807407407407407,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9463902787705505,
"number": 694,
"precision": 0.9390070921985816,
"recall": 0.9538904899135446
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.875,
"number": 33,
"precision": 0.9032258064516129,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.30769230769230765,
"number": 6,
"precision": 0.2857142857142857,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9596304732978993,
"eval_accuracy-all": 0.968299164768413,
"eval_accuracy-das": 0.9749430523917996,
"eval_accuracy-l1": 0.9654517843583903,
"eval_accuracy-l2": 0.9711465451784358,
"eval_f1": 0.9605339524085896,
"eval_f1-all": 0.9548311650343518,
"eval_f1-das": 0.9643255295429208,
"eval_f1-l1": 0.9569976544175137,
"eval_f1-l2": 0.9520639147802931,
"eval_loss": 0.17404037714004517,
"eval_precision": 0.958864426419467,
"eval_precision-all": 0.9508005822416302,
"eval_precision-das": 0.9621802002224694,
"eval_precision-l1": 0.9503105590062112,
"eval_precision-l2": 0.9514304723885563,
"eval_recall": 0.9622093023255814,
"eval_recall-all": 0.9588960657662948,
"eval_recall-das": 0.9664804469273743,
"eval_recall-l1": 0.9637795275590552,
"eval_recall-l2": 0.9526982011992006,
"eval_runtime": 5.4184,
"eval_samples_per_second": 124.761,
"eval_steps_per_second": 7.936,
"step": 1800
},
{
"epoch": 4.99,
"eval_ACT": {
"f1": 0.939047619047619,
"number": 519,
"precision": 0.928436911487759,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.961576354679803,
"number": 503,
"precision": 0.953125,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.2857142857142857,
"number": 16,
"precision": 0.2631578947368421,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9815770081061163,
"number": 678,
"precision": 0.9808541973490427,
"recall": 0.9823008849557522
},
"eval_DESC": {
"f1": 0.5483870967741935,
"number": 30,
"precision": 0.53125,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.953063885267275,
"number": 761,
"precision": 0.9456662354463131,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.977810650887574,
"number": 676,
"precision": 0.977810650887574,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9626972740315638,
"number": 694,
"precision": 0.9585714285714285,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8285714285714285,
"number": 33,
"precision": 0.7837837837837838,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.28571428571428575,
"number": 6,
"precision": 0.25,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9579853201721084,
"eval_accuracy-all": 0.9677929638066313,
"eval_accuracy-das": 0.9754492533535813,
"eval_accuracy-l1": 0.9646924829157175,
"eval_accuracy-l2": 0.9708934446975449,
"eval_f1": 0.9568491167101071,
"eval_f1-all": 0.9554549437709947,
"eval_f1-das": 0.9595997034840623,
"eval_f1-l1": 0.96002090410243,
"eval_f1-l2": 0.9496688741721854,
"eval_loss": 0.18735294044017792,
"eval_precision": 0.953260242354299,
"eval_precision-all": 0.95059575704737,
"eval_precision-das": 0.9549981556621173,
"eval_precision-l1": 0.9557752341311134,
"eval_precision-l2": 0.9440421329822252,
"eval_recall": 0.9604651162790697,
"eval_recall-all": 0.9603640634174986,
"eval_recall-das": 0.964245810055866,
"eval_recall-l1": 0.9643044619422572,
"eval_recall-l2": 0.955363091272485,
"eval_runtime": 5.4368,
"eval_samples_per_second": 124.338,
"eval_steps_per_second": 7.909,
"step": 1900
},
{
"epoch": 5.25,
"learning_rate": 6e-05,
"loss": 0.0555,
"step": 2000
},
{
"epoch": 5.25,
"eval_ACT": {
"f1": 0.9514747859181732,
"number": 519,
"precision": 0.9398496240601504,
"recall": 0.9633911368015414
},
"eval_ACT_L1": {
"f1": 0.970414201183432,
"number": 503,
"precision": 0.9628180039138943,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.4324324324324324,
"number": 16,
"precision": 0.38095238095238093,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9874723655121592,
"number": 678,
"precision": 0.9867452135493373,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.5538461538461538,
"number": 30,
"precision": 0.5142857142857142,
"recall": 0.6
},
"eval_FT": {
"f1": 0.30769230769230765,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9625246548323472,
"number": 761,
"precision": 0.9631578947368421,
"recall": 0.961892247043364
},
"eval_PER": {
"f1": 0.9800148038490007,
"number": 676,
"precision": 0.9807407407407407,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9612625538020085,
"number": 694,
"precision": 0.9571428571428572,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8923076923076922,
"number": 33,
"precision": 0.90625,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.5,
"number": 6,
"precision": 0.5,
"recall": 0.5
},
"eval_accuracy": 0.958744621614781,
"eval_accuracy-all": 0.9686155403695267,
"eval_accuracy-das": 0.9762085547962541,
"eval_accuracy-l1": 0.9640597317134902,
"eval_accuracy-l2": 0.9731713490255631,
"eval_f1": 0.9654571843251089,
"eval_f1-all": 0.9620846142585272,
"eval_f1-das": 0.9683897359613239,
"eval_f1-l1": 0.9628855201254575,
"eval_f1-l2": 0.9610648918469219,
"eval_loss": 0.18852506577968597,
"eval_precision": 0.9640579710144928,
"eval_precision-all": 0.9594160583941606,
"eval_precision-das": 0.966951355365763,
"eval_precision-l1": 0.9588755856324831,
"eval_precision-l2": 0.9601063829787234,
"eval_recall": 0.9668604651162791,
"eval_recall-all": 0.9647680563711099,
"eval_recall-das": 0.9698324022346368,
"eval_recall-l1": 0.9669291338582677,
"eval_recall-l2": 0.9620253164556962,
"eval_runtime": 5.6224,
"eval_samples_per_second": 120.232,
"eval_steps_per_second": 7.648,
"step": 2000
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 813927239246016.0,
"trial_name": null,
"trial_params": null
}