nlpso's picture
Load model and tokenizer
2eec7bc
raw history blame
No virus
44.2 kB
{
"best_metric": 0.9732283464566929,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/314-pretrained-camembert-ner-hierarchical-loss-iob2/checkpoint-1400",
"epoch": 3.674540682414698,
"global_step": 1400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8992673992673993,
"number": 519,
"precision": 0.8568935427574171,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.912639405204461,
"number": 503,
"precision": 0.8568935427574171,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9816041206769685,
"number": 678,
"precision": 0.9794419970631424,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9583333333333334,
"number": 762,
"precision": 0.9509043927648578,
"recall": 0.9658792650918635
},
"eval_PER": {
"f1": 0.9560117302052786,
"number": 676,
"precision": 0.9476744186046512,
"recall": 0.9644970414201184
},
"eval_SPAT": {
"f1": 0.9562724014336917,
"number": 694,
"precision": 0.9514978601997147,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9404170804369414,
"eval_accuracy-all": 0.9610228401191658,
"eval_accuracy-das": 0.9565541211519365,
"eval_accuracy-l1": 0.9500993048659384,
"eval_accuracy-l1l2": 0.9407894736842105,
"eval_accuracy-l2": 0.9719463753723933,
"eval_f1": 0.9438787055894999,
"eval_f1-all": 0.9416764361078547,
"eval_f1-das": 0.9402153731897512,
"eval_f1-l1": 0.9361261960175847,
"eval_f1-l1l2": 0.9384570933256284,
"eval_f1-l2": 0.9489347311464321,
"eval_loss": 0.6206728219985962,
"eval_precision": 0.9473086531910061,
"eval_precision-all": 0.9402985074626866,
"eval_precision-das": 0.9370836417468542,
"eval_precision-l1": 0.9225280326197758,
"eval_precision-l1l2": 0.9368329968272282,
"eval_precision-l2": 0.9642611683848797,
"eval_recall": 0.9404735062006765,
"eval_recall-all": 0.9430584091576166,
"eval_recall-das": 0.9433681073025335,
"eval_recall-l1": 0.9501312335958005,
"eval_recall-l1l2": 0.9400868306801736,
"eval_recall-l2": 0.9340878828229028,
"eval_runtime": 7.1724,
"eval_samples_per_second": 94.251,
"eval_steps_per_second": 5.995,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.9291784702549574,
"number": 519,
"precision": 0.9111111111111111,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9434324065196549,
"number": 503,
"precision": 0.9111111111111111,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9919058130978661,
"number": 678,
"precision": 0.9897209985315712,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.3103448275862069,
"number": 30,
"precision": 0.32142857142857145,
"recall": 0.3
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9521345407503234,
"number": 762,
"precision": 0.9387755102040817,
"recall": 0.9658792650918635
},
"eval_PER": {
"f1": 0.983050847457627,
"number": 676,
"precision": 0.9794419970631424,
"recall": 0.9866863905325444
},
"eval_SPAT": {
"f1": 0.9542857142857143,
"number": 694,
"precision": 0.9461756373937678,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.43373493975903615,
"number": 33,
"precision": 0.36,
"recall": 0.5454545454545454
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.951837140019861,
"eval_accuracy-all": 0.9676017874875869,
"eval_accuracy-das": 0.9716981132075472,
"eval_accuracy-l1": 0.9602780536246276,
"eval_accuracy-l1l2": 0.9524577954319762,
"eval_accuracy-l2": 0.9749255213505462,
"eval_f1": 0.9533235856484086,
"eval_f1-all": 0.9492511269448888,
"eval_f1-das": 0.9659385412810071,
"eval_f1-l1": 0.9512953367875648,
"eval_f1-l1l2": 0.9528720813637014,
"eval_f1-l2": 0.9466357308584686,
"eval_loss": 0.3473620116710663,
"eval_precision": 0.9510771992818672,
"eval_precision-all": 0.9406340057636887,
"eval_precision-das": 0.9598969830757911,
"eval_precision-l1": 0.9391304347826087,
"eval_precision-l1l2": 0.9432785025524674,
"eval_precision-l2": 0.9425742574257425,
"eval_recall": 0.9555806087936866,
"eval_recall-all": 0.9580275902553567,
"eval_recall-das": 0.9720566318926974,
"eval_recall-l1": 0.9637795275590552,
"eval_recall-l1l2": 0.9626628075253256,
"eval_recall-l2": 0.9507323568575233,
"eval_runtime": 7.1425,
"eval_samples_per_second": 94.645,
"eval_steps_per_second": 6.02,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9467680608365019,
"number": 519,
"precision": 0.9343339587242027,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9613899613899614,
"number": 503,
"precision": 0.9343339587242027,
"recall": 0.9900596421471173
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.22580645161290322,
"number": 30,
"precision": 0.21875,
"recall": 0.23333333333333334
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9609882964889467,
"number": 762,
"precision": 0.9523195876288659,
"recall": 0.9698162729658792
},
"eval_PER": {
"f1": 0.9808541973490428,
"number": 676,
"precision": 0.9765395894428153,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9700000000000001,
"number": 694,
"precision": 0.9617563739376771,
"recall": 0.978386167146974
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.6756756756756757,
"number": 33,
"precision": 0.6097560975609756,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.6,
"number": 6,
"precision": 0.75,
"recall": 0.5
},
"eval_accuracy": 0.9551886792452831,
"eval_accuracy-all": 0.9682845084409136,
"eval_accuracy-das": 0.9759185700099305,
"eval_accuracy-l1": 0.9617676266137041,
"eval_accuracy-l1l2": 0.9554369414101291,
"eval_accuracy-l2": 0.9748013902681232,
"eval_f1": 0.9625788999098286,
"eval_f1-all": 0.9594870300204023,
"eval_f1-das": 0.9718100890207715,
"eval_f1-l1": 0.9590461378952824,
"eval_f1-l1l2": 0.9622695852534562,
"eval_f1-l2": 0.9600532623169108,
"eval_loss": 0.24261289834976196,
"eval_precision": 0.9623619562767636,
"eval_precision-all": 0.952821997105644,
"eval_precision-das": 0.9675036927621861,
"eval_precision-l1": 0.9472606246799795,
"eval_precision-l1l2": 0.9575809687589567,
"eval_precision-l2": 0.9600532623169108,
"eval_recall": 0.9627959413754228,
"eval_recall-all": 0.9662459641913707,
"eval_recall-das": 0.9761549925484352,
"eval_recall-l1": 0.9711286089238845,
"eval_recall-l1l2": 0.9670043415340087,
"eval_recall-l2": 0.9600532623169108,
"eval_runtime": 8.0913,
"eval_samples_per_second": 83.547,
"eval_steps_per_second": 5.314,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9337121212121212,
"number": 519,
"precision": 0.9180633147113594,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9480769230769232,
"number": 503,
"precision": 0.9180633147113594,
"recall": 0.9801192842942346
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.21951219512195122,
"number": 30,
"precision": 0.17307692307692307,
"recall": 0.3
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9583875162548764,
"number": 762,
"precision": 0.9497422680412371,
"recall": 0.9671916010498688
},
"eval_PER": {
"f1": 0.9889298892988929,
"number": 676,
"precision": 0.9867452135493373,
"recall": 0.9911242603550295
},
"eval_SPAT": {
"f1": 0.964924838940587,
"number": 694,
"precision": 0.9587482219061166,
"recall": 0.9711815561959655
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9117647058823529,
"number": 33,
"precision": 0.8857142857142857,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.6153846153846153,
"number": 6,
"precision": 0.5714285714285714,
"recall": 0.6666666666666666
},
"eval_accuracy": 0.961395233366435,
"eval_accuracy-all": 0.9726911618669315,
"eval_accuracy-das": 0.9774081429990069,
"eval_accuracy-l1": 0.9667328699106256,
"eval_accuracy-l1l2": 0.9620158887785502,
"eval_accuracy-l2": 0.9786494538232373,
"eval_f1": 0.9638120926050797,
"eval_f1-all": 0.9575581395348837,
"eval_f1-das": 0.9719799591760996,
"eval_f1-l1": 0.9525283797729618,
"eval_f1-l1l2": 0.962516156828953,
"eval_f1-l2": 0.9640479360852197,
"eval_loss": 0.1985810250043869,
"eval_precision": 0.9607887071476585,
"eval_precision-all": 0.9484595450619061,
"eval_precision-das": 0.9682070240295748,
"eval_precision-l1": 0.9365804160324708,
"eval_precision-l1l2": 0.9552451539338654,
"eval_precision-l2": 0.9640479360852197,
"eval_recall": 0.9668545659526494,
"eval_recall-all": 0.966832990901086,
"eval_recall-das": 0.9757824143070045,
"eval_recall-l1": 0.9690288713910761,
"eval_recall-l1l2": 0.9698986975397974,
"eval_recall-l2": 0.9640479360852197,
"eval_runtime": 6.8598,
"eval_samples_per_second": 98.545,
"eval_steps_per_second": 6.268,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.5596,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9334600760456274,
"number": 519,
"precision": 0.9212007504690432,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.948792270531401,
"number": 503,
"precision": 0.9229323308270677,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.2758620689655172,
"number": 30,
"precision": 0.2857142857142857,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.36363636363636365,
"number": 7,
"precision": 0.5,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9538661468486029,
"number": 762,
"precision": 0.9446589446589446,
"recall": 0.963254593175853
},
"eval_PER": {
"f1": 0.9734904270986746,
"number": 676,
"precision": 0.969208211143695,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9549678341672624,
"number": 694,
"precision": 0.9475177304964539,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8571428571428571,
"number": 33,
"precision": 0.8108108108108109,
"recall": 0.9090909090909091
},
"eval_TITREP": {
"f1": 0.4615384615384615,
"number": 6,
"precision": 0.42857142857142855,
"recall": 0.5
},
"eval_accuracy": 0.961643495531281,
"eval_accuracy-all": 0.9728152929493545,
"eval_accuracy-das": 0.9765392254220456,
"eval_accuracy-l1": 0.9676017874875869,
"eval_accuracy-l1l2": 0.9621400198609732,
"eval_accuracy-l2": 0.9780287984111221,
"eval_f1": 0.9624465932089048,
"eval_f1-all": 0.9537968226206093,
"eval_f1-das": 0.9642393922549565,
"eval_f1-l1": 0.949117341640706,
"eval_f1-l1l2": 0.958699093394733,
"eval_f1-l2": 0.9597873047524094,
"eval_loss": 0.18591071665287018,
"eval_precision": 0.9598564700605517,
"eval_precision-all": 0.9473074696004632,
"eval_precision-das": 0.9590858827865831,
"eval_precision-l1": 0.9388803287108372,
"eval_precision-l1l2": 0.9533485975958786,
"eval_precision-l2": 0.9581950895819509,
"eval_recall": 0.9650507328072153,
"eval_recall-all": 0.9603756970942178,
"eval_recall-das": 0.9694485842026825,
"eval_recall-l1": 0.9595800524934384,
"eval_recall-l1l2": 0.96410998552822,
"eval_recall-l2": 0.9613848202396804,
"eval_runtime": 7.193,
"eval_samples_per_second": 93.98,
"eval_steps_per_second": 5.978,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9419600380589914,
"number": 519,
"precision": 0.9304511278195489,
"recall": 0.953757225433526
},
"eval_ACT_L1": {
"f1": 0.9573643410852714,
"number": 503,
"precision": 0.9338374291115312,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.10526315789473684,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.30985915492957744,
"number": 30,
"precision": 0.2682926829268293,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.30769230769230765,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9487345879299156,
"number": 762,
"precision": 0.938382541720154,
"recall": 0.9593175853018373
},
"eval_PER": {
"f1": 0.9823008849557522,
"number": 676,
"precision": 0.9794117647058823,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9590222861250898,
"number": 694,
"precision": 0.9569583931133429,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9117647058823529,
"number": 33,
"precision": 0.8857142857142857,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.5714285714285715,
"number": 6,
"precision": 0.5,
"recall": 0.6666666666666666
},
"eval_accuracy": 0.9654915590863953,
"eval_accuracy-all": 0.9756703078450845,
"eval_accuracy-das": 0.9801390268123138,
"eval_accuracy-l1": 0.9725670307845085,
"eval_accuracy-l1l2": 0.9663604766633564,
"eval_accuracy-l2": 0.9787735849056604,
"eval_f1": 0.9630793401413982,
"eval_f1-all": 0.9560151471016604,
"eval_f1-das": 0.9725213516524323,
"eval_f1-l1": 0.9543094496365525,
"eval_f1-l1l2": 0.9620471535365152,
"eval_f1-l2": 0.958195089581951,
"eval_loss": 0.14890924096107483,
"eval_precision": 0.9586684539767649,
"eval_precision-all": 0.9488291413703382,
"eval_precision-das": 0.9692820133234641,
"eval_precision-l1": 0.9440164355418593,
"eval_precision-l1l2": 0.9557269351613824,
"eval_precision-l2": 0.955026455026455,
"eval_recall": 0.9675310033821871,
"eval_recall-all": 0.9633108306427942,
"eval_recall-das": 0.9757824143070045,
"eval_recall-l1": 0.9648293963254593,
"eval_recall-l1l2": 0.968451519536903,
"eval_recall-l2": 0.9613848202396804,
"eval_runtime": 6.5579,
"eval_samples_per_second": 103.082,
"eval_steps_per_second": 6.557,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9421800947867298,
"number": 519,
"precision": 0.9272388059701493,
"recall": 0.9576107899807321
},
"eval_ACT_L1": {
"f1": 0.9573643410852714,
"number": 503,
"precision": 0.9338374291115312,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.26086956521739124,
"number": 16,
"precision": 0.42857142857142855,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.4126984126984127,
"number": 30,
"precision": 0.3939393939393939,
"recall": 0.43333333333333335
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9566343042071198,
"number": 762,
"precision": 0.9438058748403576,
"recall": 0.9698162729658792
},
"eval_PER": {
"f1": 0.9852507374631269,
"number": 676,
"precision": 0.9823529411764705,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9634931997136722,
"number": 694,
"precision": 0.957325746799431,
"recall": 0.9697406340057637
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.927536231884058,
"number": 33,
"precision": 0.8888888888888888,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9669811320754716,
"eval_accuracy-all": 0.9762288977159881,
"eval_accuracy-das": 0.980759682224429,
"eval_accuracy-l1": 0.9724428997020854,
"eval_accuracy-l1l2": 0.9677259185700099,
"eval_accuracy-l2": 0.9800148957298908,
"eval_f1": 0.9667938074938299,
"eval_f1-all": 0.9609898107714702,
"eval_f1-das": 0.9720111214087118,
"eval_f1-l1": 0.96,
"eval_f1-l1l2": 0.964824120603015,
"eval_f1-l2": 0.9622516556291391,
"eval_loss": 0.15314123034477234,
"eval_precision": 0.962045099352534,
"eval_precision-all": 0.9532197516604101,
"eval_precision-das": 0.967170785687938,
"eval_precision-l1": 0.9501285347043702,
"eval_precision-l1l2": 0.9572649572649573,
"eval_precision-l2": 0.9571805006587615,
"eval_recall": 0.9715896279594137,
"eval_recall-all": 0.9688875843850895,
"eval_recall-das": 0.9769001490312966,
"eval_recall-l1": 0.9700787401574803,
"eval_recall-l1l2": 0.9725036179450073,
"eval_recall-l2": 0.9673768308921438,
"eval_runtime": 7.6675,
"eval_samples_per_second": 88.164,
"eval_steps_per_second": 5.608,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9300567107750471,
"number": 519,
"precision": 0.9128014842300557,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9568627450980391,
"number": 503,
"precision": 0.9439071566731141,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.2105263157894737,
"number": 16,
"precision": 0.18181818181818182,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.37499999999999994,
"number": 30,
"precision": 0.3,
"recall": 0.5
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9635890767230169,
"number": 762,
"precision": 0.9548969072164949,
"recall": 0.9724409448818898
},
"eval_PER": {
"f1": 0.986019131714496,
"number": 676,
"precision": 0.9809663250366032,
"recall": 0.9911242603550295
},
"eval_SPAT": {
"f1": 0.9591982820329277,
"number": 694,
"precision": 0.9530583214793741,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9090909090909091,
"number": 33,
"precision": 0.9090909090909091,
"recall": 0.9090909090909091
},
"eval_TITREP": {
"f1": 0.6153846153846153,
"number": 6,
"precision": 0.5714285714285714,
"recall": 0.6666666666666666
},
"eval_accuracy": 0.9632571996027806,
"eval_accuracy-all": 0.9734980139026812,
"eval_accuracy-das": 0.9815044687189672,
"eval_accuracy-l1": 0.9703326713008937,
"eval_accuracy-l1l2": 0.9643743793445879,
"eval_accuracy-l2": 0.9766633565044687,
"eval_f1": 0.9649299719887955,
"eval_f1-all": 0.9584543869843115,
"eval_f1-das": 0.9727323316638843,
"eval_f1-l1": 0.9554173146708138,
"eval_f1-l1l2": 0.9624534250501576,
"eval_f1-l2": 0.9623265036351619,
"eval_loss": 0.13265174627304077,
"eval_precision": 0.9590200445434298,
"eval_precision-all": 0.9488064423353466,
"eval_precision-das": 0.9685999261174733,
"eval_precision-l1": 0.9436763952892985,
"eval_precision-l1l2": 0.9531649162645472,
"eval_precision-l2": 0.9553805774278216,
"eval_recall": 0.970913190529876,
"eval_recall-all": 0.9683005576753743,
"eval_recall-das": 0.9769001490312966,
"eval_recall-l1": 0.9674540682414698,
"eval_recall-l1l2": 0.9719247467438495,
"eval_recall-l2": 0.9693741677762983,
"eval_runtime": 7.359,
"eval_samples_per_second": 91.86,
"eval_steps_per_second": 5.843,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9409559512652297,
"number": 519,
"precision": 0.916058394160584,
"recall": 0.9672447013487476
},
"eval_ACT_L1": {
"f1": 0.96484375,
"number": 503,
"precision": 0.9481765834932822,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.37209302325581395,
"number": 16,
"precision": 0.2962962962962963,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.47368421052631576,
"number": 30,
"precision": 0.391304347826087,
"recall": 0.6
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9609375,
"number": 762,
"precision": 0.9534883720930233,
"recall": 0.968503937007874
},
"eval_PER": {
"f1": 0.9852507374631269,
"number": 676,
"precision": 0.9823529411764705,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9597701149425288,
"number": 694,
"precision": 0.9570200573065902,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9253731343283583,
"number": 33,
"precision": 0.9117647058823529,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.42857142857142855,
"number": 6,
"precision": 0.375,
"recall": 0.5
},
"eval_accuracy": 0.9653674280039722,
"eval_accuracy-all": 0.9744289970208541,
"eval_accuracy-das": 0.9823733862959285,
"eval_accuracy-l1": 0.9714498510427011,
"eval_accuracy-l1l2": 0.9663604766633564,
"eval_accuracy-l2": 0.9774081429990069,
"eval_f1": 0.9669171245934731,
"eval_f1-all": 0.960616189507339,
"eval_f1-das": 0.9740452354467927,
"eval_f1-l1": 0.96,
"eval_f1-l1l2": 0.9648745519713262,
"eval_f1-l2": 0.9613988782580007,
"eval_loss": 0.14285241067409515,
"eval_precision": 0.9618473895582329,
"eval_precision-all": 0.9513529073114565,
"eval_precision-das": 0.9693726937269372,
"eval_precision-l1": 0.9501285347043702,
"eval_precision-l1l2": 0.9559659090909091,
"eval_precision-l2": 0.9529103989535644,
"eval_recall": 0.9720405862457723,
"eval_recall-all": 0.9700616378045201,
"eval_recall-das": 0.9787630402384501,
"eval_recall-l1": 0.9700787401574803,
"eval_recall-l1l2": 0.9739507959479016,
"eval_recall-l2": 0.9700399467376831,
"eval_runtime": 7.5384,
"eval_samples_per_second": 89.674,
"eval_steps_per_second": 5.704,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1442,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9571020019065777,
"number": 519,
"precision": 0.9471698113207547,
"recall": 0.9672447013487476
},
"eval_ACT_L1": {
"f1": 0.9782178217821782,
"number": 503,
"precision": 0.9743589743589743,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.41025641025641024,
"number": 16,
"precision": 0.34782608695652173,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9919058130978661,
"number": 678,
"precision": 0.9897209985315712,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.47368421052631576,
"number": 30,
"precision": 0.391304347826087,
"recall": 0.6
},
"eval_FT": {
"f1": 0.30769230769230765,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9712041884816753,
"number": 762,
"precision": 0.9686684073107049,
"recall": 0.973753280839895
},
"eval_PER": {
"f1": 0.9867060561299853,
"number": 676,
"precision": 0.9852507374631269,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9621157969978557,
"number": 694,
"precision": 0.9546099290780142,
"recall": 0.9697406340057637
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9253731343283583,
"number": 33,
"precision": 0.9117647058823529,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.42857142857142855,
"number": 6,
"precision": 0.375,
"recall": 0.5
},
"eval_accuracy": 0.9658639523336644,
"eval_accuracy-all": 0.9746772591857001,
"eval_accuracy-das": 0.9833664349553128,
"eval_accuracy-l1": 0.971077457795432,
"eval_accuracy-l1l2": 0.9664846077457795,
"eval_accuracy-l2": 0.9782770605759682,
"eval_f1": 0.9711776626885835,
"eval_f1-all": 0.9657484331730068,
"eval_f1-das": 0.9778769287971741,
"eval_f1-l1": 0.9648529028898724,
"eval_f1-l1l2": 0.9700633275762809,
"eval_f1-l2": 0.966887417218543,
"eval_loss": 0.1273569017648697,
"eval_precision": 0.9698673262873847,
"eval_precision-all": 0.959177764910249,
"eval_precision-das": 0.9758812615955473,
"eval_precision-l1": 0.9571280991735537,
"eval_precision-l1l2": 0.9647867162897223,
"eval_precision-l2": 0.9617918313570487,
"eval_recall": 0.9724915445321308,
"eval_recall-all": 0.9724097446433813,
"eval_recall-das": 0.9798807749627422,
"eval_recall-l1": 0.9727034120734908,
"eval_recall-l1l2": 0.975397973950796,
"eval_recall-l2": 0.9720372836218375,
"eval_runtime": 6.084,
"eval_samples_per_second": 111.111,
"eval_steps_per_second": 7.068,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9563567362428842,
"number": 519,
"precision": 0.9420560747663551,
"recall": 0.9710982658959537
},
"eval_ACT_L1": {
"f1": 0.9782608695652174,
"number": 503,
"precision": 0.9724950884086444,
"recall": 0.9840954274353877
},
"eval_ACT_L2": {
"f1": 0.4285714285714286,
"number": 16,
"precision": 0.34615384615384615,
"recall": 0.5625
},
"eval_CARDINAL": {
"f1": 0.9933677229182019,
"number": 678,
"precision": 0.9926362297496318,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.5070422535211268,
"number": 30,
"precision": 0.43902439024390244,
"recall": 0.6
},
"eval_FT": {
"f1": 0.36363636363636365,
"number": 7,
"precision": 0.5,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9713541666666666,
"number": 762,
"precision": 0.9638242894056848,
"recall": 0.979002624671916
},
"eval_PER": {
"f1": 0.9859778597785979,
"number": 676,
"precision": 0.9837997054491899,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9654676258992806,
"number": 694,
"precision": 0.9640804597701149,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9696969696969697,
"number": 33,
"precision": 0.9696969696969697,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.42857142857142855,
"number": 6,
"precision": 0.375,
"recall": 0.5
},
"eval_accuracy": 0.9636295928500497,
"eval_accuracy-all": 0.9731256206554121,
"eval_accuracy-das": 0.9812562065541212,
"eval_accuracy-l1": 0.9700844091360477,
"eval_accuracy-l1l2": 0.964746772591857,
"eval_accuracy-l2": 0.9761668321747765,
"eval_f1": 0.9710437710437709,
"eval_f1-all": 0.9679113185530922,
"eval_f1-das": 0.9770114942528736,
"eval_f1-l1": 0.9671018276762402,
"eval_f1-l1l2": 0.9714039373473201,
"eval_f1-l2": 0.9689358889623265,
"eval_loss": 0.15453395247459412,
"eval_precision": 0.9667039106145251,
"eval_precision-all": 0.9620179762249927,
"eval_precision-das": 0.9723247232472325,
"eval_precision-l1": 0.9620779220779221,
"eval_precision-l1l2": 0.9646118721461188,
"eval_precision-l2": 0.9619422572178478,
"eval_recall": 0.9754227733934611,
"eval_recall-all": 0.9738773114176695,
"eval_recall-das": 0.9817436661698957,
"eval_recall-l1": 0.9721784776902888,
"eval_recall-l1l2": 0.9782923299565847,
"eval_recall-l2": 0.9760319573901465,
"eval_runtime": 6.429,
"eval_samples_per_second": 105.148,
"eval_steps_per_second": 6.688,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9466666666666668,
"number": 519,
"precision": 0.935969868173258,
"recall": 0.9576107899807321
},
"eval_ACT_L1": {
"f1": 0.9674234945705825,
"number": 503,
"precision": 0.9607843137254902,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.37837837837837834,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.547945205479452,
"number": 30,
"precision": 0.46511627906976744,
"recall": 0.6666666666666666
},
"eval_FT": {
"f1": 0.4615384615384615,
"number": 7,
"precision": 0.5,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9647979139504563,
"number": 762,
"precision": 0.9585492227979274,
"recall": 0.9711286089238845
},
"eval_PER": {
"f1": 0.9881656804733728,
"number": 676,
"precision": 0.9881656804733728,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9691756272401433,
"number": 694,
"precision": 0.9643366619115549,
"recall": 0.9740634005763689
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9393939393939394,
"number": 33,
"precision": 0.9393939393939394,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.6,
"number": 6,
"precision": 0.75,
"recall": 0.5
},
"eval_accuracy": 0.964746772591857,
"eval_accuracy-all": 0.9746151936444886,
"eval_accuracy-das": 0.9803872889771599,
"eval_accuracy-l1": 0.9708291956305859,
"eval_accuracy-l1l2": 0.9652432969215492,
"eval_accuracy-l2": 0.9784011916583912,
"eval_f1": 0.9706774519716885,
"eval_f1-all": 0.9667347534286548,
"eval_f1-das": 0.9745589600742803,
"eval_f1-l1": 0.9668839634941329,
"eval_f1-l1l2": 0.9678068410462776,
"eval_f1-l2": 0.9665452136469029,
"eval_loss": 0.14055882394313812,
"eval_precision": 0.9673085535154501,
"eval_precision-all": 0.9611256164780969,
"eval_precision-das": 0.9714920399851906,
"eval_precision-l1": 0.960621761658031,
"eval_precision-l1l2": 0.96117613474165,
"eval_precision-l2": 0.961766644693474,
"eval_recall": 0.9740698985343855,
"eval_recall-all": 0.9724097446433813,
"eval_recall-das": 0.977645305514158,
"eval_recall-l1": 0.9732283464566929,
"eval_recall-l1l2": 0.9745296671490593,
"eval_recall-l2": 0.9713715046604527,
"eval_runtime": 5.9342,
"eval_samples_per_second": 113.916,
"eval_steps_per_second": 7.246,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.9363295880149812,
"number": 519,
"precision": 0.9107468123861566,
"recall": 0.9633911368015414
},
"eval_ACT_L1": {
"f1": 0.9591439688715954,
"number": 503,
"precision": 0.939047619047619,
"recall": 0.9801192842942346
},
"eval_ACT_L2": {
"f1": 0.35000000000000003,
"number": 16,
"precision": 0.2916666666666667,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.43037974683544306,
"number": 30,
"precision": 0.3469387755102041,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.42857142857142855,
"number": 7,
"precision": 0.42857142857142855,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9636363636363636,
"number": 762,
"precision": 0.9537275064267352,
"recall": 0.973753280839895
},
"eval_PER": {
"f1": 0.9845246868091379,
"number": 676,
"precision": 0.9809104258443465,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9707351891506067,
"number": 694,
"precision": 0.9618104667609618,
"recall": 0.9798270893371758
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9253731343283583,
"number": 33,
"precision": 0.9117647058823529,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.42857142857142855,
"number": 6,
"precision": 0.375,
"recall": 0.5
},
"eval_accuracy": 0.967974180734856,
"eval_accuracy-all": 0.9767254220456802,
"eval_accuracy-das": 0.9826216484607746,
"eval_accuracy-l1": 0.9735600794438928,
"eval_accuracy-l1l2": 0.9685948361469712,
"eval_accuracy-l2": 0.9798907646474677,
"eval_f1": 0.9691876750700281,
"eval_f1-all": 0.961889581220113,
"eval_f1-das": 0.9733333333333334,
"eval_f1-l1": 0.960951642099819,
"eval_f1-l1l2": 0.9658928059615935,
"eval_f1-l2": 0.963085036255768,
"eval_loss": 0.13519717752933502,
"eval_precision": 0.9632516703786191,
"eval_precision-all": 0.9499141385231826,
"eval_precision-das": 0.96759941089838,
"eval_precision-l1": 0.9469928644240571,
"eval_precision-l1l2": 0.9565711041725802,
"eval_precision-l2": 0.9536553524804178,
"eval_recall": 0.9751972942502819,
"eval_recall-all": 0.9741708247725271,
"eval_recall-das": 0.9791356184798807,
"eval_recall-l1": 0.9753280839895013,
"eval_recall-l1l2": 0.975397973950796,
"eval_recall-l2": 0.9727030625832224,
"eval_runtime": 6.3863,
"eval_samples_per_second": 105.852,
"eval_steps_per_second": 6.733,
"step": 1300
},
{
"epoch": 3.67,
"eval_ACT": {
"f1": 0.9461756373937679,
"number": 519,
"precision": 0.9277777777777778,
"recall": 0.9653179190751445
},
"eval_ACT_L1": {
"f1": 0.9686274509803922,
"number": 503,
"precision": 0.9555125725338491,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.358974358974359,
"number": 16,
"precision": 0.30434782608695654,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.5507246376811593,
"number": 30,
"precision": 0.48717948717948717,
"recall": 0.6333333333333333
},
"eval_FT": {
"f1": 0.5,
"number": 7,
"precision": 0.6,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9679529103989535,
"number": 762,
"precision": 0.9647979139504563,
"recall": 0.9711286089238845
},
"eval_PER": {
"f1": 0.9881656804733728,
"number": 676,
"precision": 0.9881656804733728,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9727403156384505,
"number": 694,
"precision": 0.9685714285714285,
"recall": 0.9769452449567724
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9696969696969697,
"number": 33,
"precision": 0.9696969696969697,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.4615384615384615,
"number": 6,
"precision": 0.42857142857142855,
"recall": 0.5
},
"eval_accuracy": 0.9664846077457795,
"eval_accuracy-all": 0.9749255213505462,
"eval_accuracy-das": 0.9826216484607746,
"eval_accuracy-l1": 0.9723187686196624,
"eval_accuracy-l1l2": 0.9669811320754716,
"eval_accuracy-l2": 0.97753227408143,
"eval_f1": 0.9732283464566929,
"eval_f1-all": 0.9683442742523706,
"eval_f1-das": 0.9756912228613843,
"eval_f1-l1": 0.9689861871253583,
"eval_f1-l1l2": 0.9711981566820277,
"eval_f1-l2": 0.9675281643472498,
"eval_loss": 0.1356203556060791,
"eval_precision": 0.971043771043771,
"eval_precision-all": 0.9625870069605569,
"eval_precision-das": 0.9719038817005545,
"eval_precision-l1": 0.9622153209109731,
"eval_precision-l1l2": 0.9664660361134996,
"eval_precision-l2": 0.9630606860158312,
"eval_recall": 0.9754227733934611,
"eval_recall-all": 0.9741708247725271,
"eval_recall-das": 0.9795081967213115,
"eval_recall-l1": 0.9758530183727034,
"eval_recall-l1l2": 0.9759768451519537,
"eval_recall-l2": 0.9720372836218375,
"eval_runtime": 7.0867,
"eval_samples_per_second": 95.39,
"eval_steps_per_second": 6.068,
"step": 1400
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 564085470663792.0,
"trial_name": null,
"trial_params": null
}