{ "best_metric": 0.9654571843251089, "best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/221-camembert-ner-joint-labelling-io/checkpoint-2000", "epoch": 5.2493438320209975, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26, "eval_ACT": { "f1": 0.8818604651162791, "number": 519, "precision": 0.8525179856115108, "recall": 0.9132947976878613 }, "eval_ACT_L1": { "f1": 0.8951841359773371, "number": 503, "precision": 0.8525179856115108, "recall": 0.9423459244532804 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9765739385065886, "number": 678, "precision": 0.9694767441860465, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.0, "number": 30, "precision": 0.0, "recall": 0.0 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9248704663212436, "number": 761, "precision": 0.9118773946360154, "recall": 0.938239159001314 }, "eval_PER": { "f1": 0.9236417033773863, "number": 676, "precision": 0.9169096209912536, "recall": 0.9304733727810651 }, "eval_SPAT": { "f1": 0.9313304721030043, "number": 694, "precision": 0.9247159090909091, "recall": 0.9380403458213257 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.0, "number": 33, "precision": 0.0, "recall": 0.0 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.931030118957226, "eval_accuracy-all": 0.9533029612756264, "eval_accuracy-das": 0.9460895975702354, "eval_accuracy-l1": 0.9406479372310808, "eval_accuracy-l2": 0.9659579853201721, "eval_f1": 0.9194107452339687, "eval_f1-all": 0.9189506082368459, "eval_f1-das": 0.9173768062245277, "eval_f1-l1": 0.910932225396001, "eval_f1-l2": 0.9293405114401078, "eval_loss": 0.3786505162715912, "eval_precision": 0.9136050516647531, "eval_precision-all": 0.9174714661984197, "eval_precision-das": 0.9126428308145964, "eval_precision-l1": 0.9013360739979445, "eval_precision-l2": 0.938817131203263, "eval_recall": 0.9252906976744186, "eval_recall-all": 0.9204345273047563, "eval_recall-das": 0.9221601489757915, "eval_recall-l1": 0.920734908136483, "eval_recall-l2": 0.9200532978014657, "eval_runtime": 5.4791, "eval_samples_per_second": 123.379, "eval_steps_per_second": 7.848, "step": 100 }, { "epoch": 0.52, "eval_ACT": { "f1": 0.8797061524334251, "number": 519, "precision": 0.8403508771929824, "recall": 0.9229287090558767 }, "eval_ACT_L1": { "f1": 0.8928238583410996, "number": 503, "precision": 0.8403508771929824, "recall": 0.952286282306163 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9773557341124909, "number": 678, "precision": 0.9681620839363242, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.09523809523809522, "number": 30, "precision": 0.16666666666666666, "recall": 0.06666666666666667 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9347123464770524, "number": 761, "precision": 0.9198473282442748, "recall": 0.9500657030223391 }, "eval_PER": { "f1": 0.9285187914517319, "number": 676, "precision": 0.9251101321585903, "recall": 0.9319526627218935 }, "eval_SPAT": { "f1": 0.9212207239176721, "number": 694, "precision": 0.9076923076923077, "recall": 0.9351585014409222 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.0, "number": 33, "precision": 0.0, "recall": 0.0 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9339407744874715, "eval_accuracy-all": 0.9529865856745128, "eval_accuracy-das": 0.9482409516578082, "eval_accuracy-l1": 0.9407744874715261, "eval_accuracy-l2": 0.9651986838774994, "eval_f1": 0.9257654534950897, "eval_f1-all": 0.9188164990526161, "eval_f1-das": 0.9222242748937742, "eval_f1-l1": 0.9065155807365439, "eval_f1-l2": 0.9348556077904635, "eval_loss": 0.2861093580722809, "eval_precision": 0.9199196326061998, "eval_precision-all": 0.912301013024602, "eval_precision-das": 0.9149560117302052, "eval_precision-l1": 0.8897876643073812, "eval_precision-l2": 0.942450914014895, "eval_recall": 0.9316860465116279, "eval_recall-all": 0.9254257193188491, "eval_recall-das": 0.929608938547486, "eval_recall-l1": 0.9238845144356955, "eval_recall-l2": 0.927381745502998, "eval_runtime": 5.893, "eval_samples_per_second": 114.712, "eval_steps_per_second": 7.297, "step": 200 }, { "epoch": 0.79, "eval_ACT": { "f1": 0.9220532319391636, "number": 519, "precision": 0.9099437148217636, "recall": 0.9344894026974951 }, "eval_ACT_L1": { "f1": 0.9362934362934364, "number": 503, "precision": 0.9099437148217636, "recall": 0.9642147117296223 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9860396767083027, "number": 678, "precision": 0.9824304538799414, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.27450980392156865, "number": 30, "precision": 0.3333333333333333, "recall": 0.23333333333333334 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9346405228758171, "number": 761, "precision": 0.929778933680104, "recall": 0.9395532194480947 }, "eval_PER": { "f1": 0.9381443298969072, "number": 676, "precision": 0.9340175953079178, "recall": 0.9423076923076923 }, "eval_SPAT": { "f1": 0.9430199430199431, "number": 694, "precision": 0.9323943661971831, "recall": 0.9538904899135446 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.17777777777777776, "number": 33, "precision": 0.3333333333333333, "recall": 0.12121212121212122 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9472285497342445, "eval_accuracy-all": 0.9614654517843584, "eval_accuracy-das": 0.9639331814730449, "eval_accuracy-l1": 0.9538091622374083, "eval_accuracy-l2": 0.9691217413313086, "eval_f1": 0.9426157879405767, "eval_f1-all": 0.9333920187793427, "eval_f1-das": 0.9416153702667412, "eval_f1-l1": 0.9301480135029863, "eval_f1-l2": 0.9376053962900506, "eval_loss": 0.22815603017807007, "eval_precision": 0.9445417396380619, "eval_precision-all": 0.9328445747800587, "eval_precision-das": 0.9431988041853513, "eval_precision-l1": 0.920349434737924, "eval_precision-l2": 0.9494535519125683, "eval_recall": 0.9406976744186046, "eval_recall-all": 0.9339401056958309, "eval_recall-das": 0.9400372439478585, "eval_recall-l1": 0.9401574803149606, "eval_recall-l2": 0.9260493004663558, "eval_runtime": 6.5502, "eval_samples_per_second": 103.203, "eval_steps_per_second": 6.565, "step": 300 }, { "epoch": 1.05, "eval_ACT": { "f1": 0.9244019138755981, "number": 519, "precision": 0.9182509505703422, "recall": 0.930635838150289 }, "eval_ACT_L1": { "f1": 0.9448818897637794, "number": 503, "precision": 0.935672514619883, "recall": 0.9542743538767395 }, "eval_ACT_L2": { "f1": 0.20689655172413793, "number": 16, "precision": 0.23076923076923078, "recall": 0.1875 }, "eval_CARDINAL": { "f1": 0.9874723655121592, "number": 678, "precision": 0.9867452135493373, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.28235294117647064, "number": 30, "precision": 0.21818181818181817, "recall": 0.4 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9488859764089123, "number": 761, "precision": 0.9464052287581699, "recall": 0.9513797634691196 }, "eval_PER": { "f1": 0.951683748169839, "number": 676, "precision": 0.9420289855072463, "recall": 0.9615384615384616 }, "eval_SPAT": { "f1": 0.9491768074445239, "number": 694, "precision": 0.9431009957325747, "recall": 0.9553314121037464 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.5263157894736842, "number": 33, "precision": 0.625, "recall": 0.45454545454545453 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9395089850670716, "eval_accuracy-all": 0.9572892938496583, "eval_accuracy-das": 0.9578587699316629, "eval_accuracy-l1": 0.9484940521386991, "eval_accuracy-l2": 0.9660845355606176, "eval_f1": 0.9442109839153746, "eval_f1-all": 0.9395443925233645, "eval_f1-das": 0.9498415066194295, "eval_f1-l1": 0.933781686497672, "eval_f1-l2": 0.9470154258886653, "eval_loss": 0.19686226546764374, "eval_precision": 0.9413464316671483, "eval_precision-all": 0.9346310284718187, "eval_precision-das": 0.9510828976848394, "eval_precision-l1": 0.9204487506374299, "eval_precision-l2": 0.9534098582039163, "eval_recall": 0.9470930232558139, "eval_recall-all": 0.9445096887844979, "eval_recall-das": 0.9486033519553073, "eval_recall-l1": 0.94750656167979, "eval_recall-l2": 0.9407061958694204, "eval_runtime": 6.1906, "eval_samples_per_second": 109.198, "eval_steps_per_second": 6.946, "step": 400 }, { "epoch": 1.31, "learning_rate": 9e-05, "loss": 0.3718, "step": 500 }, { "epoch": 1.31, "eval_ACT": { "f1": 0.9380362249761677, "number": 519, "precision": 0.9283018867924528, "recall": 0.9479768786127167 }, "eval_ACT_L1": { "f1": 0.952565343659245, "number": 503, "precision": 0.9283018867924528, "recall": 0.9781312127236581 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.986019131714496, "number": 678, "precision": 0.9838472834067548, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.23809523809523808, "number": 30, "precision": 0.4166666666666667, "recall": 0.16666666666666666 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.945645055664702, "number": 761, "precision": 0.9425587467362925, "recall": 0.9487516425755584 }, "eval_PER": { "f1": 0.9683124539425203, "number": 676, "precision": 0.9647577092511013, "recall": 0.9718934911242604 }, "eval_SPAT": { "f1": 0.9472182596291013, "number": 694, "precision": 0.9378531073446328, "recall": 0.9567723342939481 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8181818181818182, "number": 33, "precision": 0.8181818181818182, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.25, "number": 6, "precision": 0.5, "recall": 0.16666666666666666 }, "eval_accuracy": 0.9534295115160719, "eval_accuracy-all": 0.9654517843583903, "eval_accuracy-das": 0.9665907365223994, "eval_accuracy-l1": 0.958744621614781, "eval_accuracy-l2": 0.9721589471019995, "eval_f1": 0.9550021843599825, "eval_f1-all": 0.9496993694090042, "eval_f1-das": 0.9570552147239264, "eval_f1-l1": 0.9478623566214807, "eval_f1-l2": 0.9520616828695944, "eval_loss": 0.18782156705856323, "eval_precision": 0.9568135395389553, "eval_precision-all": 0.9487254614708468, "eval_precision-das": 0.955456570155902, "eval_precision-l1": 0.9414810978767478, "eval_precision-l2": 0.9581646423751687, "eval_recall": 0.9531976744186047, "eval_recall-all": 0.9506752789195537, "eval_recall-das": 0.958659217877095, "eval_recall-l1": 0.9543307086614173, "eval_recall-l2": 0.9460359760159893, "eval_runtime": 6.174, "eval_samples_per_second": 109.491, "eval_steps_per_second": 6.965, "step": 500 }, { "epoch": 1.57, "eval_ACT": { "f1": 0.9334600760456274, "number": 519, "precision": 0.9212007504690432, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.9468599033816425, "number": 503, "precision": 0.9210526315789473, "recall": 0.974155069582505 }, "eval_ACT_L2": { "f1": 0.11764705882352941, "number": 16, "precision": 1.0, "recall": 0.0625 }, "eval_CARDINAL": { "f1": 0.9867452135493373, "number": 678, "precision": 0.9852941176470589, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.3333333333333333, "number": 30, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9490403706154864, "number": 761, "precision": 0.956, "recall": 0.9421813403416557 }, "eval_PER": { "f1": 0.9572271386430679, "number": 676, "precision": 0.9544117647058824, "recall": 0.9600591715976331 }, "eval_SPAT": { "f1": 0.9538904899135446, "number": 694, "precision": 0.9538904899135446, "recall": 0.9538904899135446 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.6153846153846154, "number": 33, "precision": 0.625, "recall": 0.6060606060606061 }, "eval_TITREP": { "f1": 0.4444444444444444, "number": 6, "precision": 0.6666666666666666, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9544419134396356, "eval_accuracy-all": 0.9670969374841812, "eval_accuracy-das": 0.9669703872437357, "eval_accuracy-l1": 0.960642875221463, "eval_accuracy-l2": 0.9735509997468995, "eval_f1": 0.9518265172463979, "eval_f1-all": 0.9462397179788484, "eval_f1-das": 0.952807312068644, "eval_f1-l1": 0.9429835980213485, "eval_f1-l2": 0.9504550050556118, "eval_loss": 0.1709740161895752, "eval_precision": 0.9530749052754299, "eval_precision-all": 0.9467960023515579, "eval_precision-das": 0.9544095665171899, "eval_precision-l1": 0.9354338842975206, "eval_precision-l2": 0.9618008185538881, "eval_recall": 0.9505813953488372, "eval_recall-all": 0.9456840869054609, "eval_recall-das": 0.9512104283054004, "eval_recall-l1": 0.9506561679790027, "eval_recall-l2": 0.9393737508327782, "eval_runtime": 6.1402, "eval_samples_per_second": 110.094, "eval_steps_per_second": 7.003, "step": 600 }, { "epoch": 1.84, "eval_ACT": { "f1": 0.9339712918660287, "number": 519, "precision": 0.9277566539923955, "recall": 0.9402697495183044 }, "eval_ACT_L1": { "f1": 0.9536031589338598, "number": 503, "precision": 0.9470588235294117, "recall": 0.9602385685884692 }, "eval_ACT_L2": { "f1": 0.3125, "number": 16, "precision": 0.3125, "recall": 0.3125 }, "eval_CARDINAL": { "f1": 0.9867647058823529, "number": 678, "precision": 0.9838709677419355, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.5, "number": 30, "precision": 0.47058823529411764, "recall": 0.5333333333333333 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9457161543492479, "number": 761, "precision": 0.94140625, "recall": 0.9500657030223391 }, "eval_PER": { "f1": 0.9711324944485566, "number": 676, "precision": 0.9718518518518519, "recall": 0.9704142011834319 }, "eval_SPAT": { "f1": 0.9611510791366907, "number": 694, "precision": 0.9597701149425287, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9032258064516129, "number": 33, "precision": 0.9655172413793104, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.2857142857142857, "number": 6, "precision": 1.0, "recall": 0.16666666666666666 }, "eval_accuracy": 0.95292331055429, "eval_accuracy-all": 0.9641862819539357, "eval_accuracy-das": 0.9721589471019995, "eval_accuracy-l1": 0.9586180713743356, "eval_accuracy-l2": 0.9697544925335359, "eval_f1": 0.9564586357039186, "eval_f1-all": 0.9537919906117059, "eval_f1-das": 0.9595827900912646, "eval_f1-l1": 0.9544502617801047, "eval_f1-l2": 0.9529529529529529, "eval_loss": 0.16730760037899017, "eval_precision": 0.9550724637681159, "eval_precision-all": 0.9530929346232776, "eval_precision-das": 0.9597615499254843, "eval_precision-l1": 0.951958224543081, "eval_precision-l2": 0.9545454545454546, "eval_recall": 0.9578488372093024, "eval_recall-all": 0.9544920728126834, "eval_recall-das": 0.9594040968342644, "eval_recall-l1": 0.9569553805774278, "eval_recall-l2": 0.9513657561625583, "eval_runtime": 6.0205, "eval_samples_per_second": 112.283, "eval_steps_per_second": 7.142, "step": 700 }, { "epoch": 2.1, "eval_ACT": { "f1": 0.9249762583095916, "number": 519, "precision": 0.9119850187265918, "recall": 0.9383429672447013 }, "eval_ACT_L1": { "f1": 0.9545454545454545, "number": 503, "precision": 0.9489194499017681, "recall": 0.9602385685884692 }, "eval_ACT_L2": { "f1": 0.19512195121951217, "number": 16, "precision": 0.16, "recall": 0.25 }, "eval_CARDINAL": { "f1": 0.9851851851851852, "number": 678, "precision": 0.9895833333333334, "recall": 0.9808259587020649 }, "eval_DESC": { "f1": 0.4347826086956522, "number": 30, "precision": 0.38461538461538464, "recall": 0.5 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9516971279373369, "number": 761, "precision": 0.9455252918287937, "recall": 0.9579500657030223 }, "eval_PER": { "f1": 0.9748892171344165, "number": 676, "precision": 0.9734513274336283, "recall": 0.9763313609467456 }, "eval_SPAT": { "f1": 0.9342857142857142, "number": 694, "precision": 0.9263456090651558, "recall": 0.9423631123919308 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8656716417910447, "number": 33, "precision": 0.8529411764705882, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.5, "number": 6, "precision": 1.0, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9510250569476082, "eval_accuracy-all": 0.9619083776259175, "eval_accuracy-das": 0.9702606934953176, "eval_accuracy-l1": 0.9567198177676538, "eval_accuracy-l2": 0.9670969374841812, "eval_f1": 0.955323469683783, "eval_f1-all": 0.9473838059047063, "eval_f1-das": 0.9587053571428571, "eval_f1-l1": 0.9444878811571541, "eval_f1-l2": 0.95108153078203, "eval_loss": 0.1715497374534607, "eval_precision": 0.9533873769542559, "eval_precision-all": 0.9432479627473807, "eval_precision-das": 0.9576365663322185, "eval_precision-l1": 0.937888198757764, "eval_precision-l2": 0.9501329787234043, "eval_recall": 0.9572674418604651, "eval_recall-all": 0.9515560775102759, "eval_recall-das": 0.9597765363128492, "eval_recall-l1": 0.9511811023622048, "eval_recall-l2": 0.9520319786808794, "eval_runtime": 6.0149, "eval_samples_per_second": 112.387, "eval_steps_per_second": 7.149, "step": 800 }, { "epoch": 2.36, "eval_ACT": { "f1": 0.9271523178807947, "number": 519, "precision": 0.9107806691449815, "recall": 0.9441233140655106 }, "eval_ACT_L1": { "f1": 0.9500489715964741, "number": 503, "precision": 0.9362934362934363, "recall": 0.9642147117296223 }, "eval_ACT_L2": { "f1": 0.2777777777777778, "number": 16, "precision": 0.25, "recall": 0.3125 }, "eval_CARDINAL": { "f1": 0.9816581071166545, "number": 678, "precision": 0.9766423357664233, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.39473684210526316, "number": 30, "precision": 0.32608695652173914, "recall": 0.5 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9455022980958635, "number": 761, "precision": 0.9448818897637795, "recall": 0.9461235216819974 }, "eval_PER": { "f1": 0.9763663220088628, "number": 676, "precision": 0.9749262536873157, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9526542324246772, "number": 694, "precision": 0.9485714285714286, "recall": 0.9567723342939481 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.823529411764706, "number": 33, "precision": 0.8, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9524171095925082, "eval_accuracy-all": 0.9633637053910402, "eval_accuracy-das": 0.9712730954188813, "eval_accuracy-l1": 0.9593773728170083, "eval_accuracy-l2": 0.9673500379650721, "eval_f1": 0.9529599073672022, "eval_f1-all": 0.9477829638273045, "eval_f1-das": 0.9574902543159458, "eval_f1-l1": 0.9487912659214973, "eval_f1-l2": 0.9464938517779994, "eval_loss": 0.15614591538906097, "eval_precision": 0.9489766503315077, "eval_precision-all": 0.9417391304347826, "eval_precision-das": 0.9544781643227239, "eval_precision-l1": 0.9397528321318228, "eval_precision-l2": 0.9442970822281167, "eval_recall": 0.9569767441860465, "eval_recall-all": 0.953904873752202, "eval_recall-das": 0.9605214152700187, "eval_recall-l1": 0.958005249343832, "eval_recall-l2": 0.9487008660892738, "eval_runtime": 6.5502, "eval_samples_per_second": 103.202, "eval_steps_per_second": 6.565, "step": 900 }, { "epoch": 2.62, "learning_rate": 8e-05, "loss": 0.1448, "step": 1000 }, { "epoch": 2.62, "eval_ACT": { "f1": 0.9319470699432891, "number": 519, "precision": 0.9146567717996289, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9547244094488189, "number": 503, "precision": 0.9454191033138402, "recall": 0.9642147117296223 }, "eval_ACT_L2": { "f1": 0.380952380952381, "number": 16, "precision": 0.3076923076923077, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9852941176470589, "number": 678, "precision": 0.9824046920821115, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.45569620253164556, "number": 30, "precision": 0.3673469387755102, "recall": 0.6 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9586342744583061, "number": 761, "precision": 0.958005249343832, "recall": 0.9592641261498029 }, "eval_PER": { "f1": 0.9719350073855243, "number": 676, "precision": 0.9705014749262537, "recall": 0.9733727810650887 }, "eval_SPAT": { "f1": 0.9469914040114613, "number": 694, "precision": 0.9415954415954416, "recall": 0.952449567723343 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7692307692307692, "number": 33, "precision": 0.78125, "recall": 0.7575757575757576 }, "eval_TITREP": { "f1": 0.4444444444444444, "number": 6, "precision": 0.6666666666666666, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9536826119969628, "eval_accuracy-all": 0.9634902556314857, "eval_accuracy-das": 0.9735509997468995, "eval_accuracy-l1": 0.9593773728170083, "eval_accuracy-l2": 0.967603138445963, "eval_f1": 0.958689665168865, "eval_f1-all": 0.9505326134539618, "eval_f1-das": 0.9622466059140785, "eval_f1-l1": 0.9472316090460099, "eval_f1-l2": 0.9547571523619428, "eval_loss": 0.16222244501113892, "eval_precision": 0.9560566637756577, "eval_precision-all": 0.944879605454018, "eval_precision-das": 0.9609955423476969, "eval_precision-l1": 0.9382080329557158, "eval_precision-l2": 0.9534883720930233, "eval_recall": 0.9613372093023256, "eval_recall-all": 0.956253669994128, "eval_recall-das": 0.9635009310986965, "eval_recall-l1": 0.9564304461942257, "eval_recall-l2": 0.9560293137908061, "eval_runtime": 5.8166, "eval_samples_per_second": 116.219, "eval_steps_per_second": 7.393, "step": 1000 }, { "epoch": 2.89, "eval_ACT": { "f1": 0.9426386233269598, "number": 519, "precision": 0.9354838709677419, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9614243323442137, "number": 503, "precision": 0.9566929133858267, "recall": 0.9662027833001988 }, "eval_ACT_L2": { "f1": 0.39999999999999997, "number": 16, "precision": 0.3684210526315789, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9882179675994109, "number": 678, "precision": 0.986764705882353, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.5217391304347826, "number": 30, "precision": 0.46153846153846156, "recall": 0.6 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9420949902407288, "number": 761, "precision": 0.9329896907216495, "recall": 0.9513797634691196 }, "eval_PER": { "f1": 0.9770879526977089, "number": 676, "precision": 0.9763663220088626, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9577060931899642, "number": 694, "precision": 0.9529243937232525, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8, "number": 33, "precision": 0.8125, "recall": 0.7878787878787878 }, "eval_TITREP": { "f1": 0.4, "number": 6, "precision": 0.3333333333333333, "recall": 0.5 }, "eval_accuracy": 0.9539357124778537, "eval_accuracy-all": 0.9638699063528221, "eval_accuracy-das": 0.9727916983042267, "eval_accuracy-l1": 0.9610225259427992, "eval_accuracy-l2": 0.9667172867628449, "eval_f1": 0.9571883135666762, "eval_f1-all": 0.9534102526654009, "eval_f1-das": 0.9606533036377134, "eval_f1-l1": 0.9571801566579634, "eval_f1-l2": 0.9486244613854822, "eval_loss": 0.17501647770404816, "eval_precision": 0.9525043177892919, "eval_precision-all": 0.948561464690497, "eval_precision-das": 0.9574546799852016, "eval_precision-l1": 0.9522077922077922, "eval_precision-l2": 0.9439313984168866, "eval_recall": 0.9619186046511627, "eval_recall-all": 0.9583088667058133, "eval_recall-das": 0.9638733705772812, "eval_recall-l1": 0.9622047244094488, "eval_recall-l2": 0.9533644237175216, "eval_runtime": 6.2615, "eval_samples_per_second": 107.961, "eval_steps_per_second": 6.867, "step": 1100 }, { "epoch": 3.15, "eval_ACT": { "f1": 0.9417382999044891, "number": 519, "precision": 0.9337121212121212, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9594460929772503, "number": 503, "precision": 0.9547244094488189, "recall": 0.9642147117296223 }, "eval_ACT_L2": { "f1": 0.4444444444444445, "number": 16, "precision": 0.4, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9867647058823529, "number": 678, "precision": 0.9838709677419355, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.45454545454545453, "number": 30, "precision": 0.4166666666666667, "recall": 0.5 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9510763209393347, "number": 761, "precision": 0.944300518134715, "recall": 0.9579500657030223 }, "eval_PER": { "f1": 0.9785661492978566, "number": 676, "precision": 0.9778434268833087, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9562096195262024, "number": 694, "precision": 0.9527896995708155, "recall": 0.9596541786743515 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8055555555555556, "number": 33, "precision": 0.7435897435897436, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.5454545454545454, "number": 6, "precision": 0.6, "recall": 0.5 }, "eval_accuracy": 0.9538091622374083, "eval_accuracy-all": 0.9638066312325994, "eval_accuracy-das": 0.9724120475828905, "eval_accuracy-l1": 0.9598835737787902, "eval_accuracy-l2": 0.9677296886864085, "eval_f1": 0.9574775817182528, "eval_f1-all": 0.9549970777323202, "eval_f1-das": 0.9612172944887734, "eval_f1-l1": 0.9558169934640522, "eval_f1-l2": 0.9539582643259357, "eval_loss": 0.17843317985534668, "eval_precision": 0.9527921704087507, "eval_precision-all": 0.9505526468877254, "eval_precision-das": 0.9578402366863905, "eval_precision-l1": 0.9520833333333333, "eval_precision-l2": 0.9486166007905138, "eval_recall": 0.9622093023255814, "eval_recall-all": 0.9594832648267763, "eval_recall-das": 0.9646182495344506, "eval_recall-l1": 0.9595800524934384, "eval_recall-l2": 0.9593604263824117, "eval_runtime": 6.7294, "eval_samples_per_second": 100.455, "eval_steps_per_second": 6.39, "step": 1200 }, { "epoch": 3.41, "eval_ACT": { "f1": 0.939047619047619, "number": 519, "precision": 0.928436911487759, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9576354679802955, "number": 503, "precision": 0.94921875, "recall": 0.9662027833001988 }, "eval_ACT_L2": { "f1": 0.39999999999999997, "number": 16, "precision": 0.3684210526315789, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9852724594992636, "number": 678, "precision": 0.9838235294117647, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.5161290322580646, "number": 30, "precision": 0.5, "recall": 0.5333333333333333 }, "eval_FT": { "f1": 0.4444444444444445, "number": 7, "precision": 1.0, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9546946815495732, "number": 761, "precision": 0.9540682414698163, "recall": 0.9553219448094612 }, "eval_PER": { "f1": 0.9785661492978566, "number": 676, "precision": 0.9778434268833087, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9569583931133429, "number": 694, "precision": 0.9528571428571428, "recall": 0.9610951008645533 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7096774193548386, "number": 33, "precision": 0.7586206896551724, "recall": 0.6666666666666666 }, "eval_TITREP": { "f1": 0.5, "number": 6, "precision": 0.5, "recall": 0.5 }, "eval_accuracy": 0.960642875221463, "eval_accuracy-all": 0.9691217413313086, "eval_accuracy-das": 0.9778537079220451, "eval_accuracy-l1": 0.9653252341179448, "eval_accuracy-l2": 0.9729182485446722, "eval_f1": 0.9602562236133353, "eval_f1-all": 0.9556043956043958, "eval_f1-das": 0.9622044312046174, "eval_f1-l1": 0.9571353894406691, "eval_f1-l2": 0.9536512170723576, "eval_loss": 0.16250379383563995, "eval_precision": 0.9617964421114027, "eval_precision-all": 0.9537876572097105, "eval_precision-das": 0.9620253164556962, "eval_precision-l1": 0.9531494013534617, "eval_precision-l2": 0.9546061415220294, "eval_recall": 0.9587209302325581, "eval_recall-all": 0.9574280681150911, "eval_recall-das": 0.9623836126629423, "eval_recall-l1": 0.9611548556430446, "eval_recall-l2": 0.9526982011992006, "eval_runtime": 5.7506, "eval_samples_per_second": 117.554, "eval_steps_per_second": 7.478, "step": 1300 }, { "epoch": 3.67, "eval_ACT": { "f1": 0.9439696106362773, "number": 519, "precision": 0.9307116104868914, "recall": 0.9576107899807321 }, "eval_ACT_L1": { "f1": 0.9616519174041297, "number": 503, "precision": 0.9513618677042801, "recall": 0.9721669980119284 }, "eval_ACT_L2": { "f1": 0.4444444444444445, "number": 16, "precision": 0.4, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9830757910228108, "number": 678, "precision": 0.9809104258443465, "recall": 0.9852507374631269 }, "eval_DESC": { "f1": 0.4927536231884058, "number": 30, "precision": 0.4358974358974359, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.22222222222222224, "number": 7, "precision": 0.5, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9560655737704917, "number": 761, "precision": 0.9541884816753927, "recall": 0.9579500657030223 }, "eval_PER": { "f1": 0.9807692307692307, "number": 676, "precision": 0.9807692307692307, "recall": 0.9807692307692307 }, "eval_SPAT": { "f1": 0.9590222861250898, "number": 694, "precision": 0.9569583931133429, "recall": 0.9610951008645533 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.875, "number": 33, "precision": 0.9032258064516129, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9583649708934447, "eval_accuracy-all": 0.9695646671728676, "eval_accuracy-das": 0.9716527461402177, "eval_accuracy-l1": 0.9645659326752721, "eval_accuracy-l2": 0.9745634016704632, "eval_f1": 0.9603128621089224, "eval_f1-all": 0.957284961966062, "eval_f1-das": 0.9644783336432956, "eval_f1-l1": 0.9584964761158966, "eval_f1-l2": 0.9557404326123128, "eval_loss": 0.17416799068450928, "eval_precision": 0.956986143187067, "eval_precision-all": 0.953935860058309, "eval_precision-das": 0.9632243684992571, "eval_precision-l1": 0.9532710280373832, "eval_precision-l2": 0.9547872340425532, "eval_recall": 0.9636627906976745, "eval_recall-all": 0.9606576629477392, "eval_recall-das": 0.9657355679702049, "eval_recall-l1": 0.9637795275590552, "eval_recall-l2": 0.9566955363091273, "eval_runtime": 6.3107, "eval_samples_per_second": 107.119, "eval_steps_per_second": 6.814, "step": 1400 }, { "epoch": 3.94, "learning_rate": 7e-05, "loss": 0.0854, "step": 1500 }, { "epoch": 3.94, "eval_ACT": { "f1": 0.9382716049382717, "number": 519, "precision": 0.9250936329588015, "recall": 0.9518304431599229 }, "eval_ACT_L1": { "f1": 0.9614243323442137, "number": 503, "precision": 0.9566929133858267, "recall": 0.9662027833001988 }, "eval_ACT_L2": { "f1": 0.380952380952381, "number": 16, "precision": 0.3076923076923077, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9874538745387453, "number": 678, "precision": 0.9881831610044313, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.5142857142857143, "number": 30, "precision": 0.45, "recall": 0.6 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9559500328731098, "number": 761, "precision": 0.9565789473684211, "recall": 0.9553219448094612 }, "eval_PER": { "f1": 0.9763313609467456, "number": 676, "precision": 0.9763313609467456, "recall": 0.9763313609467456 }, "eval_SPAT": { "f1": 0.9577060931899642, "number": 694, "precision": 0.9529243937232525, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8529411764705883, "number": 33, "precision": 0.8285714285714286, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.5454545454545454, "number": 6, "precision": 0.6, "recall": 0.5 }, "eval_accuracy": 0.9515312579093901, "eval_accuracy-all": 0.9630473297899266, "eval_accuracy-das": 0.9717792963806631, "eval_accuracy-l1": 0.9570994684889901, "eval_accuracy-l2": 0.9689951910908631, "eval_f1": 0.9592576482528636, "eval_f1-all": 0.9562673687289747, "eval_f1-das": 0.9624395686128672, "eval_f1-l1": 0.9566579634464752, "eval_f1-l2": 0.9557698703026272, "eval_loss": 0.18355852365493774, "eval_precision": 0.9568990454150998, "eval_precision-all": 0.9527834450597493, "eval_precision-das": 0.961010025993316, "eval_precision-l1": 0.9516883116883117, "eval_precision-l2": 0.954183266932271, "eval_recall": 0.9616279069767442, "eval_recall-all": 0.959776864357017, "eval_recall-das": 0.9638733705772812, "eval_recall-l1": 0.9616797900262467, "eval_recall-l2": 0.9573617588274483, "eval_runtime": 6.1311, "eval_samples_per_second": 110.258, "eval_steps_per_second": 7.013, "step": 1500 }, { "epoch": 4.2, "eval_ACT": { "f1": 0.9375, "number": 519, "precision": 0.9217877094972067, "recall": 0.953757225433526 }, "eval_ACT_L1": { "f1": 0.9577187807276303, "number": 503, "precision": 0.9474708171206225, "recall": 0.9681908548707754 }, "eval_ACT_L2": { "f1": 0.41025641025641024, "number": 16, "precision": 0.34782608695652173, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9874908020603386, "number": 678, "precision": 0.9853157121879589, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.5217391304347826, "number": 30, "precision": 0.46153846153846156, "recall": 0.6 }, "eval_FT": { "f1": 0.4615384615384615, "number": 7, "precision": 0.5, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.953063885267275, "number": 761, "precision": 0.9456662354463131, "recall": 0.9605781865965834 }, "eval_PER": { "f1": 0.9792899408284024, "number": 676, "precision": 0.9792899408284024, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9592566118656183, "number": 694, "precision": 0.9517730496453901, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.5, "number": 2, "precision": 0.5, "recall": 0.5 }, "eval_TITREH": { "f1": 0.84375, "number": 33, "precision": 0.8709677419354839, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.4, "number": 6, "precision": 0.3333333333333333, "recall": 0.5 }, "eval_accuracy": 0.9557074158440901, "eval_accuracy-all": 0.9666540116426221, "eval_accuracy-das": 0.9732978992660086, "eval_accuracy-l1": 0.9629207795494812, "eval_accuracy-l2": 0.9703872437357631, "eval_f1": 0.959525874530211, "eval_f1-all": 0.9561544064093226, "eval_f1-das": 0.9638286032276017, "eval_f1-l1": 0.9575631346003645, "eval_f1-l2": 0.9543650793650794, "eval_loss": 0.1747445911169052, "eval_precision": 0.9542840713053479, "eval_precision-all": 0.9488291413703382, "eval_precision-das": 0.9600886917960089, "eval_precision-l1": 0.949896694214876, "eval_precision-l2": 0.9474720945502298, "eval_recall": 0.9648255813953488, "eval_recall-all": 0.9635936582501468, "eval_recall-das": 0.9675977653631285, "eval_recall-l1": 0.9653543307086614, "eval_recall-l2": 0.9613590939373751, "eval_runtime": 6.3526, "eval_samples_per_second": 106.414, "eval_steps_per_second": 6.769, "step": 1600 }, { "epoch": 4.46, "eval_ACT": { "f1": 0.9438629876308278, "number": 519, "precision": 0.9323308270676691, "recall": 0.9556840077071291 }, "eval_ACT_L1": { "f1": 0.9663366336633663, "number": 503, "precision": 0.9625246548323472, "recall": 0.9701789264413518 }, "eval_ACT_L2": { "f1": 0.39024390243902435, "number": 16, "precision": 0.32, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9867452135493373, "number": 678, "precision": 0.9852941176470589, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.5373134328358209, "number": 30, "precision": 0.4864864864864865, "recall": 0.6 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9619921363040629, "number": 761, "precision": 0.9594771241830066, "recall": 0.9645203679369251 }, "eval_PER": { "f1": 0.9792899408284024, "number": 676, "precision": 0.9792899408284024, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9627507163323783, "number": 694, "precision": 0.9572649572649573, "recall": 0.968299711815562 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8484848484848486, "number": 33, "precision": 0.8484848484848485, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.5454545454545454, "number": 6, "precision": 0.6, "recall": 0.5 }, "eval_accuracy": 0.9554543153631991, "eval_accuracy-all": 0.9662743609212857, "eval_accuracy-das": 0.975069602632245, "eval_accuracy-l1": 0.9619083776259175, "eval_accuracy-l2": 0.970640344216654, "eval_f1": 0.9615552009284782, "eval_f1-all": 0.9603627321924821, "eval_f1-das": 0.9665178571428571, "eval_f1-l1": 0.9615887117846877, "eval_f1-l2": 0.9588039867109635, "eval_loss": 0.17034310102462769, "eval_precision": 0.9597451491456704, "eval_precision-all": 0.9568638880792771, "eval_precision-das": 0.9654403567447045, "eval_precision-l1": 0.9573361082206036, "eval_precision-l2": 0.9562624254473161, "eval_recall": 0.9633720930232558, "eval_recall-all": 0.9638872577803875, "eval_recall-das": 0.9675977653631285, "eval_recall-l1": 0.9658792650918635, "eval_recall-l2": 0.9613590939373751, "eval_runtime": 6.4585, "eval_samples_per_second": 104.669, "eval_steps_per_second": 6.658, "step": 1700 }, { "epoch": 4.72, "eval_ACT": { "f1": 0.9551098376313275, "number": 519, "precision": 0.946969696969697, "recall": 0.9633911368015414 }, "eval_ACT_L1": { "f1": 0.971540726202159, "number": 503, "precision": 0.9593023255813954, "recall": 0.9840954274353877 }, "eval_ACT_L2": { "f1": 0.35714285714285715, "number": 16, "precision": 0.4166666666666667, "recall": 0.3125 }, "eval_CARDINAL": { "f1": 0.9867452135493373, "number": 678, "precision": 0.9852941176470589, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.523076923076923, "number": 30, "precision": 0.4857142857142857, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.42857142857142855, "number": 7, "precision": 0.42857142857142855, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.945645055664702, "number": 761, "precision": 0.9425587467362925, "recall": 0.9487516425755584 }, "eval_PER": { "f1": 0.9800148038490007, "number": 676, "precision": 0.9807407407407407, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9463902787705505, "number": 694, "precision": 0.9390070921985816, "recall": 0.9538904899135446 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.875, "number": 33, "precision": 0.9032258064516129, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.30769230769230765, "number": 6, "precision": 0.2857142857142857, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9596304732978993, "eval_accuracy-all": 0.968299164768413, "eval_accuracy-das": 0.9749430523917996, "eval_accuracy-l1": 0.9654517843583903, "eval_accuracy-l2": 0.9711465451784358, "eval_f1": 0.9605339524085896, "eval_f1-all": 0.9548311650343518, "eval_f1-das": 0.9643255295429208, "eval_f1-l1": 0.9569976544175137, "eval_f1-l2": 0.9520639147802931, "eval_loss": 0.17404037714004517, "eval_precision": 0.958864426419467, "eval_precision-all": 0.9508005822416302, "eval_precision-das": 0.9621802002224694, "eval_precision-l1": 0.9503105590062112, "eval_precision-l2": 0.9514304723885563, "eval_recall": 0.9622093023255814, "eval_recall-all": 0.9588960657662948, "eval_recall-das": 0.9664804469273743, "eval_recall-l1": 0.9637795275590552, "eval_recall-l2": 0.9526982011992006, "eval_runtime": 5.4184, "eval_samples_per_second": 124.761, "eval_steps_per_second": 7.936, "step": 1800 }, { "epoch": 4.99, "eval_ACT": { "f1": 0.939047619047619, "number": 519, "precision": 0.928436911487759, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.961576354679803, "number": 503, "precision": 0.953125, "recall": 0.9701789264413518 }, "eval_ACT_L2": { "f1": 0.2857142857142857, "number": 16, "precision": 0.2631578947368421, "recall": 0.3125 }, "eval_CARDINAL": { "f1": 0.9815770081061163, "number": 678, "precision": 0.9808541973490427, "recall": 0.9823008849557522 }, "eval_DESC": { "f1": 0.5483870967741935, "number": 30, "precision": 0.53125, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.953063885267275, "number": 761, "precision": 0.9456662354463131, "recall": 0.9605781865965834 }, "eval_PER": { "f1": 0.977810650887574, "number": 676, "precision": 0.977810650887574, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9626972740315638, "number": 694, "precision": 0.9585714285714285, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8285714285714285, "number": 33, "precision": 0.7837837837837838, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.28571428571428575, "number": 6, "precision": 0.25, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9579853201721084, "eval_accuracy-all": 0.9677929638066313, "eval_accuracy-das": 0.9754492533535813, "eval_accuracy-l1": 0.9646924829157175, "eval_accuracy-l2": 0.9708934446975449, "eval_f1": 0.9568491167101071, "eval_f1-all": 0.9554549437709947, "eval_f1-das": 0.9595997034840623, "eval_f1-l1": 0.96002090410243, "eval_f1-l2": 0.9496688741721854, "eval_loss": 0.18735294044017792, "eval_precision": 0.953260242354299, "eval_precision-all": 0.95059575704737, "eval_precision-das": 0.9549981556621173, "eval_precision-l1": 0.9557752341311134, "eval_precision-l2": 0.9440421329822252, "eval_recall": 0.9604651162790697, "eval_recall-all": 0.9603640634174986, "eval_recall-das": 0.964245810055866, "eval_recall-l1": 0.9643044619422572, "eval_recall-l2": 0.955363091272485, "eval_runtime": 5.4368, "eval_samples_per_second": 124.338, "eval_steps_per_second": 7.909, "step": 1900 }, { "epoch": 5.25, "learning_rate": 6e-05, "loss": 0.0555, "step": 2000 }, { "epoch": 5.25, "eval_ACT": { "f1": 0.9514747859181732, "number": 519, "precision": 0.9398496240601504, "recall": 0.9633911368015414 }, "eval_ACT_L1": { "f1": 0.970414201183432, "number": 503, "precision": 0.9628180039138943, "recall": 0.9781312127236581 }, "eval_ACT_L2": { "f1": 0.4324324324324324, "number": 16, "precision": 0.38095238095238093, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9874723655121592, "number": 678, "precision": 0.9867452135493373, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.5538461538461538, "number": 30, "precision": 0.5142857142857142, "recall": 0.6 }, "eval_FT": { "f1": 0.30769230769230765, "number": 7, "precision": 0.3333333333333333, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9625246548323472, "number": 761, "precision": 0.9631578947368421, "recall": 0.961892247043364 }, "eval_PER": { "f1": 0.9800148038490007, "number": 676, "precision": 0.9807407407407407, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9612625538020085, "number": 694, "precision": 0.9571428571428572, "recall": 0.9654178674351584 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8923076923076922, "number": 33, "precision": 0.90625, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.5, "number": 6, "precision": 0.5, "recall": 0.5 }, "eval_accuracy": 0.958744621614781, "eval_accuracy-all": 0.9686155403695267, "eval_accuracy-das": 0.9762085547962541, "eval_accuracy-l1": 0.9640597317134902, "eval_accuracy-l2": 0.9731713490255631, "eval_f1": 0.9654571843251089, "eval_f1-all": 0.9620846142585272, "eval_f1-das": 0.9683897359613239, "eval_f1-l1": 0.9628855201254575, "eval_f1-l2": 0.9610648918469219, "eval_loss": 0.18852506577968597, "eval_precision": 0.9640579710144928, "eval_precision-all": 0.9594160583941606, "eval_precision-das": 0.966951355365763, "eval_precision-l1": 0.9588755856324831, "eval_precision-l2": 0.9601063829787234, "eval_recall": 0.9668604651162791, "eval_recall-all": 0.9647680563711099, "eval_recall-das": 0.9698324022346368, "eval_recall-l1": 0.9669291338582677, "eval_recall-l2": 0.9620253164556962, "eval_runtime": 5.6224, "eval_samples_per_second": 120.232, "eval_steps_per_second": 7.648, "step": 2000 } ], "max_steps": 5000, "num_train_epochs": 14, "total_flos": 813927239246016.0, "trial_name": null, "trial_params": null }