{ "best_metric": 0.9732283464566929, "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/314-pretrained-camembert-ner-hierarchical-loss-iob2/checkpoint-1400", "epoch": 3.674540682414698, "global_step": 1400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26, "eval_ACT": { "f1": 0.8992673992673993, "number": 519, "precision": 0.8568935427574171, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.912639405204461, "number": 503, "precision": 0.8568935427574171, "recall": 0.9761431411530815 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9816041206769685, "number": 678, "precision": 0.9794419970631424, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.0, "number": 30, "precision": 0.0, "recall": 0.0 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9583333333333334, "number": 762, "precision": 0.9509043927648578, "recall": 0.9658792650918635 }, "eval_PER": { "f1": 0.9560117302052786, "number": 676, "precision": 0.9476744186046512, "recall": 0.9644970414201184 }, "eval_SPAT": { "f1": 0.9562724014336917, "number": 694, "precision": 0.9514978601997147, "recall": 0.9610951008645533 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.0, "number": 33, "precision": 0.0, "recall": 0.0 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9404170804369414, "eval_accuracy-all": 0.9610228401191658, "eval_accuracy-das": 0.9565541211519365, "eval_accuracy-l1": 0.9500993048659384, "eval_accuracy-l1l2": 0.9407894736842105, "eval_accuracy-l2": 0.9719463753723933, "eval_f1": 0.9438787055894999, "eval_f1-all": 0.9416764361078547, "eval_f1-das": 0.9402153731897512, "eval_f1-l1": 0.9361261960175847, "eval_f1-l1l2": 0.9384570933256284, "eval_f1-l2": 0.9489347311464321, "eval_loss": 0.6206728219985962, "eval_precision": 0.9473086531910061, "eval_precision-all": 0.9402985074626866, "eval_precision-das": 0.9370836417468542, "eval_precision-l1": 0.9225280326197758, "eval_precision-l1l2": 0.9368329968272282, "eval_precision-l2": 0.9642611683848797, "eval_recall": 0.9404735062006765, "eval_recall-all": 0.9430584091576166, "eval_recall-das": 0.9433681073025335, "eval_recall-l1": 0.9501312335958005, "eval_recall-l1l2": 0.9400868306801736, "eval_recall-l2": 0.9340878828229028, "eval_runtime": 7.1724, "eval_samples_per_second": 94.251, "eval_steps_per_second": 5.995, "step": 100 }, { "epoch": 0.52, "eval_ACT": { "f1": 0.9291784702549574, "number": 519, "precision": 0.9111111111111111, "recall": 0.9479768786127167 }, "eval_ACT_L1": { "f1": 0.9434324065196549, "number": 503, "precision": 0.9111111111111111, "recall": 0.9781312127236581 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9919058130978661, "number": 678, "precision": 0.9897209985315712, "recall": 0.9941002949852508 }, "eval_DESC": { "f1": 0.3103448275862069, "number": 30, "precision": 0.32142857142857145, "recall": 0.3 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9521345407503234, "number": 762, "precision": 0.9387755102040817, "recall": 0.9658792650918635 }, "eval_PER": { "f1": 0.983050847457627, "number": 676, "precision": 0.9794419970631424, "recall": 0.9866863905325444 }, "eval_SPAT": { "f1": 0.9542857142857143, "number": 694, "precision": 0.9461756373937678, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.43373493975903615, "number": 33, "precision": 0.36, "recall": 0.5454545454545454 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.951837140019861, "eval_accuracy-all": 0.9676017874875869, "eval_accuracy-das": 0.9716981132075472, "eval_accuracy-l1": 0.9602780536246276, "eval_accuracy-l1l2": 0.9524577954319762, "eval_accuracy-l2": 0.9749255213505462, "eval_f1": 0.9533235856484086, "eval_f1-all": 0.9492511269448888, "eval_f1-das": 0.9659385412810071, "eval_f1-l1": 0.9512953367875648, "eval_f1-l1l2": 0.9528720813637014, "eval_f1-l2": 0.9466357308584686, "eval_loss": 0.3473620116710663, "eval_precision": 0.9510771992818672, "eval_precision-all": 0.9406340057636887, "eval_precision-das": 0.9598969830757911, "eval_precision-l1": 0.9391304347826087, "eval_precision-l1l2": 0.9432785025524674, "eval_precision-l2": 0.9425742574257425, "eval_recall": 0.9555806087936866, "eval_recall-all": 0.9580275902553567, "eval_recall-das": 0.9720566318926974, "eval_recall-l1": 0.9637795275590552, "eval_recall-l1l2": 0.9626628075253256, "eval_recall-l2": 0.9507323568575233, "eval_runtime": 7.1425, "eval_samples_per_second": 94.645, "eval_steps_per_second": 6.02, "step": 200 }, { "epoch": 0.79, "eval_ACT": { "f1": 0.9467680608365019, "number": 519, "precision": 0.9343339587242027, "recall": 0.9595375722543352 }, "eval_ACT_L1": { "f1": 0.9613899613899614, "number": 503, "precision": 0.9343339587242027, "recall": 0.9900596421471173 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.22580645161290322, "number": 30, "precision": 0.21875, "recall": 0.23333333333333334 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9609882964889467, "number": 762, "precision": 0.9523195876288659, "recall": 0.9698162729658792 }, "eval_PER": { "f1": 0.9808541973490428, "number": 676, "precision": 0.9765395894428153, "recall": 0.985207100591716 }, "eval_SPAT": { "f1": 0.9700000000000001, "number": 694, "precision": 0.9617563739376771, "recall": 0.978386167146974 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.6756756756756757, "number": 33, "precision": 0.6097560975609756, "recall": 0.7575757575757576 }, "eval_TITREP": { "f1": 0.6, "number": 6, "precision": 0.75, "recall": 0.5 }, "eval_accuracy": 0.9551886792452831, "eval_accuracy-all": 0.9682845084409136, "eval_accuracy-das": 0.9759185700099305, "eval_accuracy-l1": 0.9617676266137041, "eval_accuracy-l1l2": 0.9554369414101291, "eval_accuracy-l2": 0.9748013902681232, "eval_f1": 0.9625788999098286, "eval_f1-all": 0.9594870300204023, "eval_f1-das": 0.9718100890207715, "eval_f1-l1": 0.9590461378952824, "eval_f1-l1l2": 0.9622695852534562, "eval_f1-l2": 0.9600532623169108, "eval_loss": 0.24261289834976196, "eval_precision": 0.9623619562767636, "eval_precision-all": 0.952821997105644, "eval_precision-das": 0.9675036927621861, "eval_precision-l1": 0.9472606246799795, "eval_precision-l1l2": 0.9575809687589567, "eval_precision-l2": 0.9600532623169108, "eval_recall": 0.9627959413754228, "eval_recall-all": 0.9662459641913707, "eval_recall-das": 0.9761549925484352, "eval_recall-l1": 0.9711286089238845, "eval_recall-l1l2": 0.9670043415340087, "eval_recall-l2": 0.9600532623169108, "eval_runtime": 8.0913, "eval_samples_per_second": 83.547, "eval_steps_per_second": 5.314, "step": 300 }, { "epoch": 1.05, "eval_ACT": { "f1": 0.9337121212121212, "number": 519, "precision": 0.9180633147113594, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9480769230769232, "number": 503, "precision": 0.9180633147113594, "recall": 0.9801192842942346 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.21951219512195122, "number": 30, "precision": 0.17307692307692307, "recall": 0.3 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9583875162548764, "number": 762, "precision": 0.9497422680412371, "recall": 0.9671916010498688 }, "eval_PER": { "f1": 0.9889298892988929, "number": 676, "precision": 0.9867452135493373, "recall": 0.9911242603550295 }, "eval_SPAT": { "f1": 0.964924838940587, "number": 694, "precision": 0.9587482219061166, "recall": 0.9711815561959655 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9117647058823529, "number": 33, "precision": 0.8857142857142857, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.6153846153846153, "number": 6, "precision": 0.5714285714285714, "recall": 0.6666666666666666 }, "eval_accuracy": 0.961395233366435, "eval_accuracy-all": 0.9726911618669315, "eval_accuracy-das": 0.9774081429990069, "eval_accuracy-l1": 0.9667328699106256, "eval_accuracy-l1l2": 0.9620158887785502, "eval_accuracy-l2": 0.9786494538232373, "eval_f1": 0.9638120926050797, "eval_f1-all": 0.9575581395348837, "eval_f1-das": 0.9719799591760996, "eval_f1-l1": 0.9525283797729618, "eval_f1-l1l2": 0.962516156828953, "eval_f1-l2": 0.9640479360852197, "eval_loss": 0.1985810250043869, "eval_precision": 0.9607887071476585, "eval_precision-all": 0.9484595450619061, "eval_precision-das": 0.9682070240295748, "eval_precision-l1": 0.9365804160324708, "eval_precision-l1l2": 0.9552451539338654, "eval_precision-l2": 0.9640479360852197, "eval_recall": 0.9668545659526494, "eval_recall-all": 0.966832990901086, "eval_recall-das": 0.9757824143070045, "eval_recall-l1": 0.9690288713910761, "eval_recall-l1l2": 0.9698986975397974, "eval_recall-l2": 0.9640479360852197, "eval_runtime": 6.8598, "eval_samples_per_second": 98.545, "eval_steps_per_second": 6.268, "step": 400 }, { "epoch": 1.31, "learning_rate": 9e-05, "loss": 0.5596, "step": 500 }, { "epoch": 1.31, "eval_ACT": { "f1": 0.9334600760456274, "number": 519, "precision": 0.9212007504690432, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.948792270531401, "number": 503, "precision": 0.9229323308270677, "recall": 0.9761431411530815 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.2758620689655172, "number": 30, "precision": 0.2857142857142857, "recall": 0.26666666666666666 }, "eval_FT": { "f1": 0.36363636363636365, "number": 7, "precision": 0.5, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9538661468486029, "number": 762, "precision": 0.9446589446589446, "recall": 0.963254593175853 }, "eval_PER": { "f1": 0.9734904270986746, "number": 676, "precision": 0.969208211143695, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9549678341672624, "number": 694, "precision": 0.9475177304964539, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8571428571428571, "number": 33, "precision": 0.8108108108108109, "recall": 0.9090909090909091 }, "eval_TITREP": { "f1": 0.4615384615384615, "number": 6, "precision": 0.42857142857142855, "recall": 0.5 }, "eval_accuracy": 0.961643495531281, "eval_accuracy-all": 0.9728152929493545, "eval_accuracy-das": 0.9765392254220456, "eval_accuracy-l1": 0.9676017874875869, "eval_accuracy-l1l2": 0.9621400198609732, "eval_accuracy-l2": 0.9780287984111221, "eval_f1": 0.9624465932089048, "eval_f1-all": 0.9537968226206093, "eval_f1-das": 0.9642393922549565, "eval_f1-l1": 0.949117341640706, "eval_f1-l1l2": 0.958699093394733, "eval_f1-l2": 0.9597873047524094, "eval_loss": 0.18591071665287018, "eval_precision": 0.9598564700605517, "eval_precision-all": 0.9473074696004632, "eval_precision-das": 0.9590858827865831, "eval_precision-l1": 0.9388803287108372, "eval_precision-l1l2": 0.9533485975958786, "eval_precision-l2": 0.9581950895819509, "eval_recall": 0.9650507328072153, "eval_recall-all": 0.9603756970942178, "eval_recall-das": 0.9694485842026825, "eval_recall-l1": 0.9595800524934384, "eval_recall-l1l2": 0.96410998552822, "eval_recall-l2": 0.9613848202396804, "eval_runtime": 7.193, "eval_samples_per_second": 93.98, "eval_steps_per_second": 5.978, "step": 500 }, { "epoch": 1.57, "eval_ACT": { "f1": 0.9419600380589914, "number": 519, "precision": 0.9304511278195489, "recall": 0.953757225433526 }, "eval_ACT_L1": { "f1": 0.9573643410852714, "number": 503, "precision": 0.9338374291115312, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.10526315789473684, "number": 16, "precision": 0.3333333333333333, "recall": 0.0625 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.30985915492957744, "number": 30, "precision": 0.2682926829268293, "recall": 0.36666666666666664 }, "eval_FT": { "f1": 0.30769230769230765, "number": 7, "precision": 0.3333333333333333, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9487345879299156, "number": 762, "precision": 0.938382541720154, "recall": 0.9593175853018373 }, "eval_PER": { "f1": 0.9823008849557522, "number": 676, "precision": 0.9794117647058823, "recall": 0.985207100591716 }, "eval_SPAT": { "f1": 0.9590222861250898, "number": 694, "precision": 0.9569583931133429, "recall": 0.9610951008645533 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9117647058823529, "number": 33, "precision": 0.8857142857142857, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.5714285714285715, "number": 6, "precision": 0.5, "recall": 0.6666666666666666 }, "eval_accuracy": 0.9654915590863953, "eval_accuracy-all": 0.9756703078450845, "eval_accuracy-das": 0.9801390268123138, "eval_accuracy-l1": 0.9725670307845085, "eval_accuracy-l1l2": 0.9663604766633564, "eval_accuracy-l2": 0.9787735849056604, "eval_f1": 0.9630793401413982, "eval_f1-all": 0.9560151471016604, "eval_f1-das": 0.9725213516524323, "eval_f1-l1": 0.9543094496365525, "eval_f1-l1l2": 0.9620471535365152, "eval_f1-l2": 0.958195089581951, "eval_loss": 0.14890924096107483, "eval_precision": 0.9586684539767649, "eval_precision-all": 0.9488291413703382, "eval_precision-das": 0.9692820133234641, "eval_precision-l1": 0.9440164355418593, "eval_precision-l1l2": 0.9557269351613824, "eval_precision-l2": 0.955026455026455, "eval_recall": 0.9675310033821871, "eval_recall-all": 0.9633108306427942, "eval_recall-das": 0.9757824143070045, "eval_recall-l1": 0.9648293963254593, "eval_recall-l1l2": 0.968451519536903, "eval_recall-l2": 0.9613848202396804, "eval_runtime": 6.5579, "eval_samples_per_second": 103.082, "eval_steps_per_second": 6.557, "step": 600 }, { "epoch": 1.84, "eval_ACT": { "f1": 0.9421800947867298, "number": 519, "precision": 0.9272388059701493, "recall": 0.9576107899807321 }, "eval_ACT_L1": { "f1": 0.9573643410852714, "number": 503, "precision": 0.9338374291115312, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.26086956521739124, "number": 16, "precision": 0.42857142857142855, "recall": 0.1875 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.4126984126984127, "number": 30, "precision": 0.3939393939393939, "recall": 0.43333333333333335 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9566343042071198, "number": 762, "precision": 0.9438058748403576, "recall": 0.9698162729658792 }, "eval_PER": { "f1": 0.9852507374631269, "number": 676, "precision": 0.9823529411764705, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9634931997136722, "number": 694, "precision": 0.957325746799431, "recall": 0.9697406340057637 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.927536231884058, "number": 33, "precision": 0.8888888888888888, "recall": 0.9696969696969697 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9669811320754716, "eval_accuracy-all": 0.9762288977159881, "eval_accuracy-das": 0.980759682224429, "eval_accuracy-l1": 0.9724428997020854, "eval_accuracy-l1l2": 0.9677259185700099, "eval_accuracy-l2": 0.9800148957298908, "eval_f1": 0.9667938074938299, "eval_f1-all": 0.9609898107714702, "eval_f1-das": 0.9720111214087118, "eval_f1-l1": 0.96, "eval_f1-l1l2": 0.964824120603015, "eval_f1-l2": 0.9622516556291391, "eval_loss": 0.15314123034477234, "eval_precision": 0.962045099352534, "eval_precision-all": 0.9532197516604101, "eval_precision-das": 0.967170785687938, "eval_precision-l1": 0.9501285347043702, "eval_precision-l1l2": 0.9572649572649573, "eval_precision-l2": 0.9571805006587615, "eval_recall": 0.9715896279594137, "eval_recall-all": 0.9688875843850895, "eval_recall-das": 0.9769001490312966, "eval_recall-l1": 0.9700787401574803, "eval_recall-l1l2": 0.9725036179450073, "eval_recall-l2": 0.9673768308921438, "eval_runtime": 7.6675, "eval_samples_per_second": 88.164, "eval_steps_per_second": 5.608, "step": 700 }, { "epoch": 2.1, "eval_ACT": { "f1": 0.9300567107750471, "number": 519, "precision": 0.9128014842300557, "recall": 0.9479768786127167 }, "eval_ACT_L1": { "f1": 0.9568627450980391, "number": 503, "precision": 0.9439071566731141, "recall": 0.9701789264413518 }, "eval_ACT_L2": { "f1": 0.2105263157894737, "number": 16, "precision": 0.18181818181818182, "recall": 0.25 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.37499999999999994, "number": 30, "precision": 0.3, "recall": 0.5 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9635890767230169, "number": 762, "precision": 0.9548969072164949, "recall": 0.9724409448818898 }, "eval_PER": { "f1": 0.986019131714496, "number": 676, "precision": 0.9809663250366032, "recall": 0.9911242603550295 }, "eval_SPAT": { "f1": 0.9591982820329277, "number": 694, "precision": 0.9530583214793741, "recall": 0.9654178674351584 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9090909090909091, "number": 33, "precision": 0.9090909090909091, "recall": 0.9090909090909091 }, "eval_TITREP": { "f1": 0.6153846153846153, "number": 6, "precision": 0.5714285714285714, "recall": 0.6666666666666666 }, "eval_accuracy": 0.9632571996027806, "eval_accuracy-all": 0.9734980139026812, "eval_accuracy-das": 0.9815044687189672, "eval_accuracy-l1": 0.9703326713008937, "eval_accuracy-l1l2": 0.9643743793445879, "eval_accuracy-l2": 0.9766633565044687, "eval_f1": 0.9649299719887955, "eval_f1-all": 0.9584543869843115, "eval_f1-das": 0.9727323316638843, "eval_f1-l1": 0.9554173146708138, "eval_f1-l1l2": 0.9624534250501576, "eval_f1-l2": 0.9623265036351619, "eval_loss": 0.13265174627304077, "eval_precision": 0.9590200445434298, "eval_precision-all": 0.9488064423353466, "eval_precision-das": 0.9685999261174733, "eval_precision-l1": 0.9436763952892985, "eval_precision-l1l2": 0.9531649162645472, "eval_precision-l2": 0.9553805774278216, "eval_recall": 0.970913190529876, "eval_recall-all": 0.9683005576753743, "eval_recall-das": 0.9769001490312966, "eval_recall-l1": 0.9674540682414698, "eval_recall-l1l2": 0.9719247467438495, "eval_recall-l2": 0.9693741677762983, "eval_runtime": 7.359, "eval_samples_per_second": 91.86, "eval_steps_per_second": 5.843, "step": 800 }, { "epoch": 2.36, "eval_ACT": { "f1": 0.9409559512652297, "number": 519, "precision": 0.916058394160584, "recall": 0.9672447013487476 }, "eval_ACT_L1": { "f1": 0.96484375, "number": 503, "precision": 0.9481765834932822, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.37209302325581395, "number": 16, "precision": 0.2962962962962963, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.47368421052631576, "number": 30, "precision": 0.391304347826087, "recall": 0.6 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9609375, "number": 762, "precision": 0.9534883720930233, "recall": 0.968503937007874 }, "eval_PER": { "f1": 0.9852507374631269, "number": 676, "precision": 0.9823529411764705, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9597701149425288, "number": 694, "precision": 0.9570200573065902, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9253731343283583, "number": 33, "precision": 0.9117647058823529, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.42857142857142855, "number": 6, "precision": 0.375, "recall": 0.5 }, "eval_accuracy": 0.9653674280039722, "eval_accuracy-all": 0.9744289970208541, "eval_accuracy-das": 0.9823733862959285, "eval_accuracy-l1": 0.9714498510427011, "eval_accuracy-l1l2": 0.9663604766633564, "eval_accuracy-l2": 0.9774081429990069, "eval_f1": 0.9669171245934731, "eval_f1-all": 0.960616189507339, "eval_f1-das": 0.9740452354467927, "eval_f1-l1": 0.96, "eval_f1-l1l2": 0.9648745519713262, "eval_f1-l2": 0.9613988782580007, "eval_loss": 0.14285241067409515, "eval_precision": 0.9618473895582329, "eval_precision-all": 0.9513529073114565, "eval_precision-das": 0.9693726937269372, "eval_precision-l1": 0.9501285347043702, "eval_precision-l1l2": 0.9559659090909091, "eval_precision-l2": 0.9529103989535644, "eval_recall": 0.9720405862457723, "eval_recall-all": 0.9700616378045201, "eval_recall-das": 0.9787630402384501, "eval_recall-l1": 0.9700787401574803, "eval_recall-l1l2": 0.9739507959479016, "eval_recall-l2": 0.9700399467376831, "eval_runtime": 7.5384, "eval_samples_per_second": 89.674, "eval_steps_per_second": 5.704, "step": 900 }, { "epoch": 2.62, "learning_rate": 8e-05, "loss": 0.1442, "step": 1000 }, { "epoch": 2.62, "eval_ACT": { "f1": 0.9571020019065777, "number": 519, "precision": 0.9471698113207547, "recall": 0.9672447013487476 }, "eval_ACT_L1": { "f1": 0.9782178217821782, "number": 503, "precision": 0.9743589743589743, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.41025641025641024, "number": 16, "precision": 0.34782608695652173, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9919058130978661, "number": 678, "precision": 0.9897209985315712, "recall": 0.9941002949852508 }, "eval_DESC": { "f1": 0.47368421052631576, "number": 30, "precision": 0.391304347826087, "recall": 0.6 }, "eval_FT": { "f1": 0.30769230769230765, "number": 7, "precision": 0.3333333333333333, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9712041884816753, "number": 762, "precision": 0.9686684073107049, "recall": 0.973753280839895 }, "eval_PER": { "f1": 0.9867060561299853, "number": 676, "precision": 0.9852507374631269, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9621157969978557, "number": 694, "precision": 0.9546099290780142, "recall": 0.9697406340057637 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9253731343283583, "number": 33, "precision": 0.9117647058823529, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.42857142857142855, "number": 6, "precision": 0.375, "recall": 0.5 }, "eval_accuracy": 0.9658639523336644, "eval_accuracy-all": 0.9746772591857001, "eval_accuracy-das": 0.9833664349553128, "eval_accuracy-l1": 0.971077457795432, "eval_accuracy-l1l2": 0.9664846077457795, "eval_accuracy-l2": 0.9782770605759682, "eval_f1": 0.9711776626885835, "eval_f1-all": 0.9657484331730068, "eval_f1-das": 0.9778769287971741, "eval_f1-l1": 0.9648529028898724, "eval_f1-l1l2": 0.9700633275762809, "eval_f1-l2": 0.966887417218543, "eval_loss": 0.1273569017648697, "eval_precision": 0.9698673262873847, "eval_precision-all": 0.959177764910249, "eval_precision-das": 0.9758812615955473, "eval_precision-l1": 0.9571280991735537, "eval_precision-l1l2": 0.9647867162897223, "eval_precision-l2": 0.9617918313570487, "eval_recall": 0.9724915445321308, "eval_recall-all": 0.9724097446433813, "eval_recall-das": 0.9798807749627422, "eval_recall-l1": 0.9727034120734908, "eval_recall-l1l2": 0.975397973950796, "eval_recall-l2": 0.9720372836218375, "eval_runtime": 6.084, "eval_samples_per_second": 111.111, "eval_steps_per_second": 7.068, "step": 1000 }, { "epoch": 2.89, "eval_ACT": { "f1": 0.9563567362428842, "number": 519, "precision": 0.9420560747663551, "recall": 0.9710982658959537 }, "eval_ACT_L1": { "f1": 0.9782608695652174, "number": 503, "precision": 0.9724950884086444, "recall": 0.9840954274353877 }, "eval_ACT_L2": { "f1": 0.4285714285714286, "number": 16, "precision": 0.34615384615384615, "recall": 0.5625 }, "eval_CARDINAL": { "f1": 0.9933677229182019, "number": 678, "precision": 0.9926362297496318, "recall": 0.9941002949852508 }, "eval_DESC": { "f1": 0.5070422535211268, "number": 30, "precision": 0.43902439024390244, "recall": 0.6 }, "eval_FT": { "f1": 0.36363636363636365, "number": 7, "precision": 0.5, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9713541666666666, "number": 762, "precision": 0.9638242894056848, "recall": 0.979002624671916 }, "eval_PER": { "f1": 0.9859778597785979, "number": 676, "precision": 0.9837997054491899, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9654676258992806, "number": 694, "precision": 0.9640804597701149, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9696969696969697, "number": 33, "precision": 0.9696969696969697, "recall": 0.9696969696969697 }, "eval_TITREP": { "f1": 0.42857142857142855, "number": 6, "precision": 0.375, "recall": 0.5 }, "eval_accuracy": 0.9636295928500497, "eval_accuracy-all": 0.9731256206554121, "eval_accuracy-das": 0.9812562065541212, "eval_accuracy-l1": 0.9700844091360477, "eval_accuracy-l1l2": 0.964746772591857, "eval_accuracy-l2": 0.9761668321747765, "eval_f1": 0.9710437710437709, "eval_f1-all": 0.9679113185530922, "eval_f1-das": 0.9770114942528736, "eval_f1-l1": 0.9671018276762402, "eval_f1-l1l2": 0.9714039373473201, "eval_f1-l2": 0.9689358889623265, "eval_loss": 0.15453395247459412, "eval_precision": 0.9667039106145251, "eval_precision-all": 0.9620179762249927, "eval_precision-das": 0.9723247232472325, "eval_precision-l1": 0.9620779220779221, "eval_precision-l1l2": 0.9646118721461188, "eval_precision-l2": 0.9619422572178478, "eval_recall": 0.9754227733934611, "eval_recall-all": 0.9738773114176695, "eval_recall-das": 0.9817436661698957, "eval_recall-l1": 0.9721784776902888, "eval_recall-l1l2": 0.9782923299565847, "eval_recall-l2": 0.9760319573901465, "eval_runtime": 6.429, "eval_samples_per_second": 105.148, "eval_steps_per_second": 6.688, "step": 1100 }, { "epoch": 3.15, "eval_ACT": { "f1": 0.9466666666666668, "number": 519, "precision": 0.935969868173258, "recall": 0.9576107899807321 }, "eval_ACT_L1": { "f1": 0.9674234945705825, "number": 503, "precision": 0.9607843137254902, "recall": 0.974155069582505 }, "eval_ACT_L2": { "f1": 0.37837837837837834, "number": 16, "precision": 0.3333333333333333, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.547945205479452, "number": 30, "precision": 0.46511627906976744, "recall": 0.6666666666666666 }, "eval_FT": { "f1": 0.4615384615384615, "number": 7, "precision": 0.5, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9647979139504563, "number": 762, "precision": 0.9585492227979274, "recall": 0.9711286089238845 }, "eval_PER": { "f1": 0.9881656804733728, "number": 676, "precision": 0.9881656804733728, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9691756272401433, "number": 694, "precision": 0.9643366619115549, "recall": 0.9740634005763689 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9393939393939394, "number": 33, "precision": 0.9393939393939394, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.6, "number": 6, "precision": 0.75, "recall": 0.5 }, "eval_accuracy": 0.964746772591857, "eval_accuracy-all": 0.9746151936444886, "eval_accuracy-das": 0.9803872889771599, "eval_accuracy-l1": 0.9708291956305859, "eval_accuracy-l1l2": 0.9652432969215492, "eval_accuracy-l2": 0.9784011916583912, "eval_f1": 0.9706774519716885, "eval_f1-all": 0.9667347534286548, "eval_f1-das": 0.9745589600742803, "eval_f1-l1": 0.9668839634941329, "eval_f1-l1l2": 0.9678068410462776, "eval_f1-l2": 0.9665452136469029, "eval_loss": 0.14055882394313812, "eval_precision": 0.9673085535154501, "eval_precision-all": 0.9611256164780969, "eval_precision-das": 0.9714920399851906, "eval_precision-l1": 0.960621761658031, "eval_precision-l1l2": 0.96117613474165, "eval_precision-l2": 0.961766644693474, "eval_recall": 0.9740698985343855, "eval_recall-all": 0.9724097446433813, "eval_recall-das": 0.977645305514158, "eval_recall-l1": 0.9732283464566929, "eval_recall-l1l2": 0.9745296671490593, "eval_recall-l2": 0.9713715046604527, "eval_runtime": 5.9342, "eval_samples_per_second": 113.916, "eval_steps_per_second": 7.246, "step": 1200 }, { "epoch": 3.41, "eval_ACT": { "f1": 0.9363295880149812, "number": 519, "precision": 0.9107468123861566, "recall": 0.9633911368015414 }, "eval_ACT_L1": { "f1": 0.9591439688715954, "number": 503, "precision": 0.939047619047619, "recall": 0.9801192842942346 }, "eval_ACT_L2": { "f1": 0.35000000000000003, "number": 16, "precision": 0.2916666666666667, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.43037974683544306, "number": 30, "precision": 0.3469387755102041, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.42857142857142855, "number": 7, "precision": 0.42857142857142855, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9636363636363636, "number": 762, "precision": 0.9537275064267352, "recall": 0.973753280839895 }, "eval_PER": { "f1": 0.9845246868091379, "number": 676, "precision": 0.9809104258443465, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9707351891506067, "number": 694, "precision": 0.9618104667609618, "recall": 0.9798270893371758 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9253731343283583, "number": 33, "precision": 0.9117647058823529, "recall": 0.9393939393939394 }, "eval_TITREP": { "f1": 0.42857142857142855, "number": 6, "precision": 0.375, "recall": 0.5 }, "eval_accuracy": 0.967974180734856, "eval_accuracy-all": 0.9767254220456802, "eval_accuracy-das": 0.9826216484607746, "eval_accuracy-l1": 0.9735600794438928, "eval_accuracy-l1l2": 0.9685948361469712, "eval_accuracy-l2": 0.9798907646474677, "eval_f1": 0.9691876750700281, "eval_f1-all": 0.961889581220113, "eval_f1-das": 0.9733333333333334, "eval_f1-l1": 0.960951642099819, "eval_f1-l1l2": 0.9658928059615935, "eval_f1-l2": 0.963085036255768, "eval_loss": 0.13519717752933502, "eval_precision": 0.9632516703786191, "eval_precision-all": 0.9499141385231826, "eval_precision-das": 0.96759941089838, "eval_precision-l1": 0.9469928644240571, "eval_precision-l1l2": 0.9565711041725802, "eval_precision-l2": 0.9536553524804178, "eval_recall": 0.9751972942502819, "eval_recall-all": 0.9741708247725271, "eval_recall-das": 0.9791356184798807, "eval_recall-l1": 0.9753280839895013, "eval_recall-l1l2": 0.975397973950796, "eval_recall-l2": 0.9727030625832224, "eval_runtime": 6.3863, "eval_samples_per_second": 105.852, "eval_steps_per_second": 6.733, "step": 1300 }, { "epoch": 3.67, "eval_ACT": { "f1": 0.9461756373937679, "number": 519, "precision": 0.9277777777777778, "recall": 0.9653179190751445 }, "eval_ACT_L1": { "f1": 0.9686274509803922, "number": 503, "precision": 0.9555125725338491, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.358974358974359, "number": 16, "precision": 0.30434782608695654, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9933774834437086, "number": 678, "precision": 0.9911894273127754, "recall": 0.995575221238938 }, "eval_DESC": { "f1": 0.5507246376811593, "number": 30, "precision": 0.48717948717948717, "recall": 0.6333333333333333 }, "eval_FT": { "f1": 0.5, "number": 7, "precision": 0.6, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9679529103989535, "number": 762, "precision": 0.9647979139504563, "recall": 0.9711286089238845 }, "eval_PER": { "f1": 0.9881656804733728, "number": 676, "precision": 0.9881656804733728, "recall": 0.9881656804733728 }, "eval_SPAT": { "f1": 0.9727403156384505, "number": 694, "precision": 0.9685714285714285, "recall": 0.9769452449567724 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9696969696969697, "number": 33, "precision": 0.9696969696969697, "recall": 0.9696969696969697 }, "eval_TITREP": { "f1": 0.4615384615384615, "number": 6, "precision": 0.42857142857142855, "recall": 0.5 }, "eval_accuracy": 0.9664846077457795, "eval_accuracy-all": 0.9749255213505462, "eval_accuracy-das": 0.9826216484607746, "eval_accuracy-l1": 0.9723187686196624, "eval_accuracy-l1l2": 0.9669811320754716, "eval_accuracy-l2": 0.97753227408143, "eval_f1": 0.9732283464566929, "eval_f1-all": 0.9683442742523706, "eval_f1-das": 0.9756912228613843, "eval_f1-l1": 0.9689861871253583, "eval_f1-l1l2": 0.9711981566820277, "eval_f1-l2": 0.9675281643472498, "eval_loss": 0.1356203556060791, "eval_precision": 0.971043771043771, "eval_precision-all": 0.9625870069605569, "eval_precision-das": 0.9719038817005545, "eval_precision-l1": 0.9622153209109731, "eval_precision-l1l2": 0.9664660361134996, "eval_precision-l2": 0.9630606860158312, "eval_recall": 0.9754227733934611, "eval_recall-all": 0.9741708247725271, "eval_recall-das": 0.9795081967213115, "eval_recall-l1": 0.9758530183727034, "eval_recall-l1l2": 0.9759768451519537, "eval_recall-l2": 0.9720372836218375, "eval_runtime": 7.0867, "eval_samples_per_second": 95.39, "eval_steps_per_second": 6.068, "step": 1400 } ], "max_steps": 5000, "num_train_epochs": 14, "total_flos": 564085470663792.0, "trial_name": null, "trial_params": null }