{ "best_metric": 0.873456597328186, "best_model_checkpoint": "nyt-ingredient-tagger-gte-small/checkpoint-15000", "epoch": 5.0, "eval_steps": 1000, "global_step": 25255, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.1, "learning_rate": 4.9010097010492975e-05, "loss": 1.1066, "step": 500 }, { "epoch": 0.2, "learning_rate": 4.802019402098595e-05, "loss": 0.9427, "step": 1000 }, { "epoch": 0.2, "eval_COMMENT": { "f1": 0.6827173347214992, "number": 6735, "precision": 0.6076682497393722, "recall": 0.7789161098737936 }, "eval_NAME": { "f1": 0.7975022301516503, "number": 8801, "precision": 0.7829228243021347, "recall": 0.8126349278491081 }, "eval_QTY": { "f1": 0.9832785279507451, "number": 7088, "precision": 0.97529493407356, "recall": 0.9913939051918735 }, "eval_RANGE_END": { "f1": 0.6793893129770994, "number": 91, "precision": 0.52046783625731, "recall": 0.978021978021978 }, "eval_UNIT": { "f1": 0.9474663734032653, "number": 5697, "precision": 0.914435009797518, "recall": 0.982973494821836 }, "eval_loss": 0.9320821166038513, "eval_overall_accuracy": 0.8183442525312686, "eval_overall_f1": 0.8416219839142092, "eval_overall_precision": 0.8031853652296277, "eval_overall_recall": 0.883922286357877, "eval_runtime": 12.4448, "eval_samples_per_second": 683.5, "eval_steps_per_second": 21.374, "step": 1000 }, { "epoch": 0.3, "learning_rate": 4.703029103147892e-05, "loss": 0.9333, "step": 1500 }, { "epoch": 0.4, "learning_rate": 4.6040388041971886e-05, "loss": 0.9169, "step": 2000 }, { "epoch": 0.4, "eval_COMMENT": { "f1": 0.7030077684084721, "number": 6735, "precision": 0.6358395387941388, "recall": 0.7860430586488493 }, "eval_NAME": { "f1": 0.798910626945309, "number": 8801, "precision": 0.781960613643782, "recall": 0.8166117486649245 }, "eval_QTY": { "f1": 0.9835744740336898, "number": 7088, "precision": 0.9746502285635129, "recall": 0.9926636568848759 }, "eval_RANGE_END": { "f1": 0.7543859649122806, "number": 91, "precision": 0.6277372262773723, "recall": 0.945054945054945 }, "eval_UNIT": { "f1": 0.9503173931443081, "number": 5697, "precision": 0.9176201372997712, "recall": 0.9854309285588907 }, "eval_loss": 0.9112022519111633, "eval_overall_accuracy": 0.8256066398970201, "eval_overall_f1": 0.8490143595441308, "eval_overall_precision": 0.8136878448581847, "eval_overall_recall": 0.8875475151344502, "eval_runtime": 12.0886, "eval_samples_per_second": 703.64, "eval_steps_per_second": 22.004, "step": 2000 }, { "epoch": 0.49, "learning_rate": 4.505048505246486e-05, "loss": 0.9126, "step": 2500 }, { "epoch": 0.59, "learning_rate": 4.406058206295783e-05, "loss": 0.9, "step": 3000 }, { "epoch": 0.59, "eval_COMMENT": { "f1": 0.7219525171244263, "number": 6735, "precision": 0.6538183570224042, "recall": 0.8059391239792131 }, "eval_NAME": { "f1": 0.8061383928571427, "number": 8801, "precision": 0.7920824651825858, "recall": 0.8207021929326213 }, "eval_QTY": { "f1": 0.9870641169853768, "number": 7088, "precision": 0.9837443946188341, "recall": 0.9904063205417607 }, "eval_RANGE_END": { "f1": 0.7309644670050762, "number": 91, "precision": 0.6792452830188679, "recall": 0.7912087912087912 }, "eval_UNIT": { "f1": 0.9483108108108108, "number": 5697, "precision": 0.9138857235878235, "recall": 0.9854309285588907 }, "eval_loss": 0.902090847492218, "eval_overall_accuracy": 0.8302368921593114, "eval_overall_f1": 0.856395015029214, "eval_overall_precision": 0.8231188729468285, "eval_overall_recall": 0.8924750105589188, "eval_runtime": 14.5748, "eval_samples_per_second": 583.612, "eval_steps_per_second": 18.251, "step": 3000 }, { "epoch": 0.69, "learning_rate": 4.3070679073450804e-05, "loss": 0.9058, "step": 3500 }, { "epoch": 0.79, "learning_rate": 4.208077608394378e-05, "loss": 0.9061, "step": 4000 }, { "epoch": 0.79, "eval_COMMENT": { "f1": 0.7202272266179753, "number": 6735, "precision": 0.6613263785394933, "recall": 0.7906458797327395 }, "eval_NAME": { "f1": 0.8081158124196521, "number": 8801, "precision": 0.7952695269526953, "recall": 0.821383933643904 }, "eval_QTY": { "f1": 0.9869014084507043, "number": 7088, "precision": 0.985236220472441, "recall": 0.9885722347629797 }, "eval_RANGE_END": { "f1": 0.7592592592592593, "number": 91, "precision": 0.656, "recall": 0.9010989010989011 }, "eval_UNIT": { "f1": 0.9522355137015356, "number": 5697, "precision": 0.9215106732348112, "recall": 0.9850798665964543 }, "eval_loss": 0.8911505341529846, "eval_overall_accuracy": 0.8325616246229515, "eval_overall_f1": 0.857831898235424, "eval_overall_precision": 0.8288752502543569, "eval_overall_recall": 0.8888849781782345, "eval_runtime": 12.1725, "eval_samples_per_second": 698.791, "eval_steps_per_second": 21.853, "step": 4000 }, { "epoch": 0.89, "learning_rate": 4.109087309443675e-05, "loss": 0.8962, "step": 4500 }, { "epoch": 0.99, "learning_rate": 4.010097010492972e-05, "loss": 0.8889, "step": 5000 }, { "epoch": 0.99, "eval_COMMENT": { "f1": 0.7147275101367603, "number": 6735, "precision": 0.6653019447287615, "recall": 0.7720861172976986 }, "eval_NAME": { "f1": 0.8085439498993513, "number": 8801, "precision": 0.7959925134867335, "recall": 0.8214975570957845 }, "eval_QTY": { "f1": 0.9872508276396421, "number": 7088, "precision": 0.9857926571951048, "recall": 0.9887133182844243 }, "eval_RANGE_END": { "f1": 0.7623318385650225, "number": 91, "precision": 0.6439393939393939, "recall": 0.9340659340659341 }, "eval_UNIT": { "f1": 0.9522514868309261, "number": 5697, "precision": 0.9227729293594599, "recall": 0.9836756187467088 }, "eval_loss": 0.8908107876777649, "eval_overall_accuracy": 0.8310630367538281, "eval_overall_f1": 0.8572110874200426, "eval_overall_precision": 0.8316618674080694, "eval_overall_recall": 0.8843798395044348, "eval_runtime": 12.1451, "eval_samples_per_second": 700.364, "eval_steps_per_second": 21.902, "step": 5000 }, { "epoch": 1.09, "learning_rate": 3.911106711542269e-05, "loss": 0.8786, "step": 5500 }, { "epoch": 1.19, "learning_rate": 3.812116412591566e-05, "loss": 0.88, "step": 6000 }, { "epoch": 1.19, "eval_COMMENT": { "f1": 0.7254114813327982, "number": 6735, "precision": 0.660211910851297, "recall": 0.8048997772828508 }, "eval_NAME": { "f1": 0.8067433292397008, "number": 8801, "precision": 0.7929331723910896, "recall": 0.8210430632882627 }, "eval_QTY": { "f1": 0.9868633649455567, "number": 7088, "precision": 0.9827899818105499, "recall": 0.9909706546275395 }, "eval_RANGE_END": { "f1": 0.7631578947368421, "number": 91, "precision": 0.635036496350365, "recall": 0.9560439560439561 }, "eval_UNIT": { "f1": 0.9526315789473684, "number": 5697, "precision": 0.9224067072168338, "recall": 0.984904335615236 }, "eval_loss": 0.8873026371002197, "eval_overall_accuracy": 0.8337912351822321, "eval_overall_f1": 0.8584674212814917, "eval_overall_precision": 0.8265941155387573, "eval_overall_recall": 0.8928973673095875, "eval_runtime": 13.0658, "eval_samples_per_second": 651.014, "eval_steps_per_second": 20.359, "step": 6000 }, { "epoch": 1.29, "learning_rate": 3.7131261136408633e-05, "loss": 0.8761, "step": 6500 }, { "epoch": 1.39, "learning_rate": 3.6141358146901606e-05, "loss": 0.8751, "step": 7000 }, { "epoch": 1.39, "eval_COMMENT": { "f1": 0.7309149972929073, "number": 6735, "precision": 0.6715582638975252, "recall": 0.8017817371937639 }, "eval_NAME": { "f1": 0.8121178120617111, "number": 8801, "precision": 0.8020833333333334, "recall": 0.8224065447108283 }, "eval_QTY": { "f1": 0.9871903153153153, "number": 7088, "precision": 0.9849719101123595, "recall": 0.9894187358916479 }, "eval_RANGE_END": { "f1": 0.7565217391304349, "number": 91, "precision": 0.6258992805755396, "recall": 0.9560439560439561 }, "eval_UNIT": { "f1": 0.9523647209203238, "number": 5697, "precision": 0.9254720105995363, "recall": 0.9808671230472178 }, "eval_loss": 0.8865671157836914, "eval_overall_accuracy": 0.834847931756614, "eval_overall_f1": 0.8618096437200122, "eval_overall_precision": 0.8341347737303207, "eval_overall_recall": 0.8913839222863579, "eval_runtime": 12.663, "eval_samples_per_second": 671.721, "eval_steps_per_second": 21.006, "step": 7000 }, { "epoch": 1.48, "learning_rate": 3.515145515739457e-05, "loss": 0.8836, "step": 7500 }, { "epoch": 1.58, "learning_rate": 3.416155216788755e-05, "loss": 0.8816, "step": 8000 }, { "epoch": 1.58, "eval_COMMENT": { "f1": 0.7336898395721925, "number": 6735, "precision": 0.6672340425531915, "recall": 0.8148478099480326 }, "eval_NAME": { "f1": 0.8090705487122061, "number": 8801, "precision": 0.797549398388343, "recall": 0.8209294398363822 }, "eval_QTY": { "f1": 0.9869745828346124, "number": 7088, "precision": 0.9851018973998594, "recall": 0.988854401805869 }, "eval_RANGE_END": { "f1": 0.7623318385650225, "number": 91, "precision": 0.6439393939393939, "recall": 0.9340659340659341 }, "eval_UNIT": { "f1": 0.9534507701472215, "number": 5697, "precision": 0.9253386190948133, "recall": 0.9833245567842724 }, "eval_loss": 0.8822705745697021, "eval_overall_accuracy": 0.835962266325962, "eval_overall_f1": 0.8613658321609573, "eval_overall_precision": 0.8307667157103155, "eval_overall_recall": 0.8943052231451499, "eval_runtime": 12.6561, "eval_samples_per_second": 672.089, "eval_steps_per_second": 21.018, "step": 8000 }, { "epoch": 1.68, "learning_rate": 3.317164917838052e-05, "loss": 0.8785, "step": 8500 }, { "epoch": 1.78, "learning_rate": 3.218174618887349e-05, "loss": 0.8756, "step": 9000 }, { "epoch": 1.78, "eval_COMMENT": { "f1": 0.7321063394683027, "number": 6735, "precision": 0.6767485822306238, "recall": 0.7973273942093542 }, "eval_NAME": { "f1": 0.8122265844083006, "number": 8801, "precision": 0.8019714254070218, "recall": 0.8227474150664698 }, "eval_QTY": { "f1": 0.9867829021372329, "number": 7088, "precision": 0.9834641255605381, "recall": 0.9901241534988713 }, "eval_RANGE_END": { "f1": 0.7864077669902914, "number": 91, "precision": 0.7043478260869566, "recall": 0.8901098901098901 }, "eval_UNIT": { "f1": 0.9523567310952866, "number": 5697, "precision": 0.9209706509263814, "recall": 0.9859575215025452 }, "eval_loss": 0.8817200660705566, "eval_overall_accuracy": 0.8375377048550404, "eval_overall_f1": 0.8625481047576883, "eval_overall_precision": 0.8354885531437619, "eval_overall_recall": 0.891419118682247, "eval_runtime": 13.1407, "eval_samples_per_second": 647.302, "eval_steps_per_second": 20.242, "step": 9000 }, { "epoch": 1.88, "learning_rate": 3.119184319936647e-05, "loss": 0.8739, "step": 9500 }, { "epoch": 1.98, "learning_rate": 3.0201940209859435e-05, "loss": 0.8695, "step": 10000 }, { "epoch": 1.98, "eval_COMMENT": { "f1": 0.7372581084764241, "number": 6735, "precision": 0.6812743986903412, "recall": 0.8032665181885672 }, "eval_NAME": { "f1": 0.8095131505316173, "number": 8801, "precision": 0.7975521005623553, "recall": 0.821838427451426 }, "eval_QTY": { "f1": 0.9853692684634231, "number": 7088, "precision": 0.9779074614422676, "recall": 0.9929458239277652 }, "eval_RANGE_END": { "f1": 0.7639484978540774, "number": 91, "precision": 0.6267605633802817, "recall": 0.978021978021978 }, "eval_UNIT": { "f1": 0.9517510387518019, "number": 5697, "precision": 0.9206036745406824, "recall": 0.9850798665964543 }, "eval_loss": 0.8788286447525024, "eval_overall_accuracy": 0.8376145555149955, "eval_overall_f1": 0.8624972390709686, "eval_overall_precision": 0.8337001149614058, "eval_overall_recall": 0.8933549204561453, "eval_runtime": 12.7467, "eval_samples_per_second": 667.312, "eval_steps_per_second": 20.868, "step": 10000 }, { "epoch": 2.08, "learning_rate": 2.9212037220352405e-05, "loss": 0.8595, "step": 10500 }, { "epoch": 2.18, "learning_rate": 2.8222134230845377e-05, "loss": 0.8537, "step": 11000 }, { "epoch": 2.18, "eval_COMMENT": { "f1": 0.741655859668282, "number": 6735, "precision": 0.6863314805457301, "recall": 0.8066815144766147 }, "eval_NAME": { "f1": 0.8129971988795517, "number": 8801, "precision": 0.8018565587357719, "recall": 0.8244517668446767 }, "eval_QTY": { "f1": 0.9869308600337269, "number": 7088, "precision": 0.9830627099664053, "recall": 0.9908295711060948 }, "eval_RANGE_END": { "f1": 0.792626728110599, "number": 91, "precision": 0.6825396825396826, "recall": 0.945054945054945 }, "eval_UNIT": { "f1": 0.9528510638297872, "number": 5697, "precision": 0.9248306624814142, "recall": 0.9826224328593997 }, "eval_loss": 0.8804447650909424, "eval_overall_accuracy": 0.8384022747795347, "eval_overall_f1": 0.8652810902896081, "eval_overall_precision": 0.8384838880084522, "eval_overall_recall": 0.8938476699985921, "eval_runtime": 13.7729, "eval_samples_per_second": 617.589, "eval_steps_per_second": 19.313, "step": 11000 }, { "epoch": 2.28, "learning_rate": 2.7232231241338353e-05, "loss": 0.8543, "step": 11500 }, { "epoch": 2.38, "learning_rate": 2.6242328251831323e-05, "loss": 0.854, "step": 12000 }, { "epoch": 2.38, "eval_COMMENT": { "f1": 0.7438095238095238, "number": 6735, "precision": 0.6863779033270558, "recall": 0.8117297698589458 }, "eval_NAME": { "f1": 0.8151350137539999, "number": 8801, "precision": 0.8055925432756325, "recall": 0.8249062606521986 }, "eval_QTY": { "f1": 0.9872119168071951, "number": 7088, "precision": 0.9833426651735723, "recall": 0.9911117381489842 }, "eval_RANGE_END": { "f1": 0.7982062780269058, "number": 91, "precision": 0.6742424242424242, "recall": 0.978021978021978 }, "eval_UNIT": { "f1": 0.9521952873368368, "number": 5697, "precision": 0.9206687428290444, "recall": 0.9859575215025452 }, "eval_loss": 0.8816655278205872, "eval_overall_accuracy": 0.8389594420642087, "eval_overall_f1": 0.8664193581322533, "eval_overall_precision": 0.8387033010476379, "eval_overall_recall": 0.8960298465437139, "eval_runtime": 12.7157, "eval_samples_per_second": 668.937, "eval_steps_per_second": 20.919, "step": 12000 }, { "epoch": 2.47, "learning_rate": 2.5252425262324292e-05, "loss": 0.8609, "step": 12500 }, { "epoch": 2.57, "learning_rate": 2.4262522272817265e-05, "loss": 0.8582, "step": 13000 }, { "epoch": 2.57, "eval_COMMENT": { "f1": 0.7477459155311504, "number": 6735, "precision": 0.6879990019960079, "recall": 0.8188567186340014 }, "eval_NAME": { "f1": 0.8148396844049018, "number": 8801, "precision": 0.8027563395810364, "recall": 0.8272923531416885 }, "eval_QTY": { "f1": 0.9867996067967982, "number": 7088, "precision": 0.9822476935979871, "recall": 0.9913939051918735 }, "eval_RANGE_END": { "f1": 0.772093023255814, "number": 91, "precision": 0.6693548387096774, "recall": 0.9120879120879121 }, "eval_UNIT": { "f1": 0.9524215552523875, "number": 5697, "precision": 0.9260487481346377, "recall": 0.9803405301035633 }, "eval_loss": 0.8745654225349426, "eval_overall_accuracy": 0.8401890526234894, "eval_overall_f1": 0.8669376094682606, "eval_overall_precision": 0.8386576739595328, "eval_overall_recall": 0.897191327608053, "eval_runtime": 10.2599, "eval_samples_per_second": 829.055, "eval_steps_per_second": 25.926, "step": 13000 }, { "epoch": 2.67, "learning_rate": 2.3272619283310237e-05, "loss": 0.8617, "step": 13500 }, { "epoch": 2.77, "learning_rate": 2.2282716293803206e-05, "loss": 0.8554, "step": 14000 }, { "epoch": 2.77, "eval_COMMENT": { "f1": 0.7481907338518768, "number": 6735, "precision": 0.6870807453416149, "recall": 0.8212323682256867 }, "eval_NAME": { "f1": 0.8165394973070018, "number": 8801, "precision": 0.8064945140197274, "recall": 0.8268378593341665 }, "eval_QTY": { "f1": 0.9876282862364684, "number": 7088, "precision": 0.9841692350798543, "recall": 0.9911117381489842 }, "eval_RANGE_END": { "f1": 0.7777777777777778, "number": 91, "precision": 0.672, "recall": 0.9230769230769231 }, "eval_UNIT": { "f1": 0.9534646739130435, "number": 5697, "precision": 0.923507155782201, "recall": 0.9854309285588907 }, "eval_loss": 0.8742881417274475, "eval_overall_accuracy": 0.8416107898326577, "eval_overall_f1": 0.8680027878355177, "eval_overall_precision": 0.8394213381555153, "eval_overall_recall": 0.8985991834436153, "eval_runtime": 10.2908, "eval_samples_per_second": 826.561, "eval_steps_per_second": 25.848, "step": 14000 }, { "epoch": 2.87, "learning_rate": 2.129281330429618e-05, "loss": 0.8553, "step": 14500 }, { "epoch": 2.97, "learning_rate": 2.0302910314789152e-05, "loss": 0.86, "step": 15000 }, { "epoch": 2.97, "eval_COMMENT": { "f1": 0.7449105068998496, "number": 6735, "precision": 0.6898646083765658, "recall": 0.8095025983667409 }, "eval_NAME": { "f1": 0.8143625364104862, "number": 8801, "precision": 0.8031156778256546, "recall": 0.8259288717191229 }, "eval_QTY": { "f1": 0.9873542222846705, "number": 7088, "precision": 0.9833473271760426, "recall": 0.9913939051918735 }, "eval_RANGE_END": { "f1": 0.7547169811320755, "number": 91, "precision": 0.6611570247933884, "recall": 0.8791208791208791 }, "eval_UNIT": { "f1": 0.9538566320449514, "number": 5697, "precision": 0.9261034881798644, "recall": 0.9833245567842724 }, "eval_loss": 0.873456597328186, "eval_overall_accuracy": 0.8422640204422756, "eval_overall_f1": 0.866705292934801, "eval_overall_precision": 0.8401057152296003, "eval_overall_recall": 0.8950443474588202, "eval_runtime": 10.9665, "eval_samples_per_second": 775.635, "eval_steps_per_second": 24.256, "step": 15000 }, { "epoch": 3.07, "learning_rate": 1.9313007325282124e-05, "loss": 0.8414, "step": 15500 }, { "epoch": 3.17, "learning_rate": 1.8323104335775097e-05, "loss": 0.845, "step": 16000 }, { "epoch": 3.17, "eval_COMMENT": { "f1": 0.7413599325653274, "number": 6735, "precision": 0.7035061991734436, "recall": 0.7835189309576838 }, "eval_NAME": { "f1": 0.8080446927374302, "number": 8801, "precision": 0.7948126167710737, "recall": 0.8217248039995455 }, "eval_QTY": { "f1": 0.9871533871533871, "number": 7088, "precision": 0.982394858180802, "recall": 0.9919582392776524 }, "eval_RANGE_END": { "f1": 0.7777777777777778, "number": 91, "precision": 0.719626168224299, "recall": 0.8461538461538461 }, "eval_UNIT": { "f1": 0.9531036834924966, "number": 5697, "precision": 0.9267119880616813, "recall": 0.981042654028436 }, "eval_loss": 0.878207266330719, "eval_overall_accuracy": 0.8396895233337817, "eval_overall_f1": 0.8645960176308162, "eval_overall_precision": 0.8431510286001004, "eval_overall_recall": 0.8871603547796706, "eval_runtime": 11.5191, "eval_samples_per_second": 738.424, "eval_steps_per_second": 23.092, "step": 16000 }, { "epoch": 3.27, "learning_rate": 1.7333201346268066e-05, "loss": 0.8353, "step": 16500 }, { "epoch": 3.37, "learning_rate": 1.634329835676104e-05, "loss": 0.846, "step": 17000 }, { "epoch": 3.37, "eval_COMMENT": { "f1": 0.7456715182451542, "number": 6735, "precision": 0.6963411491883535, "recall": 0.8025241276911655 }, "eval_NAME": { "f1": 0.8116995693753145, "number": 8801, "precision": 0.7992290748898678, "recall": 0.8245653902965572 }, "eval_QTY": { "f1": 0.9874859392575928, "number": 7088, "precision": 0.984164798206278, "recall": 0.9908295711060948 }, "eval_RANGE_END": { "f1": 0.7641509433962264, "number": 91, "precision": 0.6694214876033058, "recall": 0.8901098901098901 }, "eval_UNIT": { "f1": 0.9531343029684443, "number": 5697, "precision": 0.9245874587458746, "recall": 0.9835000877654906 }, "eval_loss": 0.8758910298347473, "eval_overall_accuracy": 0.8402659032834444, "eval_overall_f1": 0.8662648751088423, "eval_overall_precision": 0.8411751052753739, "eval_overall_recall": 0.8928973673095875, "eval_runtime": 12.1757, "eval_samples_per_second": 698.602, "eval_steps_per_second": 21.847, "step": 17000 }, { "epoch": 3.46, "learning_rate": 1.535339536725401e-05, "loss": 0.8452, "step": 17500 }, { "epoch": 3.56, "learning_rate": 1.4363492377746981e-05, "loss": 0.8392, "step": 18000 }, { "epoch": 3.56, "eval_COMMENT": { "f1": 0.7475519133273144, "number": 6735, "precision": 0.7022442588726514, "recall": 0.799109131403118 }, "eval_NAME": { "f1": 0.8129017832187377, "number": 8801, "precision": 0.8000660211267606, "recall": 0.8261561186228837 }, "eval_QTY": { "f1": 0.987295570997403, "number": 7088, "precision": 0.9823997765050985, "recall": 0.9922404063205418 }, "eval_RANGE_END": { "f1": 0.7809523809523808, "number": 91, "precision": 0.6890756302521008, "recall": 0.9010989010989011 }, "eval_UNIT": { "f1": 0.9535298615240847, "number": 5697, "precision": 0.9239380968060587, "recall": 0.9850798665964543 }, "eval_loss": 0.8759370446205139, "eval_overall_accuracy": 0.8409191338930623, "eval_overall_f1": 0.8674550550276846, "eval_overall_precision": 0.8430773319160244, "eval_overall_recall": 0.8932845276643672, "eval_runtime": 12.9734, "eval_samples_per_second": 655.647, "eval_steps_per_second": 20.503, "step": 18000 }, { "epoch": 3.66, "learning_rate": 1.3373589388239954e-05, "loss": 0.8436, "step": 18500 }, { "epoch": 3.76, "learning_rate": 1.2383686398732925e-05, "loss": 0.8375, "step": 19000 }, { "epoch": 3.76, "eval_COMMENT": { "f1": 0.7500341670083366, "number": 6735, "precision": 0.6947714900620332, "recall": 0.8148478099480326 }, "eval_NAME": { "f1": 0.8153302283822457, "number": 8801, "precision": 0.8054323725055432, "recall": 0.8254743779116009 }, "eval_QTY": { "f1": 0.9877046300850137, "number": 7088, "precision": 0.9837648705388383, "recall": 0.991676072234763 }, "eval_RANGE_END": { "f1": 0.7751196172248803, "number": 91, "precision": 0.6864406779661016, "recall": 0.8901098901098901 }, "eval_UNIT": { "f1": 0.9524700280588385, "number": 5697, "precision": 0.9236477572559367, "recall": 0.9831490258030542 }, "eval_loss": 0.8779729008674622, "eval_overall_accuracy": 0.8412841745278488, "eval_overall_f1": 0.8682191687408367, "eval_overall_precision": 0.8418964491172386, "eval_overall_recall": 0.8962410249190483, "eval_runtime": 12.8106, "eval_samples_per_second": 663.98, "eval_steps_per_second": 20.764, "step": 19000 }, { "epoch": 3.86, "learning_rate": 1.1393783409225896e-05, "loss": 0.8358, "step": 19500 }, { "epoch": 3.96, "learning_rate": 1.0403880419718868e-05, "loss": 0.8366, "step": 20000 }, { "epoch": 3.96, "eval_COMMENT": { "f1": 0.7509641873278236, "number": 6735, "precision": 0.7003211303789338, "recall": 0.8095025983667409 }, "eval_NAME": { "f1": 0.8146694330735154, "number": 8801, "precision": 0.804251550044287, "recall": 0.8253607544597205 }, "eval_QTY": { "f1": 0.9872137136433891, "number": 7088, "precision": 0.9832073887489504, "recall": 0.9912528216704289 }, "eval_RANGE_END": { "f1": 0.7783251231527095, "number": 91, "precision": 0.7053571428571429, "recall": 0.8681318681318682 }, "eval_UNIT": { "f1": 0.9528422125924038, "number": 5697, "precision": 0.9234189723320159, "recall": 0.9842022116903634 }, "eval_loss": 0.8742325305938721, "eval_overall_accuracy": 0.841668427827624, "eval_overall_f1": 0.8684574531668914, "eval_overall_precision": 0.8434670116429496, "eval_overall_recall": 0.8949739546670421, "eval_runtime": 12.4853, "eval_samples_per_second": 681.281, "eval_steps_per_second": 21.305, "step": 20000 }, { "epoch": 4.06, "learning_rate": 9.41397743021184e-06, "loss": 0.8274, "step": 20500 }, { "epoch": 4.16, "learning_rate": 8.424074440704812e-06, "loss": 0.8189, "step": 21000 }, { "epoch": 4.16, "eval_COMMENT": { "f1": 0.7531697905181918, "number": 6735, "precision": 0.7027131284557027, "recall": 0.8114328136599851 }, "eval_NAME": { "f1": 0.8157082748948107, "number": 8801, "precision": 0.8056294326241135, "recall": 0.8260424951710033 }, "eval_QTY": { "f1": 0.9872937872937874, "number": 7088, "precision": 0.9825345815285734, "recall": 0.9920993227990971 }, "eval_RANGE_END": { "f1": 0.7751196172248803, "number": 91, "precision": 0.6864406779661016, "recall": 0.8901098901098901 }, "eval_UNIT": { "f1": 0.9539115646258504, "number": 5697, "precision": 0.9251195777667821, "recall": 0.9845532736527998 }, "eval_loss": 0.8799063563346863, "eval_overall_accuracy": 0.8425137850871295, "eval_overall_f1": 0.8695667025328346, "eval_overall_precision": 0.8446531072696506, "eval_overall_recall": 0.8959946501478249, "eval_runtime": 14.411, "eval_samples_per_second": 590.242, "eval_steps_per_second": 18.458, "step": 21000 }, { "epoch": 4.26, "learning_rate": 7.434171451197783e-06, "loss": 0.8352, "step": 21500 }, { "epoch": 4.36, "learning_rate": 6.444268461690754e-06, "loss": 0.8269, "step": 22000 }, { "epoch": 4.36, "eval_COMMENT": { "f1": 0.7478056534660309, "number": 6735, "precision": 0.6995086630462891, "recall": 0.8032665181885672 }, "eval_NAME": { "f1": 0.8122026308424294, "number": 8801, "precision": 0.8004192409532216, "recall": 0.8243381433927963 }, "eval_QTY": { "f1": 0.987140749068934, "number": 7088, "precision": 0.9833403331933361, "recall": 0.9909706546275395 }, "eval_RANGE_END": { "f1": 0.7843137254901961, "number": 91, "precision": 0.7079646017699115, "recall": 0.8791208791208791 }, "eval_UNIT": { "f1": 0.9531422740028915, "number": 5697, "precision": 0.9244473771032663, "recall": 0.9836756187467088 }, "eval_loss": 0.87808758020401, "eval_overall_accuracy": 0.8418029164825453, "eval_overall_f1": 0.8670379989065063, "eval_overall_precision": 0.8425089653340417, "eval_overall_recall": 0.8930381528931437, "eval_runtime": 13.8025, "eval_samples_per_second": 616.264, "eval_steps_per_second": 19.272, "step": 22000 }, { "epoch": 4.45, "learning_rate": 5.4543654721837265e-06, "loss": 0.8231, "step": 22500 }, { "epoch": 4.55, "learning_rate": 4.4644624826766974e-06, "loss": 0.829, "step": 23000 }, { "epoch": 4.55, "eval_COMMENT": { "f1": 0.7491170971539367, "number": 6735, "precision": 0.70192058136517, "recall": 0.8031180400890868 }, "eval_NAME": { "f1": 0.8114726601811473, "number": 8801, "precision": 0.7987892129884425, "recall": 0.8245653902965572 }, "eval_QTY": { "f1": 0.9874929735806632, "number": 7088, "precision": 0.9836226203807391, "recall": 0.9913939051918735 }, "eval_RANGE_END": { "f1": 0.7745098039215685, "number": 91, "precision": 0.6991150442477876, "recall": 0.8681318681318682 }, "eval_UNIT": { "f1": 0.9533855052739026, "number": 5697, "precision": 0.9249050998514606, "recall": 0.9836756187467088 }, "eval_loss": 0.8793897032737732, "eval_overall_accuracy": 0.8421679571173317, "eval_overall_f1": 0.8672738768605068, "eval_overall_precision": 0.8428604643438403, "eval_overall_recall": 0.8931437420808109, "eval_runtime": 11.6472, "eval_samples_per_second": 730.305, "eval_steps_per_second": 22.838, "step": 23000 }, { "epoch": 4.65, "learning_rate": 3.4745594931696697e-06, "loss": 0.8202, "step": 23500 }, { "epoch": 4.75, "learning_rate": 2.484656503662641e-06, "loss": 0.8183, "step": 24000 }, { "epoch": 4.75, "eval_COMMENT": { "f1": 0.7519550006859651, "number": 6735, "precision": 0.6988397296952696, "recall": 0.8138084632516703 }, "eval_NAME": { "f1": 0.8162898973467212, "number": 8801, "precision": 0.806115665854199, "recall": 0.826724235882286 }, "eval_QTY": { "f1": 0.9871389415981446, "number": 7088, "precision": 0.9834757036829576, "recall": 0.9908295711060948 }, "eval_RANGE_END": { "f1": 0.7692307692307692, "number": 91, "precision": 0.6837606837606838, "recall": 0.8791208791208791 }, "eval_UNIT": { "f1": 0.9531422740028915, "number": 5697, "precision": 0.9244473771032663, "recall": 0.9836756187467088 }, "eval_loss": 0.8815182447433472, "eval_overall_accuracy": 0.8428019750619609, "eval_overall_f1": 0.8690636678554975, "eval_overall_precision": 0.8434860379608466, "eval_overall_recall": 0.8962410249190483, "eval_runtime": 10.2447, "eval_samples_per_second": 830.287, "eval_steps_per_second": 25.965, "step": 24000 }, { "epoch": 4.85, "learning_rate": 1.4947535141556129e-06, "loss": 0.8271, "step": 24500 }, { "epoch": 4.95, "learning_rate": 5.048505246485845e-07, "loss": 0.8201, "step": 25000 }, { "epoch": 4.95, "eval_COMMENT": { "f1": 0.7506890848952591, "number": 6735, "precision": 0.7003986112897004, "recall": 0.8087602078693392 }, "eval_NAME": { "f1": 0.8135612216307089, "number": 8801, "precision": 0.8026315789473685, "recall": 0.8247926372003181 }, "eval_QTY": { "f1": 0.9874235930583853, "number": 7088, "precision": 0.9834849545136459, "recall": 0.9913939051918735 }, "eval_RANGE_END": { "f1": 0.7788461538461537, "number": 91, "precision": 0.6923076923076923, "recall": 0.8901098901098901 }, "eval_UNIT": { "f1": 0.9532153793807416, "number": 5697, "precision": 0.9247400561148704, "recall": 0.9835000877654906 }, "eval_loss": 0.8807578682899475, "eval_overall_accuracy": 0.8429172510518934, "eval_overall_f1": 0.8681558902893056, "eval_overall_precision": 0.8432419879238272, "eval_overall_recall": 0.8945867943122624, "eval_runtime": 10.211, "eval_samples_per_second": 833.024, "eval_steps_per_second": 26.05, "step": 25000 }, { "epoch": 5.0, "step": 25255, "total_flos": 3120524263271436.0, "train_loss": 0.8656694423182368, "train_runtime": 2424.3674, "train_samples_per_second": 333.289, "train_steps_per_second": 10.417 } ], "logging_steps": 500, "max_steps": 25255, "num_train_epochs": 5, "save_steps": 1000, "total_flos": 3120524263271436.0, "trial_name": null, "trial_params": null }