{ "best_metric": 0.9796159267425537, "best_model_checkpoint": "nyt-ingredient-tagger-jina-embeddings-v2-small-en/checkpoint-25000", "epoch": 5.0, "eval_steps": 1000, "global_step": 25255, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.1, "learning_rate": 4.9010097010492975e-05, "loss": 1.3131, "step": 500 }, { "epoch": 0.2, "learning_rate": 4.802019402098595e-05, "loss": 1.1585, "step": 1000 }, { "epoch": 0.2, "eval_COMMENT": { "f1": 0.454561770864493, "number": 6836, "precision": 0.38455309241826097, "recall": 0.5557343475716794 }, "eval_NAME": { "f1": 0.7002083333333333, "number": 8859, "precision": 0.6500338458563002, "recall": 0.7587763855965685 }, "eval_QTY": { "f1": 0.9200849140587551, "number": 7095, "precision": 0.8947789025039957, "recall": 0.9468639887244539 }, "eval_RANGE_END": { "f1": 0.0, "number": 74, "precision": 0.0, "recall": 0.0 }, "eval_UNIT": { "f1": 0.912968864917872, "number": 5723, "precision": 0.8575376112987412, "recall": 0.9760615062030403 }, "eval_loss": 1.1246980428695679, "eval_overall_accuracy": 0.7220226951438505, "eval_overall_f1": 0.7265753075808941, "eval_overall_precision": 0.6665790549617429, "eval_overall_recall": 0.7984398502815965, "eval_runtime": 10.7443, "eval_samples_per_second": 791.676, "eval_steps_per_second": 24.757, "step": 1000 }, { "epoch": 0.3, "learning_rate": 4.703029103147892e-05, "loss": 1.1236, "step": 1500 }, { "epoch": 0.4, "learning_rate": 4.6040388041971886e-05, "loss": 1.1018, "step": 2000 }, { "epoch": 0.4, "eval_COMMENT": { "f1": 0.48012443829934326, "number": 6836, "precision": 0.3960273712222011, "recall": 0.6095669982445875 }, "eval_NAME": { "f1": 0.733016860369946, "number": 8859, "precision": 0.7094423320659062, "recall": 0.7582119878090078 }, "eval_QTY": { "f1": 0.9238356164383562, "number": 7095, "precision": 0.8986009327115256, "recall": 0.9505285412262157 }, "eval_RANGE_END": { "f1": 0.047619047619047616, "number": 74, "precision": 0.2, "recall": 0.02702702702702703 }, "eval_UNIT": { "f1": 0.9199999999999999, "number": 5723, "precision": 0.8794009877329935, "recall": 0.9645290931329722 }, "eval_loss": 1.0676864385604858, "eval_overall_accuracy": 0.7414702173996103, "eval_overall_f1": 0.7423559781301609, "eval_overall_precision": 0.6852761825824404, "eval_overall_recall": 0.8098086542834155, "eval_runtime": 8.0746, "eval_samples_per_second": 1053.43, "eval_steps_per_second": 32.943, "step": 2000 }, { "epoch": 0.49, "learning_rate": 4.505048505246486e-05, "loss": 1.0885, "step": 2500 }, { "epoch": 0.59, "learning_rate": 4.406058206295783e-05, "loss": 1.0676, "step": 3000 }, { "epoch": 0.59, "eval_COMMENT": { "f1": 0.4957528957528958, "number": 6836, "precision": 0.41734173417341736, "recall": 0.6104447045055588 }, "eval_NAME": { "f1": 0.7383297644539616, "number": 8859, "precision": 0.7021688219122288, "recall": 0.7784174286036799 }, "eval_QTY": { "f1": 0.9259863945578231, "number": 7095, "precision": 0.8949375410913872, "recall": 0.9592670894996477 }, "eval_RANGE_END": { "f1": 0.3047619047619048, "number": 74, "precision": 0.5161290322580645, "recall": 0.21621621621621623 }, "eval_UNIT": { "f1": 0.9193198866477745, "number": 5723, "precision": 0.8788844621513944, "recall": 0.9636554254761489 }, "eval_loss": 1.0472389459609985, "eval_overall_accuracy": 0.7540595269934666, "eval_overall_f1": 0.7511794345133026, "eval_overall_precision": 0.6939017520974771, "eval_overall_recall": 0.8187637737433099, "eval_runtime": 7.2751, "eval_samples_per_second": 1169.193, "eval_steps_per_second": 36.563, "step": 3000 }, { "epoch": 0.69, "learning_rate": 4.3070679073450804e-05, "loss": 1.0667, "step": 3500 }, { "epoch": 0.79, "learning_rate": 4.208077608394378e-05, "loss": 1.0613, "step": 4000 }, { "epoch": 0.79, "eval_COMMENT": { "f1": 0.5095226317091268, "number": 6836, "precision": 0.4413024850042845, "recall": 0.6026916325336454 }, "eval_NAME": { "f1": 0.7497392545424604, "number": 8859, "precision": 0.7297499465697799, "recall": 0.7708544982503669 }, "eval_QTY": { "f1": 0.9260893546607832, "number": 7095, "precision": 0.9064651100013497, "recall": 0.9465821000704722 }, "eval_RANGE_END": { "f1": 0.23214285714285715, "number": 74, "precision": 0.34210526315789475, "recall": 0.17567567567567569 }, "eval_UNIT": { "f1": 0.9216135881104034, "number": 5723, "precision": 0.8965631196298744, "recall": 0.9481041411846933 }, "eval_loss": 1.045949101448059, "eval_overall_accuracy": 0.7502196920490581, "eval_overall_f1": 0.7602500822639027, "eval_overall_precision": 0.717671543503246, "eval_overall_recall": 0.8081995312554657, "eval_runtime": 9.0484, "eval_samples_per_second": 940.052, "eval_steps_per_second": 29.397, "step": 4000 }, { "epoch": 0.89, "learning_rate": 4.109087309443675e-05, "loss": 1.0532, "step": 4500 }, { "epoch": 0.99, "learning_rate": 4.010097010492972e-05, "loss": 1.045, "step": 5000 }, { "epoch": 0.99, "eval_COMMENT": { "f1": 0.5115396388123661, "number": 6836, "precision": 0.43983577218654596, "recall": 0.6111761263897015 }, "eval_NAME": { "f1": 0.7500674909562118, "number": 8859, "precision": 0.7188987787207618, "recall": 0.7840614064792866 }, "eval_QTY": { "f1": 0.9248702917593155, "number": 7095, "precision": 0.886005680351149, "recall": 0.9673009161381254 }, "eval_RANGE_END": { "f1": 0.27868852459016397, "number": 74, "precision": 0.3541666666666667, "recall": 0.22972972972972974 }, "eval_UNIT": { "f1": 0.9236628580890875, "number": 5723, "precision": 0.8777340676632572, "recall": 0.974663637952123 }, "eval_loss": 1.029239296913147, "eval_overall_accuracy": 0.7610323615940091, "eval_overall_f1": 0.7619755400100165, "eval_overall_precision": 0.7079555688982287, "eval_overall_recall": 0.8249204183719873, "eval_runtime": 10.4805, "eval_samples_per_second": 811.605, "eval_steps_per_second": 25.381, "step": 5000 }, { "epoch": 1.09, "learning_rate": 3.911106711542269e-05, "loss": 1.0391, "step": 5500 }, { "epoch": 1.19, "learning_rate": 3.812116412591566e-05, "loss": 1.0334, "step": 6000 }, { "epoch": 1.19, "eval_COMMENT": { "f1": 0.5539883268482491, "number": 6836, "precision": 0.47399084477736164, "recall": 0.6664716208308953 }, "eval_NAME": { "f1": 0.7479798253701395, "number": 8859, "precision": 0.7198329853862213, "recall": 0.7784174286036799 }, "eval_QTY": { "f1": 0.92860166502046, "number": 7095, "precision": 0.9296510806611104, "recall": 0.927554615926709 }, "eval_RANGE_END": { "f1": 0.3283582089552239, "number": 74, "precision": 0.36666666666666664, "recall": 0.2972972972972973 }, "eval_UNIT": { "f1": 0.9286739258884106, "number": 5723, "precision": 0.8982691051600261, "recall": 0.9612091560370435 }, "eval_loss": 1.034406065940857, "eval_overall_accuracy": 0.759465861765942, "eval_overall_f1": 0.7717964680056355, "eval_overall_precision": 0.7258049607148359, "eval_overall_recall": 0.8240109140518418, "eval_runtime": 8.1039, "eval_samples_per_second": 1049.615, "eval_steps_per_second": 32.824, "step": 6000 }, { "epoch": 1.29, "learning_rate": 3.7131261136408633e-05, "loss": 1.026, "step": 6500 }, { "epoch": 1.39, "learning_rate": 3.6141358146901606e-05, "loss": 1.0187, "step": 7000 }, { "epoch": 1.39, "eval_COMMENT": { "f1": 0.5136793031529874, "number": 6836, "precision": 0.4423198816818086, "recall": 0.6124926857811586 }, "eval_NAME": { "f1": 0.751153062318996, "number": 8859, "precision": 0.7155410238070911, "recall": 0.7904955412574782 }, "eval_QTY": { "f1": 0.9245735607675907, "number": 7095, "precision": 0.8767850372804247, "recall": 0.9778717406624383 }, "eval_RANGE_END": { "f1": 0.23853211009174313, "number": 74, "precision": 0.37142857142857144, "recall": 0.17567567567567569 }, "eval_UNIT": { "f1": 0.927461139896373, "number": 5723, "precision": 0.8888354957552459, "recall": 0.9695963655425476 }, "eval_loss": 1.021018385887146, "eval_overall_accuracy": 0.7651014404156956, "eval_overall_f1": 0.7638116425658138, "eval_overall_precision": 0.7083482836981222, "eval_overall_recall": 0.8286983593941302, "eval_runtime": 7.3061, "eval_samples_per_second": 1164.235, "eval_steps_per_second": 36.408, "step": 7000 }, { "epoch": 1.48, "learning_rate": 3.515145515739457e-05, "loss": 1.0186, "step": 7500 }, { "epoch": 1.58, "learning_rate": 3.416155216788755e-05, "loss": 1.0319, "step": 8000 }, { "epoch": 1.58, "eval_COMMENT": { "f1": 0.5439773496645535, "number": 6836, "precision": 0.46955690149824675, "recall": 0.6464306612053833 }, "eval_NAME": { "f1": 0.7617639003012875, "number": 8859, "precision": 0.7399957428693061, "recall": 0.7848515633818716 }, "eval_QTY": { "f1": 0.9297781396295542, "number": 7095, "precision": 0.8963893249607535, "recall": 0.9657505285412262 }, "eval_RANGE_END": { "f1": 0.368, "number": 74, "precision": 0.45098039215686275, "recall": 0.3108108108108108 }, "eval_UNIT": { "f1": 0.9286800743620078, "number": 5723, "precision": 0.8991981672394044, "recall": 0.9601607548488555 }, "eval_loss": 1.0136394500732422, "eval_overall_accuracy": 0.7699919764642953, "eval_overall_f1": 0.7758823529411765, "eval_overall_precision": 0.727991905068531, "eval_overall_recall": 0.8305173680344212, "eval_runtime": 9.7068, "eval_samples_per_second": 876.293, "eval_steps_per_second": 27.403, "step": 8000 }, { "epoch": 1.68, "learning_rate": 3.317164917838052e-05, "loss": 1.0243, "step": 8500 }, { "epoch": 1.78, "learning_rate": 3.218174618887349e-05, "loss": 1.0154, "step": 9000 }, { "epoch": 1.78, "eval_COMMENT": { "f1": 0.5554884675763797, "number": 6836, "precision": 0.47295907875796833, "recall": 0.6729081334113517 }, "eval_NAME": { "f1": 0.7644151565074134, "number": 8859, "precision": 0.7443054218800128, "recall": 0.7856417202844564 }, "eval_QTY": { "f1": 0.9317274604267033, "number": 7095, "precision": 0.9104236718224613, "recall": 0.9540521494009866 }, "eval_RANGE_END": { "f1": 0.3795620437956204, "number": 74, "precision": 0.4126984126984127, "recall": 0.35135135135135137 }, "eval_UNIT": { "f1": 0.9292205085452273, "number": 5723, "precision": 0.8885522959183674, "recall": 0.9737899702952997 }, "eval_loss": 1.0071077346801758, "eval_overall_accuracy": 0.7732204944026286, "eval_overall_f1": 0.7789823224924309, "eval_overall_precision": 0.7284683532742716, "eval_overall_recall": 0.8370238220170008, "eval_runtime": 10.018, "eval_samples_per_second": 849.074, "eval_steps_per_second": 26.552, "step": 9000 }, { "epoch": 1.88, "learning_rate": 3.119184319936647e-05, "loss": 1.0185, "step": 9500 }, { "epoch": 1.98, "learning_rate": 3.0201940209859435e-05, "loss": 1.011, "step": 10000 }, { "epoch": 1.98, "eval_COMMENT": { "f1": 0.5534477566997892, "number": 6836, "precision": 0.4703654417033473, "recall": 0.6721767115272089 }, "eval_NAME": { "f1": 0.7638995503892971, "number": 8859, "precision": 0.742723104808615, "recall": 0.7863189976295293 }, "eval_QTY": { "f1": 0.9353837666367836, "number": 7095, "precision": 0.915743991358358, "recall": 0.9558844256518675 }, "eval_RANGE_END": { "f1": 0.3384615384615385, "number": 74, "precision": 0.39285714285714285, "recall": 0.2972972972972973 }, "eval_UNIT": { "f1": 0.9314305016044586, "number": 5723, "precision": 0.901291060630822, "recall": 0.9636554254761489 }, "eval_loss": 1.0126872062683105, "eval_overall_accuracy": 0.7711955068200054, "eval_overall_f1": 0.7789157805466762, "eval_overall_precision": 0.7296281585138562, "eval_overall_recall": 0.8353447371182705, "eval_runtime": 7.6383, "eval_samples_per_second": 1113.597, "eval_steps_per_second": 34.824, "step": 10000 }, { "epoch": 2.08, "learning_rate": 2.9212037220352405e-05, "loss": 1.0062, "step": 10500 }, { "epoch": 2.18, "learning_rate": 2.8222134230845377e-05, "loss": 0.9958, "step": 11000 }, { "epoch": 2.18, "eval_COMMENT": { "f1": 0.5524928818077179, "number": 6836, "precision": 0.4715127701375246, "recall": 0.6670567583382094 }, "eval_NAME": { "f1": 0.7657111356119073, "number": 8859, "precision": 0.7483029845921776, "recall": 0.7839485269217744 }, "eval_QTY": { "f1": 0.9343237989447376, "number": 7095, "precision": 0.9206457791763579, "recall": 0.9484143763213531 }, "eval_RANGE_END": { "f1": 0.36363636363636365, "number": 74, "precision": 0.35, "recall": 0.3783783783783784 }, "eval_UNIT": { "f1": 0.9317363263254879, "number": 5723, "precision": 0.8947876447876448, "recall": 0.9718679014502883 }, "eval_loss": 1.0023564100265503, "eval_overall_accuracy": 0.7762770794330035, "eval_overall_f1": 0.7792751537354442, "eval_overall_precision": 0.7317627545535522, "eval_overall_recall": 0.8333858047364187, "eval_runtime": 8.2445, "eval_samples_per_second": 1031.712, "eval_steps_per_second": 32.264, "step": 11000 }, { "epoch": 2.28, "learning_rate": 2.7232231241338353e-05, "loss": 0.9969, "step": 11500 }, { "epoch": 2.38, "learning_rate": 2.6242328251831323e-05, "loss": 1.0042, "step": 12000 }, { "epoch": 2.38, "eval_COMMENT": { "f1": 0.5542747950440732, "number": 6836, "precision": 0.4789602641951635, "recall": 0.657694558221182 }, "eval_NAME": { "f1": 0.7601839329185826, "number": 8859, "precision": 0.7298981923955953, "recall": 0.7930917710802574 }, "eval_QTY": { "f1": 0.9347491965907503, "number": 7095, "precision": 0.9267211525141986, "recall": 0.9429175475687104 }, "eval_RANGE_END": { "f1": 0.3902439024390244, "number": 74, "precision": 0.35555555555555557, "recall": 0.43243243243243246 }, "eval_UNIT": { "f1": 0.932516381584546, "number": 5723, "precision": 0.9089250165892502, "recall": 0.9573650183470208 }, "eval_loss": 1.0006664991378784, "eval_overall_accuracy": 0.7768883964390785, "eval_overall_f1": 0.7786074142146806, "eval_overall_precision": 0.733323029366306, "eval_overall_recall": 0.8298527302620072, "eval_runtime": 10.2957, "eval_samples_per_second": 826.172, "eval_steps_per_second": 25.836, "step": 12000 }, { "epoch": 2.47, "learning_rate": 2.5252425262324292e-05, "loss": 1.0, "step": 12500 }, { "epoch": 2.57, "learning_rate": 2.4262522272817265e-05, "loss": 1.0048, "step": 13000 }, { "epoch": 2.57, "eval_COMMENT": { "f1": 0.542151434082001, "number": 6836, "precision": 0.47168994262206343, "recall": 0.6373610298420129 }, "eval_NAME": { "f1": 0.7605572485851111, "number": 8859, "precision": 0.7342649994746243, "recall": 0.7888023478947963 }, "eval_QTY": { "f1": 0.9334144527817211, "number": 7095, "precision": 0.8968563263185243, "recall": 0.9730796335447498 }, "eval_RANGE_END": { "f1": 0.4028776978417266, "number": 74, "precision": 0.4307692307692308, "recall": 0.3783783783783784 }, "eval_UNIT": { "f1": 0.9308501753799899, "number": 5723, "precision": 0.8915373540233562, "recall": 0.9737899702952997 }, "eval_loss": 0.9942804574966431, "eval_overall_accuracy": 0.7787414511137432, "eval_overall_f1": 0.777442751202021, "eval_overall_precision": 0.72784423828125, "eval_overall_recall": 0.8342953090565641, "eval_runtime": 9.9772, "eval_samples_per_second": 852.54, "eval_steps_per_second": 26.661, "step": 13000 }, { "epoch": 2.67, "learning_rate": 2.3272619283310237e-05, "loss": 0.9991, "step": 13500 }, { "epoch": 2.77, "learning_rate": 2.2282716293803206e-05, "loss": 0.9911, "step": 14000 }, { "epoch": 2.77, "eval_COMMENT": { "f1": 0.5497025285076846, "number": 6836, "precision": 0.4768817204301075, "recall": 0.6487712112346401 }, "eval_NAME": { "f1": 0.7610256410256411, "number": 8859, "precision": 0.729257190151045, "recall": 0.7956880009030365 }, "eval_QTY": { "f1": 0.9355014287658184, "number": 7095, "precision": 0.9042483230303827, "recall": 0.9689922480620154 }, "eval_RANGE_END": { "f1": 0.4132231404958678, "number": 74, "precision": 0.5319148936170213, "recall": 0.33783783783783783 }, "eval_UNIT": { "f1": 0.9322147651006711, "number": 5723, "precision": 0.8965628529933839, "recall": 0.9708195002621003 }, "eval_loss": 0.9951051473617554, "eval_overall_accuracy": 0.7786077255186643, "eval_overall_f1": 0.7798045602605863, "eval_overall_precision": 0.7295888824551245, "eval_overall_recall": 0.8374435932416833, "eval_runtime": 11.0903, "eval_samples_per_second": 766.978, "eval_steps_per_second": 23.985, "step": 14000 }, { "epoch": 2.87, "learning_rate": 2.129281330429618e-05, "loss": 0.9912, "step": 14500 }, { "epoch": 2.97, "learning_rate": 2.0302910314789152e-05, "loss": 0.9991, "step": 15000 }, { "epoch": 2.97, "eval_COMMENT": { "f1": 0.5583836904107916, "number": 6836, "precision": 0.4791033832617576, "recall": 0.6691047396138092 }, "eval_NAME": { "f1": 0.7690366469168313, "number": 8859, "precision": 0.7481054541573273, "recall": 0.7911728186025511 }, "eval_QTY": { "f1": 0.935168616655196, "number": 7095, "precision": 0.9137861466039005, "recall": 0.9575757575757575 }, "eval_RANGE_END": { "f1": 0.4109589041095891, "number": 74, "precision": 0.4166666666666667, "recall": 0.40540540540540543 }, "eval_UNIT": { "f1": 0.9313129631171426, "number": 5723, "precision": 0.8894720101781171, "recall": 0.977284640922593 }, "eval_loss": 0.9920729398727417, "eval_overall_accuracy": 0.7806709204141673, "eval_overall_f1": 0.783059806192698, "eval_overall_precision": 0.7336981443551099, "eval_overall_recall": 0.839542449365096, "eval_runtime": 9.9635, "eval_samples_per_second": 853.712, "eval_steps_per_second": 26.697, "step": 15000 }, { "epoch": 3.07, "learning_rate": 1.9313007325282124e-05, "loss": 0.9903, "step": 15500 }, { "epoch": 3.17, "learning_rate": 1.8323104335775097e-05, "loss": 0.9805, "step": 16000 }, { "epoch": 3.17, "eval_COMMENT": { "f1": 0.5583219220714553, "number": 6836, "precision": 0.4859154929577465, "recall": 0.6560854300760679 }, "eval_NAME": { "f1": 0.7669049828084921, "number": 8859, "precision": 0.7423922231614539, "recall": 0.7930917710802574 }, "eval_QTY": { "f1": 0.9368610113290964, "number": 7095, "precision": 0.9187102018696653, "recall": 0.9557434813248766 }, "eval_RANGE_END": { "f1": 0.4087591240875913, "number": 74, "precision": 0.4444444444444444, "recall": 0.3783783783783784 }, "eval_UNIT": { "f1": 0.9333669863705198, "number": 5723, "precision": 0.9000486775920817, "recall": 0.9692468984798183 }, "eval_loss": 0.987960696220398, "eval_overall_accuracy": 0.7821992129293547, "eval_overall_f1": 0.783963999474445, "eval_overall_precision": 0.7388935327079657, "eval_overall_recall": 0.8348899849581978, "eval_runtime": 9.4297, "eval_samples_per_second": 902.044, "eval_steps_per_second": 28.209, "step": 16000 }, { "epoch": 3.27, "learning_rate": 1.7333201346268066e-05, "loss": 0.9868, "step": 16500 }, { "epoch": 3.37, "learning_rate": 1.634329835676104e-05, "loss": 0.9848, "step": 17000 }, { "epoch": 3.37, "eval_COMMENT": { "f1": 0.5623249735515589, "number": 6836, "precision": 0.48933174482833314, "recall": 0.6609128145114102 }, "eval_NAME": { "f1": 0.7673142355394577, "number": 8859, "precision": 0.7466623945316672, "recall": 0.7891409865673327 }, "eval_QTY": { "f1": 0.936261013215859, "number": 7095, "precision": 0.9149737656397148, "recall": 0.9585623678646934 }, "eval_RANGE_END": { "f1": 0.3795620437956204, "number": 74, "precision": 0.4126984126984127, "recall": 0.35135135135135137 }, "eval_UNIT": { "f1": 0.9321663019693655, "number": 5723, "precision": 0.899171943497321, "recall": 0.9676742966975362 }, "eval_loss": 0.9842170476913452, "eval_overall_accuracy": 0.7823902494937531, "eval_overall_f1": 0.7848384233538249, "eval_overall_precision": 0.7402561160894235, "eval_overall_recall": 0.8351348515059293, "eval_runtime": 7.8716, "eval_samples_per_second": 1080.599, "eval_steps_per_second": 33.793, "step": 17000 }, { "epoch": 3.46, "learning_rate": 1.535339536725401e-05, "loss": 0.9841, "step": 17500 }, { "epoch": 3.56, "learning_rate": 1.4363492377746981e-05, "loss": 0.9771, "step": 18000 }, { "epoch": 3.56, "eval_COMMENT": { "f1": 0.5630382256365777, "number": 6836, "precision": 0.4883396023643203, "recall": 0.6647162083089526 }, "eval_NAME": { "f1": 0.7652202248411449, "number": 8859, "precision": 0.7373874816830647, "recall": 0.795236482672988 }, "eval_QTY": { "f1": 0.9356418569359177, "number": 7095, "precision": 0.9162388543636855, "recall": 0.9558844256518675 }, "eval_RANGE_END": { "f1": 0.4520547945205479, "number": 74, "precision": 0.4583333333333333, "recall": 0.44594594594594594 }, "eval_UNIT": { "f1": 0.9327950206072841, "number": 5723, "precision": 0.8992864093415505, "recall": 0.968897431417089 }, "eval_loss": 0.983447253704071, "eval_overall_accuracy": 0.7836510908187827, "eval_overall_f1": 0.7841076515077104, "eval_overall_precision": 0.7369149819994462, "eval_overall_recall": 0.8377584216601952, "eval_runtime": 9.9588, "eval_samples_per_second": 854.123, "eval_steps_per_second": 26.71, "step": 18000 }, { "epoch": 3.66, "learning_rate": 1.3373589388239954e-05, "loss": 0.9815, "step": 18500 }, { "epoch": 3.76, "learning_rate": 1.2383686398732925e-05, "loss": 0.9787, "step": 19000 }, { "epoch": 3.76, "eval_COMMENT": { "f1": 0.5682919349892671, "number": 6836, "precision": 0.4892808110676946, "recall": 0.677735517846694 }, "eval_NAME": { "f1": 0.7695169319984682, "number": 8859, "precision": 0.7466029723991507, "recall": 0.7938819279828423 }, "eval_QTY": { "f1": 0.9372361774271676, "number": 7095, "precision": 0.9206090266449157, "recall": 0.9544749823819592 }, "eval_RANGE_END": { "f1": 0.4189189189189189, "number": 74, "precision": 0.4189189189189189, "recall": 0.4189189189189189 }, "eval_UNIT": { "f1": 0.9332317847169331, "number": 5723, "precision": 0.9048244174597965, "recall": 0.9634806919447843 }, "eval_loss": 0.9832035899162292, "eval_overall_accuracy": 0.7843961334199365, "eval_overall_f1": 0.786327868852459, "eval_overall_precision": 0.7399191682349675, "eval_overall_recall": 0.8389477734634624, "eval_runtime": 10.5172, "eval_samples_per_second": 808.772, "eval_steps_per_second": 25.292, "step": 19000 }, { "epoch": 3.86, "learning_rate": 1.1393783409225896e-05, "loss": 0.9744, "step": 19500 }, { "epoch": 3.96, "learning_rate": 1.0403880419718868e-05, "loss": 0.9746, "step": 20000 }, { "epoch": 3.96, "eval_COMMENT": { "f1": 0.5697782746413266, "number": 6836, "precision": 0.4950890447922288, "recall": 0.6710064365125804 }, "eval_NAME": { "f1": 0.768101654069449, "number": 8859, "precision": 0.7460368124268539, "recall": 0.7915114572750874 }, "eval_QTY": { "f1": 0.9370073342929603, "number": 7095, "precision": 0.9120629837203096, "recall": 0.9633544749823819 }, "eval_RANGE_END": { "f1": 0.43312101910828027, "number": 74, "precision": 0.40963855421686746, "recall": 0.4594594594594595 }, "eval_UNIT": { "f1": 0.9337932194834694, "number": 5723, "precision": 0.9003893575600259, "recall": 0.9697710990739122 }, "eval_loss": 0.9827048778533936, "eval_overall_accuracy": 0.7846444809536546, "eval_overall_f1": 0.7875786988457503, "eval_overall_precision": 0.7411819163709304, "eval_overall_recall": 0.8401721062021198, "eval_runtime": 8.1048, "eval_samples_per_second": 1049.503, "eval_steps_per_second": 32.82, "step": 20000 }, { "epoch": 4.06, "learning_rate": 9.41397743021184e-06, "loss": 0.9818, "step": 20500 }, { "epoch": 4.16, "learning_rate": 8.424074440704812e-06, "loss": 0.976, "step": 21000 }, { "epoch": 4.16, "eval_COMMENT": { "f1": 0.5667608401916225, "number": 6836, "precision": 0.4884607241160279, "recall": 0.6749561146869514 }, "eval_NAME": { "f1": 0.7705115565779385, "number": 8859, "precision": 0.7483774869666986, "recall": 0.7939948075403545 }, "eval_QTY": { "f1": 0.936799394814662, "number": 7095, "precision": 0.9147193123824873, "recall": 0.9599718111346018 }, "eval_RANGE_END": { "f1": 0.42857142857142855, "number": 74, "precision": 0.4125, "recall": 0.44594594594594594 }, "eval_UNIT": { "f1": 0.9335247909451813, "number": 5723, "precision": 0.9035317200784827, "recall": 0.9655774943211602 }, "eval_loss": 0.9835863709449768, "eval_overall_accuracy": 0.7854086272112483, "eval_overall_f1": 0.7865212692798899, "eval_overall_precision": 0.7393111090590082, "eval_overall_recall": 0.8401721062021198, "eval_runtime": 10.4319, "eval_samples_per_second": 815.38, "eval_steps_per_second": 25.499, "step": 21000 }, { "epoch": 4.26, "learning_rate": 7.434171451197783e-06, "loss": 0.9902, "step": 21500 }, { "epoch": 4.36, "learning_rate": 6.444268461690754e-06, "loss": 0.9635, "step": 22000 }, { "epoch": 4.36, "eval_COMMENT": { "f1": 0.5716760502381983, "number": 6836, "precision": 0.49533612093920876, "recall": 0.6758338209479228 }, "eval_NAME": { "f1": 0.7705016685814322, "number": 8859, "precision": 0.7475583864118895, "recall": 0.7948978440004515 }, "eval_QTY": { "f1": 0.9371633752244165, "number": 7095, "precision": 0.9186408555570597, "recall": 0.9564482029598309 }, "eval_RANGE_END": { "f1": 0.43373493975903615, "number": 74, "precision": 0.391304347826087, "recall": 0.4864864864864865 }, "eval_UNIT": { "f1": 0.9337832138338253, "number": 5723, "precision": 0.9026418786692759, "recall": 0.9671500961034423 }, "eval_loss": 0.9831692576408386, "eval_overall_accuracy": 0.7850838650517709, "eval_overall_f1": 0.7882188858807121, "eval_overall_precision": 0.7422893874775944, "eval_overall_recall": 0.84020708713751, "eval_runtime": 9.9258, "eval_samples_per_second": 856.957, "eval_steps_per_second": 26.799, "step": 22000 }, { "epoch": 4.45, "learning_rate": 5.4543654721837265e-06, "loss": 0.967, "step": 22500 }, { "epoch": 4.55, "learning_rate": 4.4644624826766974e-06, "loss": 0.9688, "step": 23000 }, { "epoch": 4.55, "eval_COMMENT": { "f1": 0.5723930522310194, "number": 6836, "precision": 0.4930739135032251, "recall": 0.6821240491515506 }, "eval_NAME": { "f1": 0.7698282463625424, "number": 8859, "precision": 0.7467897697124058, "recall": 0.7943334462128908 }, "eval_QTY": { "f1": 0.9373659076752716, "number": 7095, "precision": 0.9208593962469405, "recall": 0.9544749823819592 }, "eval_RANGE_END": { "f1": 0.4301075268817204, "number": 74, "precision": 0.35714285714285715, "recall": 0.5405405405405406 }, "eval_UNIT": { "f1": 0.9337379868487607, "number": 5723, "precision": 0.9021013194331324, "recall": 0.9676742966975362 }, "eval_loss": 0.9836147427558899, "eval_overall_accuracy": 0.7860008405608834, "eval_overall_f1": 0.7875949698716269, "eval_overall_precision": 0.7403416961674619, "eval_overall_recall": 0.8412914961346066, "eval_runtime": 8.0875, "eval_samples_per_second": 1051.747, "eval_steps_per_second": 32.89, "step": 23000 }, { "epoch": 4.65, "learning_rate": 3.4745594931696697e-06, "loss": 0.9686, "step": 23500 }, { "epoch": 4.75, "learning_rate": 2.484656503662641e-06, "loss": 0.9669, "step": 24000 }, { "epoch": 4.75, "eval_COMMENT": { "f1": 0.5733910891089109, "number": 6836, "precision": 0.4968897468897469, "recall": 0.677735517846694 }, "eval_NAME": { "f1": 0.7695764151460354, "number": 8859, "precision": 0.7478168264110756, "recall": 0.7926402528502088 }, "eval_QTY": { "f1": 0.9377799214497348, "number": 7095, "precision": 0.9173631706659477, "recall": 0.9591261451726568 }, "eval_RANGE_END": { "f1": 0.43902439024390244, "number": 74, "precision": 0.4, "recall": 0.4864864864864865 }, "eval_UNIT": { "f1": 0.9331987211845869, "number": 5723, "precision": 0.8998864189518092, "recall": 0.9690721649484536 }, "eval_loss": 0.9803335070610046, "eval_overall_accuracy": 0.7873189928552325, "eval_overall_f1": 0.7886242865577643, "eval_overall_precision": 0.7423807318202872, "eval_overall_recall": 0.8410116486514849, "eval_runtime": 11.2838, "eval_samples_per_second": 753.825, "eval_steps_per_second": 23.574, "step": 24000 }, { "epoch": 4.85, "learning_rate": 1.4947535141556129e-06, "loss": 0.965, "step": 24500 }, { "epoch": 4.95, "learning_rate": 5.048505246485845e-07, "loss": 0.9691, "step": 25000 }, { "epoch": 4.95, "eval_COMMENT": { "f1": 0.5725781491798204, "number": 6836, "precision": 0.4962978860392746, "recall": 0.6765652428320655 }, "eval_NAME": { "f1": 0.7694330320460149, "number": 8859, "precision": 0.7474457215836526, "recall": 0.7927531324077209 }, "eval_QTY": { "f1": 0.9377026560883062, "number": 7095, "precision": 0.9183783783783783, "recall": 0.9578576462297392 }, "eval_RANGE_END": { "f1": 0.4484848484848485, "number": 74, "precision": 0.4065934065934066, "recall": 0.5 }, "eval_UNIT": { "f1": 0.933075174678003, "number": 5723, "precision": 0.9002599090318388, "recall": 0.968373230822995 }, "eval_loss": 0.9796159267425537, "eval_overall_accuracy": 0.7870897489779544, "eval_overall_f1": 0.7882984134276199, "eval_overall_precision": 0.7423212409616217, "eval_overall_recall": 0.8403470108790709, "eval_runtime": 8.9053, "eval_samples_per_second": 955.162, "eval_steps_per_second": 29.87, "step": 25000 }, { "epoch": 5.0, "step": 25255, "total_flos": 1840716078790068.0, "train_loss": 1.016139645029875, "train_runtime": 1364.1405, "train_samples_per_second": 592.325, "train_steps_per_second": 18.513 } ], "logging_steps": 500, "max_steps": 25255, "num_train_epochs": 5, "save_steps": 1000, "total_flos": 1840716078790068.0, "trial_name": null, "trial_params": null }