{ "best_metric": 2.1034367084503174, "best_model_checkpoint": "nyt_ingredients-crf-tagger-gte-small-L3-ingredient-v2/checkpoint-40000", "epoch": 10.0, "eval_steps": 1000, "global_step": 50510, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.1, "learning_rate": 4.9505048505246485e-05, "loss": 6.8194, "step": 500 }, { "epoch": 0.2, "learning_rate": 4.9010097010492975e-05, "loss": 4.134, "step": 1000 }, { "epoch": 0.2, "eval_COMMENT": { "f1": 0.5763258721516435, "number": 6854, "precision": 0.5343387760189455, "recall": 0.6254741756638459 }, "eval_NAME": { "f1": 0.78330041694097, "number": 8845, "precision": 0.7608440797186401, "recall": 0.8071226681741097 }, "eval_QTY": { "f1": 0.9729431253451132, "number": 7152, "precision": 0.960741548527808, "recall": 0.9854586129753915 }, "eval_RANGE_END": { "f1": 0.0, "number": 105, "precision": 0.0, "recall": 0.0 }, "eval_UNIT": { "f1": 0.9476944253269098, "number": 5646, "precision": 0.921378387420542, "recall": 0.975557917109458 }, "eval_loss": 3.7770841121673584, "eval_overall_accuracy": 0.7948864068079933, "eval_overall_f1": 0.8085364620208354, "eval_overall_precision": 0.7806640625, "eval_overall_recall": 0.8384728340675477, "eval_runtime": 11.1289, "eval_samples_per_second": 764.316, "eval_steps_per_second": 23.902, "step": 1000 }, { "epoch": 0.3, "learning_rate": 4.851514551573946e-05, "loss": 3.7402, "step": 1500 }, { "epoch": 0.4, "learning_rate": 4.802019402098595e-05, "loss": 3.5226, "step": 2000 }, { "epoch": 0.4, "eval_COMMENT": { "f1": 0.6215112776922562, "number": 6854, "precision": 0.5741313218746136, "recall": 0.6774146483805077 }, "eval_NAME": { "f1": 0.7914056489724146, "number": 8845, "precision": 0.7699133967710895, "recall": 0.8141322781232334 }, "eval_QTY": { "f1": 0.9796598403332176, "number": 7152, "precision": 0.9728388253136633, "recall": 0.9865771812080537 }, "eval_RANGE_END": { "f1": 0.6425339366515838, "number": 105, "precision": 0.6120689655172413, "recall": 0.6761904761904762 }, "eval_UNIT": { "f1": 0.9472432248746921, "number": 5646, "precision": 0.9102040816326531, "recall": 0.9874247254693589 }, "eval_loss": 3.3654797077178955, "eval_overall_accuracy": 0.8063976901451257, "eval_overall_f1": 0.8245767266863746, "eval_overall_precision": 0.7934958298312537, "eval_overall_recall": 0.8581917348437172, "eval_runtime": 11.014, "eval_samples_per_second": 772.292, "eval_steps_per_second": 24.151, "step": 2000 }, { "epoch": 0.49, "learning_rate": 4.752524252623243e-05, "loss": 3.3189, "step": 2500 }, { "epoch": 0.59, "learning_rate": 4.703029103147892e-05, "loss": 3.1948, "step": 3000 }, { "epoch": 0.59, "eval_COMMENT": { "f1": 0.6503977349332615, "number": 6854, "precision": 0.6045112781954888, "recall": 0.7038225853516195 }, "eval_NAME": { "f1": 0.8008250181169521, "number": 8845, "precision": 0.7898614471079833, "recall": 0.8120972300734879 }, "eval_QTY": { "f1": 0.9830792896098447, "number": 7152, "precision": 0.9832167832167832, "recall": 0.9829418344519015 }, "eval_RANGE_END": { "f1": 0.7035573122529643, "number": 105, "precision": 0.6013513513513513, "recall": 0.8476190476190476 }, "eval_UNIT": { "f1": 0.9492858975455399, "number": 5646, "precision": 0.9178104845377874, "recall": 0.9829968119022316 }, "eval_loss": 3.1104416847229004, "eval_overall_accuracy": 0.8160474128105767, "eval_overall_f1": 0.8361769539655378, "eval_overall_precision": 0.8112035241132187, "eval_overall_recall": 0.8627368715474443, "eval_runtime": 9.4851, "eval_samples_per_second": 896.774, "eval_steps_per_second": 28.044, "step": 3000 }, { "epoch": 0.69, "learning_rate": 4.65353395367254e-05, "loss": 3.1131, "step": 3500 }, { "epoch": 0.79, "learning_rate": 4.6040388041971886e-05, "loss": 3.0233, "step": 4000 }, { "epoch": 0.79, "eval_COMMENT": { "f1": 0.6598611678236015, "number": 6854, "precision": 0.6183673469387755, "recall": 0.7073241902538664 }, "eval_NAME": { "f1": 0.8091748251748251, "number": 8845, "precision": 0.8008859357696567, "recall": 0.8176370830977954 }, "eval_QTY": { "f1": 0.9835126449629734, "number": 7152, "precision": 0.982826026249651, "recall": 0.9842002237136466 }, "eval_RANGE_END": { "f1": 0.5851063829787234, "number": 105, "precision": 0.6626506024096386, "recall": 0.5238095238095238 }, "eval_UNIT": { "f1": 0.9505612201182417, "number": 5646, "precision": 0.9206639004149377, "recall": 0.9824654622741764 }, "eval_loss": 3.005340576171875, "eval_overall_accuracy": 0.8174150900387509, "eval_overall_f1": 0.8416805692690068, "eval_overall_precision": 0.8202057067020571, "eval_overall_recall": 0.8643101880987344, "eval_runtime": 11.0513, "eval_samples_per_second": 769.68, "eval_steps_per_second": 24.069, "step": 4000 }, { "epoch": 0.89, "learning_rate": 4.5545436547218376e-05, "loss": 2.9721, "step": 4500 }, { "epoch": 0.99, "learning_rate": 4.505048505246486e-05, "loss": 2.9567, "step": 5000 }, { "epoch": 0.99, "eval_COMMENT": { "f1": 0.677434679334917, "number": 6854, "precision": 0.633295267098084, "recall": 0.7281879194630873 }, "eval_NAME": { "f1": 0.8113767426235933, "number": 8845, "precision": 0.8036823425022183, "recall": 0.8192198982475976 }, "eval_QTY": { "f1": 0.9826323498639883, "number": 7152, "precision": 0.9803757828810021, "recall": 0.9848993288590604 }, "eval_RANGE_END": { "f1": 0.6288659793814434, "number": 105, "precision": 0.6853932584269663, "recall": 0.580952380952381 }, "eval_UNIT": { "f1": 0.9479768786127167, "number": 5646, "precision": 0.9114089571755476, "recall": 0.9876018420120439 }, "eval_loss": 2.910010814666748, "eval_overall_accuracy": 0.8215941037915052, "eval_overall_f1": 0.8462413611587509, "eval_overall_precision": 0.8226748984779954, "eval_overall_recall": 0.8711978183343823, "eval_runtime": 11.1963, "eval_samples_per_second": 759.713, "eval_steps_per_second": 23.758, "step": 5000 }, { "epoch": 1.09, "learning_rate": 4.455553355771135e-05, "loss": 2.794, "step": 5500 }, { "epoch": 1.19, "learning_rate": 4.406058206295783e-05, "loss": 2.738, "step": 6000 }, { "epoch": 1.19, "eval_COMMENT": { "f1": 0.6844883595018949, "number": 6854, "precision": 0.6383489017924766, "recall": 0.7378173329442661 }, "eval_NAME": { "f1": 0.809906216656371, "number": 8845, "precision": 0.8046195045748716, "recall": 0.8152628603730921 }, "eval_QTY": { "f1": 0.9817170663885992, "number": 7152, "precision": 0.9762201023088621, "recall": 0.9872762863534675 }, "eval_RANGE_END": { "f1": 0.7286821705426357, "number": 105, "precision": 0.6143790849673203, "recall": 0.8952380952380953 }, "eval_UNIT": { "f1": 0.9514546393527284, "number": 5646, "precision": 0.9254855994641661, "recall": 0.9789231314204747 }, "eval_loss": 2.8514182567596436, "eval_overall_accuracy": 0.8213471620697516, "eval_overall_f1": 0.8480048942967846, "eval_overall_precision": 0.8250115733086436, "eval_overall_recall": 0.8723166212152996, "eval_runtime": 8.7005, "eval_samples_per_second": 977.64, "eval_steps_per_second": 30.573, "step": 6000 }, { "epoch": 1.29, "learning_rate": 4.356563056820432e-05, "loss": 2.7896, "step": 6500 }, { "epoch": 1.39, "learning_rate": 4.3070679073450804e-05, "loss": 2.8132, "step": 7000 }, { "epoch": 1.39, "eval_COMMENT": { "f1": 0.680542242913871, "number": 6854, "precision": 0.641124871001032, "recall": 0.7251240151736212 }, "eval_NAME": { "f1": 0.8072829131652661, "number": 8845, "precision": 0.8001110494169905, "recall": 0.814584511023177 }, "eval_QTY": { "f1": 0.9839452743263996, "number": 7152, "precision": 0.9824365765263451, "recall": 0.9854586129753915 }, "eval_RANGE_END": { "f1": 0.7421875, "number": 105, "precision": 0.6291390728476821, "recall": 0.9047619047619048 }, "eval_UNIT": { "f1": 0.9518423307626392, "number": 5646, "precision": 0.9219787516600265, "recall": 0.983705278072972 }, "eval_loss": 2.776045322418213, "eval_overall_accuracy": 0.8222589468885343, "eval_overall_f1": 0.8473121210056551, "eval_overall_precision": 0.8261476117717399, "eval_overall_recall": 0.8695895391930635, "eval_runtime": 11.1273, "eval_samples_per_second": 764.429, "eval_steps_per_second": 23.905, "step": 7000 }, { "epoch": 1.48, "learning_rate": 4.257572757869729e-05, "loss": 2.7089, "step": 7500 }, { "epoch": 1.58, "learning_rate": 4.208077608394378e-05, "loss": 2.6976, "step": 8000 }, { "epoch": 1.58, "eval_COMMENT": { "f1": 0.6947368421052631, "number": 6854, "precision": 0.6535493827160493, "recall": 0.7414648380507732 }, "eval_NAME": { "f1": 0.8145306859205775, "number": 8845, "precision": 0.8127884723629405, "recall": 0.8162803843979649 }, "eval_QTY": { "f1": 0.9840759882665177, "number": 7152, "precision": 0.9831147083449623, "recall": 0.9850391498881432 }, "eval_RANGE_END": { "f1": 0.75098814229249, "number": 105, "precision": 0.6418918918918919, "recall": 0.9047619047619048 }, "eval_UNIT": { "f1": 0.9538461538461539, "number": 5646, "precision": 0.926531975288028, "recall": 0.9828196953595466 }, "eval_loss": 2.707292318344116, "eval_overall_accuracy": 0.826172023402477, "eval_overall_f1": 0.8534594631514241, "eval_overall_precision": 0.8340898471397103, "eval_overall_recall": 0.8737500874064751, "eval_runtime": 10.8076, "eval_samples_per_second": 787.041, "eval_steps_per_second": 24.612, "step": 8000 }, { "epoch": 1.68, "learning_rate": 4.158582458919026e-05, "loss": 2.6869, "step": 8500 }, { "epoch": 1.78, "learning_rate": 4.109087309443675e-05, "loss": 2.6347, "step": 9000 }, { "epoch": 1.78, "eval_COMMENT": { "f1": 0.6949685534591195, "number": 6854, "precision": 0.6538461538461539, "recall": 0.7416107382550335 }, "eval_NAME": { "f1": 0.8143807055111011, "number": 8845, "precision": 0.8118188967531738, "recall": 0.8169587337478802 }, "eval_QTY": { "f1": 0.9832394464149107, "number": 7152, "precision": 0.9781375397813754, "recall": 0.9883948545861297 }, "eval_RANGE_END": { "f1": 0.7588932806324111, "number": 105, "precision": 0.6486486486486487, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9523400601116359, "number": 5646, "precision": 0.92432072012002, "recall": 0.9821112291888062 }, "eval_loss": 2.6447880268096924, "eval_overall_accuracy": 0.8236836106678824, "eval_overall_f1": 0.8531482839167277, "eval_overall_precision": 0.832606742320876, "eval_overall_recall": 0.8747290399272778, "eval_runtime": 10.4718, "eval_samples_per_second": 812.274, "eval_steps_per_second": 25.401, "step": 9000 }, { "epoch": 1.88, "learning_rate": 4.059592159968323e-05, "loss": 2.5569, "step": 9500 }, { "epoch": 1.98, "learning_rate": 4.010097010492972e-05, "loss": 2.5847, "step": 10000 }, { "epoch": 1.98, "eval_COMMENT": { "f1": 0.6963045290358433, "number": 6854, "precision": 0.6645452134712277, "recall": 0.7312518237525533 }, "eval_NAME": { "f1": 0.8156796390298928, "number": 8845, "precision": 0.8138435565559933, "recall": 0.8175240248728095 }, "eval_QTY": { "f1": 0.9831476323119777, "number": 7152, "precision": 0.9793285238623751, "recall": 0.986996644295302 }, "eval_RANGE_END": { "f1": 0.7639484978540773, "number": 105, "precision": 0.6953125, "recall": 0.8476190476190476 }, "eval_UNIT": { "f1": 0.9530017152658663, "number": 5646, "precision": 0.9238443631526438, "recall": 0.9840595111583422 }, "eval_loss": 2.591038227081299, "eval_overall_accuracy": 0.8253172251348682, "eval_overall_f1": 0.8546566402302197, "eval_overall_precision": 0.8377942707458776, "eval_overall_recall": 0.8722117334452136, "eval_runtime": 10.9908, "eval_samples_per_second": 773.919, "eval_steps_per_second": 24.202, "step": 10000 }, { "epoch": 2.08, "learning_rate": 3.9606018610176205e-05, "loss": 2.5001, "step": 10500 }, { "epoch": 2.18, "learning_rate": 3.911106711542269e-05, "loss": 2.4321, "step": 11000 }, { "epoch": 2.18, "eval_COMMENT": { "f1": 0.7009998630324613, "number": 6854, "precision": 0.660557563242127, "recall": 0.7467172454041435 }, "eval_NAME": { "f1": 0.8124085125548924, "number": 8845, "precision": 0.8091286307053942, "recall": 0.8157150932730356 }, "eval_QTY": { "f1": 0.9833752444816989, "number": 7152, "precision": 0.9825516471245115, "recall": 0.9842002237136466 }, "eval_RANGE_END": { "f1": 0.7404580152671757, "number": 105, "precision": 0.6178343949044586, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9521690767519465, "number": 5646, "precision": 0.9210395629862606, "recall": 0.9854764434998229 }, "eval_loss": 2.5731780529022217, "eval_overall_accuracy": 0.8255071803054479, "eval_overall_f1": 0.8539459994200822, "eval_overall_precision": 0.8336830186165785, "eval_overall_recall": 0.8752185161876792, "eval_runtime": 9.4187, "eval_samples_per_second": 903.101, "eval_steps_per_second": 28.242, "step": 11000 }, { "epoch": 2.28, "learning_rate": 3.861611562066917e-05, "loss": 2.5117, "step": 11500 }, { "epoch": 2.38, "learning_rate": 3.812116412591566e-05, "loss": 2.4326, "step": 12000 }, { "epoch": 2.38, "eval_COMMENT": { "f1": 0.7086570477247504, "number": 6854, "precision": 0.6754826765405977, "recall": 0.7452582433615407 }, "eval_NAME": { "f1": 0.8158534516876803, "number": 8845, "precision": 0.8159918570459173, "recall": 0.8157150932730356 }, "eval_QTY": { "f1": 0.9844993715961456, "number": 7152, "precision": 0.9832635983263598, "recall": 0.985738255033557 }, "eval_RANGE_END": { "f1": 0.7654320987654321, "number": 105, "precision": 0.6739130434782609, "recall": 0.8857142857142857 }, "eval_UNIT": { "f1": 0.9534265374388883, "number": 5646, "precision": 0.9243306169965075, "recall": 0.9844137442437123 }, "eval_loss": 2.5278468132019043, "eval_overall_accuracy": 0.8280525795912165, "eval_overall_f1": 0.8580588749635675, "eval_overall_precision": 0.8418502943650126, "eval_overall_recall": 0.8749038528774211, "eval_runtime": 11.4233, "eval_samples_per_second": 744.616, "eval_steps_per_second": 23.286, "step": 12000 }, { "epoch": 2.47, "learning_rate": 3.762621263116215e-05, "loss": 2.3983, "step": 12500 }, { "epoch": 2.57, "learning_rate": 3.7131261136408633e-05, "loss": 2.3705, "step": 13000 }, { "epoch": 2.57, "eval_COMMENT": { "f1": 0.7056559686619477, "number": 6854, "precision": 0.6670131219955827, "recall": 0.7490516486723081 }, "eval_NAME": { "f1": 0.8140058545372664, "number": 8845, "precision": 0.8106289942818702, "recall": 0.8174109666478236 }, "eval_QTY": { "f1": 0.9845080251221213, "number": 7152, "precision": 0.9827249930342714, "recall": 0.9862975391498882 }, "eval_RANGE_END": { "f1": 0.7415730337078652, "number": 105, "precision": 0.6111111111111112, "recall": 0.9428571428571428 }, "eval_UNIT": { "f1": 0.952819725279413, "number": 5646, "precision": 0.9191769547325103, "recall": 0.9890187743535246 }, "eval_loss": 2.4818899631500244, "eval_overall_accuracy": 0.8270458171871439, "eval_overall_f1": 0.8562072552999164, "eval_overall_precision": 0.8358363024874297, "eval_overall_recall": 0.8775959723096287, "eval_runtime": 9.7776, "eval_samples_per_second": 869.945, "eval_steps_per_second": 27.205, "step": 13000 }, { "epoch": 2.67, "learning_rate": 3.663630964165512e-05, "loss": 2.4183, "step": 13500 }, { "epoch": 2.77, "learning_rate": 3.6141358146901606e-05, "loss": 2.364, "step": 14000 }, { "epoch": 2.77, "eval_COMMENT": { "f1": 0.7068350260774088, "number": 6854, "precision": 0.6672713138118683, "recall": 0.7513860519404727 }, "eval_NAME": { "f1": 0.8130456824198727, "number": 8845, "precision": 0.8101706331387517, "recall": 0.8159412097230073 }, "eval_QTY": { "f1": 0.9847269684078387, "number": 7152, "precision": 0.9823292055099485, "recall": 0.9871364653243848 }, "eval_RANGE_END": { "f1": 0.7729083665338645, "number": 105, "precision": 0.6643835616438356, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9542999228328902, "number": 5646, "precision": 0.9248795080604952, "recall": 0.9856535600425079 }, "eval_loss": 2.4206130504608154, "eval_overall_accuracy": 0.8284704809664919, "eval_overall_f1": 0.8566014544709617, "eval_overall_precision": 0.8369695756605284, "eval_overall_recall": 0.8771764212292846, "eval_runtime": 10.6958, "eval_samples_per_second": 795.265, "eval_steps_per_second": 24.87, "step": 14000 }, { "epoch": 2.87, "learning_rate": 3.564640665214809e-05, "loss": 2.3089, "step": 14500 }, { "epoch": 2.97, "learning_rate": 3.515145515739457e-05, "loss": 2.3349, "step": 15000 }, { "epoch": 2.97, "eval_COMMENT": { "f1": 0.7115305703734099, "number": 6854, "precision": 0.6696704428424305, "recall": 0.7589728625620076 }, "eval_NAME": { "f1": 0.8152284263959392, "number": 8845, "precision": 0.8133933595948227, "recall": 0.8170717919728661 }, "eval_QTY": { "f1": 0.9854223338215806, "number": 7152, "precision": 0.9831593597773138, "recall": 0.9876957494407159 }, "eval_RANGE_END": { "f1": 0.7320754716981133, "number": 105, "precision": 0.60625, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.954592186429061, "number": 5646, "precision": 0.9244938599402589, "recall": 0.9867162592986185 }, "eval_loss": 2.390350103378296, "eval_overall_accuracy": 0.8285084720006078, "eval_overall_f1": 0.8583563606590933, "eval_overall_precision": 0.8380295763389288, "eval_overall_recall": 0.8796937277113489, "eval_runtime": 13.4662, "eval_samples_per_second": 631.657, "eval_steps_per_second": 19.753, "step": 15000 }, { "epoch": 3.07, "learning_rate": 3.465650366264107e-05, "loss": 2.251, "step": 15500 }, { "epoch": 3.17, "learning_rate": 3.416155216788755e-05, "loss": 2.253, "step": 16000 }, { "epoch": 3.17, "eval_COMMENT": { "f1": 0.7120891136472357, "number": 6854, "precision": 0.669751896130608, "recall": 0.7601400641960899 }, "eval_NAME": { "f1": 0.8165914221218961, "number": 8845, "precision": 0.8152112676056338, "recall": 0.817976257772753 }, "eval_QTY": { "f1": 0.9850704618389843, "number": 7152, "precision": 0.9830130882762461, "recall": 0.9871364653243848 }, "eval_RANGE_END": { "f1": 0.7529411764705883, "number": 105, "precision": 0.64, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9538013199622868, "number": 5646, "precision": 0.924098986879256, "recall": 0.9854764434998229 }, "eval_loss": 2.3770651817321777, "eval_overall_accuracy": 0.8302180685358256, "eval_overall_f1": 0.8587418314593322, "eval_overall_precision": 0.8386376512147166, "eval_overall_recall": 0.8798335780714636, "eval_runtime": 11.0556, "eval_samples_per_second": 769.382, "eval_steps_per_second": 24.06, "step": 16000 }, { "epoch": 3.27, "learning_rate": 3.3666600673134034e-05, "loss": 2.1955, "step": 16500 }, { "epoch": 3.37, "learning_rate": 3.317164917838052e-05, "loss": 2.2137, "step": 17000 }, { "epoch": 3.37, "eval_COMMENT": { "f1": 0.7152373022481265, "number": 6854, "precision": 0.6819264355649642, "recall": 0.7519696527575138 }, "eval_NAME": { "f1": 0.816918906708832, "number": 8845, "precision": 0.8160893602617624, "recall": 0.8177501413227812 }, "eval_QTY": { "f1": 0.9852099902330124, "number": 7152, "precision": 0.9831523252575884, "recall": 0.9872762863534675 }, "eval_RANGE_END": { "f1": 0.7619047619047618, "number": 105, "precision": 0.6530612244897959, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9529855868222373, "number": 5646, "precision": 0.924126455906822, "recall": 0.983705278072972 }, "eval_loss": 2.378207206726074, "eval_overall_accuracy": 0.8285464630347238, "eval_overall_f1": 0.8600801891641822, "eval_overall_precision": 0.8433467741935484, "eval_overall_recall": 0.8774910845395427, "eval_runtime": 10.7102, "eval_samples_per_second": 794.197, "eval_steps_per_second": 24.836, "step": 17000 }, { "epoch": 3.46, "learning_rate": 3.267669768362701e-05, "loss": 2.2027, "step": 17500 }, { "epoch": 3.56, "learning_rate": 3.218174618887349e-05, "loss": 2.2065, "step": 18000 }, { "epoch": 3.56, "eval_COMMENT": { "f1": 0.715327462850853, "number": 6854, "precision": 0.6767768810205675, "recall": 0.7585351619492268 }, "eval_NAME": { "f1": 0.8111738148984199, "number": 8845, "precision": 0.8098028169014084, "recall": 0.8125494629734313 }, "eval_QTY": { "f1": 0.9852766729467587, "number": 7152, "precision": 0.9834238751915308, "recall": 0.9871364653243848 }, "eval_RANGE_END": { "f1": 0.751937984496124, "number": 105, "precision": 0.6339869281045751, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9542920847268673, "number": 5646, "precision": 0.9250207813798836, "recall": 0.9854764434998229 }, "eval_loss": 2.3392648696899414, "eval_overall_accuracy": 0.829154319580579, "eval_overall_f1": 0.8582709465695826, "eval_overall_precision": 0.8395866773675762, "eval_overall_recall": 0.8778057478498007, "eval_runtime": 10.643, "eval_samples_per_second": 799.209, "eval_steps_per_second": 24.993, "step": 18000 }, { "epoch": 3.66, "learning_rate": 3.168679469411997e-05, "loss": 2.17, "step": 18500 }, { "epoch": 3.76, "learning_rate": 3.119184319936647e-05, "loss": 2.1758, "step": 19000 }, { "epoch": 3.76, "eval_COMMENT": { "f1": 0.7196268093572066, "number": 6854, "precision": 0.6791402304803833, "recall": 0.7652465713451999 }, "eval_NAME": { "f1": 0.8154011420817548, "number": 8845, "precision": 0.8155394707079846, "recall": 0.8152628603730921 }, "eval_QTY": { "f1": 0.9850017439832579, "number": 7152, "precision": 0.9828762355561743, "recall": 0.9871364653243848 }, "eval_RANGE_END": { "f1": 0.7637795275590552, "number": 105, "precision": 0.6510067114093959, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9544714052988081, "number": 5646, "precision": 0.9250457038391224, "recall": 0.9858306765851931 }, "eval_loss": 2.306312322616577, "eval_overall_accuracy": 0.827710660284173, "eval_overall_f1": 0.8605851391072529, "eval_overall_precision": 0.8417129103429832, "eval_overall_recall": 0.8803230543318649, "eval_runtime": 11.977, "eval_samples_per_second": 710.192, "eval_steps_per_second": 22.209, "step": 19000 }, { "epoch": 3.86, "learning_rate": 3.069689170461295e-05, "loss": 2.2238, "step": 19500 }, { "epoch": 3.96, "learning_rate": 3.0201940209859435e-05, "loss": 2.1417, "step": 20000 }, { "epoch": 3.96, "eval_COMMENT": { "f1": 0.7152720243026789, "number": 6854, "precision": 0.6788990825688074, "recall": 0.7557630580682813 }, "eval_NAME": { "f1": 0.815481242573417, "number": 8845, "precision": 0.8162664250113276, "recall": 0.8146975692481628 }, "eval_QTY": { "f1": 0.9854263998326477, "number": 7152, "precision": 0.9828905271943247, "recall": 0.9879753914988815 }, "eval_RANGE_END": { "f1": 0.7634854771784232, "number": 105, "precision": 0.6764705882352942, "recall": 0.8761904761904762 }, "eval_UNIT": { "f1": 0.9533384893013664, "number": 5646, "precision": 0.9258888332498748, "recall": 0.9824654622741764 }, "eval_loss": 2.288215398788452, "eval_overall_accuracy": 0.8285084720006078, "eval_overall_f1": 0.8596340962039195, "eval_overall_precision": 0.8427151205749983, "eval_overall_recall": 0.877246346409342, "eval_runtime": 9.5122, "eval_samples_per_second": 894.221, "eval_steps_per_second": 27.964, "step": 20000 }, { "epoch": 4.06, "learning_rate": 2.970698871510592e-05, "loss": 2.1114, "step": 20500 }, { "epoch": 4.16, "learning_rate": 2.9212037220352405e-05, "loss": 2.0271, "step": 21000 }, { "epoch": 4.16, "eval_COMMENT": { "f1": 0.7168075752451809, "number": 6854, "precision": 0.6681376875551632, "recall": 0.7731251823752553 }, "eval_NAME": { "f1": 0.8170380818053596, "number": 8845, "precision": 0.815427927927928, "recall": 0.8186546071226681 }, "eval_QTY": { "f1": 0.9858546442756603, "number": 7152, "precision": 0.9826364772885123, "recall": 0.9890939597315436 }, "eval_RANGE_END": { "f1": 0.7717842323651452, "number": 105, "precision": 0.6838235294117647, "recall": 0.8857142857142857 }, "eval_UNIT": { "f1": 0.9534565366187543, "number": 5646, "precision": 0.922211188348229, "recall": 0.9868933758413035 }, "eval_loss": 2.350003242492676, "eval_overall_accuracy": 0.82989514474584, "eval_overall_f1": 0.859976186426263, "eval_overall_precision": 0.837385716178614, "eval_overall_recall": 0.8838193133347318, "eval_runtime": 11.0178, "eval_samples_per_second": 772.02, "eval_steps_per_second": 24.143, "step": 21000 }, { "epoch": 4.26, "learning_rate": 2.871708572559889e-05, "loss": 2.0589, "step": 21500 }, { "epoch": 4.36, "learning_rate": 2.8222134230845377e-05, "loss": 2.0488, "step": 22000 }, { "epoch": 4.36, "eval_COMMENT": { "f1": 0.7173793103448276, "number": 6854, "precision": 0.6802249542244311, "recall": 0.7588269623577473 }, "eval_NAME": { "f1": 0.814222122048797, "number": 8845, "precision": 0.8116153673331835, "recall": 0.8168456755228943 }, "eval_QTY": { "f1": 0.9854284319877291, "number": 7152, "precision": 0.9827562230565985, "recall": 0.9881152125279642 }, "eval_RANGE_END": { "f1": 0.7686274509803921, "number": 105, "precision": 0.6533333333333333, "recall": 0.9333333333333333 }, "eval_UNIT": { "f1": 0.9529190207156308, "number": 5646, "precision": 0.9221338634857521, "recall": 0.9858306765851931 }, "eval_loss": 2.2779643535614014, "eval_overall_accuracy": 0.8274067320112454, "eval_overall_f1": 0.8596716045585798, "eval_overall_precision": 0.8406683375104428, "eval_overall_recall": 0.8795538773512341, "eval_runtime": 10.9882, "eval_samples_per_second": 774.104, "eval_steps_per_second": 24.208, "step": 22000 }, { "epoch": 4.45, "learning_rate": 2.7727182736091867e-05, "loss": 2.0377, "step": 22500 }, { "epoch": 4.55, "learning_rate": 2.7232231241338353e-05, "loss": 2.0403, "step": 23000 }, { "epoch": 4.55, "eval_COMMENT": { "f1": 0.7213069552629764, "number": 6854, "precision": 0.6836534692277538, "recall": 0.7633498686898161 }, "eval_NAME": { "f1": 0.8175446529504862, "number": 8845, "precision": 0.8174522436984288, "recall": 0.8176370830977954 }, "eval_QTY": { "f1": 0.9858447806986962, "number": 7152, "precision": 0.9833078314090973, "recall": 0.9883948545861297 }, "eval_RANGE_END": { "f1": 0.7868852459016393, "number": 105, "precision": 0.6906474820143885, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9541991267870901, "number": 5646, "precision": 0.9234465617232809, "recall": 0.9870704923839887 }, "eval_loss": 2.255697250366211, "eval_overall_accuracy": 0.8292303016488108, "eval_overall_f1": 0.8621226374754127, "eval_overall_precision": 0.8439205706057663, "eval_overall_recall": 0.8811271939025243, "eval_runtime": 11.1445, "eval_samples_per_second": 763.249, "eval_steps_per_second": 23.868, "step": 23000 }, { "epoch": 4.65, "learning_rate": 2.6737279746584836e-05, "loss": 2.0887, "step": 23500 }, { "epoch": 4.75, "learning_rate": 2.6242328251831323e-05, "loss": 2.0443, "step": 24000 }, { "epoch": 4.75, "eval_COMMENT": { "f1": 0.7226055754899255, "number": 6854, "precision": 0.6855197695731867, "recall": 0.7639334695068573 }, "eval_NAME": { "f1": 0.8165780843605112, "number": 8845, "precision": 0.8167628096369189, "recall": 0.8163934426229508 }, "eval_QTY": { "f1": 0.9852161785216179, "number": 7152, "precision": 0.9827490261547023, "recall": 0.9876957494407159 }, "eval_RANGE_END": { "f1": 0.7854251012145749, "number": 105, "precision": 0.6830985915492958, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9537354352296092, "number": 5646, "precision": 0.9236641221374046, "recall": 0.9858306765851931 }, "eval_loss": 2.228408098220825, "eval_overall_accuracy": 0.829097333029405, "eval_overall_f1": 0.8619196741790305, "eval_overall_precision": 0.8441092676386794, "eval_overall_recall": 0.8804978672820083, "eval_runtime": 10.5005, "eval_samples_per_second": 810.058, "eval_steps_per_second": 25.332, "step": 24000 }, { "epoch": 4.85, "learning_rate": 2.5747376757077806e-05, "loss": 2.068, "step": 24500 }, { "epoch": 4.95, "learning_rate": 2.5252425262324292e-05, "loss": 2.0214, "step": 25000 }, { "epoch": 4.95, "eval_COMMENT": { "f1": 0.7221103783408538, "number": 6854, "precision": 0.6887829426566018, "recall": 0.7588269623577473 }, "eval_NAME": { "f1": 0.8139863300005649, "number": 8845, "precision": 0.8133890268683676, "recall": 0.814584511023177 }, "eval_QTY": { "f1": 0.9864751812604574, "number": 7152, "precision": 0.9837319243604005, "recall": 0.9892337807606264 }, "eval_RANGE_END": { "f1": 0.7713004484304932, "number": 105, "precision": 0.7288135593220338, "recall": 0.819047619047619 }, "eval_UNIT": { "f1": 0.9553288176283975, "number": 5646, "precision": 0.9258766827322586, "recall": 0.9867162592986185 }, "eval_loss": 2.2036967277526855, "eval_overall_accuracy": 0.8304270192234633, "eval_overall_f1": 0.8618053412869828, "eval_overall_precision": 0.8453726123217649, "eval_overall_recall": 0.8788895881406895, "eval_runtime": 10.7118, "eval_samples_per_second": 794.075, "eval_steps_per_second": 24.832, "step": 25000 }, { "epoch": 5.05, "learning_rate": 2.4757473767570778e-05, "loss": 2.0164, "step": 25500 }, { "epoch": 5.15, "learning_rate": 2.4262522272817265e-05, "loss": 2.0081, "step": 26000 }, { "epoch": 5.15, "eval_COMMENT": { "f1": 0.719671201814059, "number": 6854, "precision": 0.6996417745935519, "recall": 0.7408812372337321 }, "eval_NAME": { "f1": 0.8098846414838272, "number": 8845, "precision": 0.8101595203077271, "recall": 0.8096099491237988 }, "eval_QTY": { "f1": 0.9862001672706997, "number": 7152, "precision": 0.9831851028349082, "recall": 0.9892337807606264 }, "eval_RANGE_END": { "f1": 0.7918367346938776, "number": 105, "precision": 0.6928571428571428, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9546235819869371, "number": 5646, "precision": 0.927212020033389, "recall": 0.983705278072972 }, "eval_loss": 2.2013936042785645, "eval_overall_accuracy": 0.8273117544259555, "eval_overall_f1": 0.8604911676001723, "eval_overall_precision": 0.8484858783944533, "eval_overall_recall": 0.8728410600657297, "eval_runtime": 11.2303, "eval_samples_per_second": 757.413, "eval_steps_per_second": 23.686, "step": 26000 }, { "epoch": 5.25, "learning_rate": 2.376757077806375e-05, "loss": 1.9905, "step": 26500 }, { "epoch": 5.35, "learning_rate": 2.3272619283310237e-05, "loss": 1.9138, "step": 27000 }, { "epoch": 5.35, "eval_COMMENT": { "f1": 0.7232730263157895, "number": 6854, "precision": 0.6819591625743086, "recall": 0.7699153778815291 }, "eval_NAME": { "f1": 0.8175660419959357, "number": 8845, "precision": 0.8163679404802164, "recall": 0.818767665347654 }, "eval_QTY": { "f1": 0.9861333704968295, "number": 7152, "precision": 0.9829142936518961, "recall": 0.9893736017897091 }, "eval_RANGE_END": { "f1": 0.7679324894514767, "number": 105, "precision": 0.6893939393939394, "recall": 0.8666666666666667 }, "eval_UNIT": { "f1": 0.9538567493112948, "number": 5646, "precision": 0.9279731993299832, "recall": 0.9812256464753808 }, "eval_loss": 2.1838574409484863, "eval_overall_accuracy": 0.8322695843780867, "eval_overall_f1": 0.8622504785343178, "eval_overall_precision": 0.8433968572383818, "eval_overall_recall": 0.8819662960632124, "eval_runtime": 10.2972, "eval_samples_per_second": 826.053, "eval_steps_per_second": 25.832, "step": 27000 }, { "epoch": 5.44, "learning_rate": 2.2777667788556724e-05, "loss": 1.9236, "step": 27500 }, { "epoch": 5.54, "learning_rate": 2.2282716293803206e-05, "loss": 1.9304, "step": 28000 }, { "epoch": 5.54, "eval_COMMENT": { "f1": 0.7215675336447948, "number": 6854, "precision": 0.6910645118204889, "recall": 0.7548876568427196 }, "eval_NAME": { "f1": 0.8127016471387332, "number": 8845, "precision": 0.8137610519156654, "recall": 0.8116449971735443 }, "eval_QTY": { "f1": 0.9857760423929716, "number": 7152, "precision": 0.9831710709318497, "recall": 0.9883948545861297 }, "eval_RANGE_END": { "f1": 0.776, "number": 105, "precision": 0.6689655172413793, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9539864109400533, "number": 5646, "precision": 0.9272696873432537, "recall": 0.9822883457314914 }, "eval_loss": 2.1557235717773438, "eval_overall_accuracy": 0.8287364182053035, "eval_overall_f1": 0.860940800659488, "eval_overall_precision": 0.8460759493670886, "eval_overall_recall": 0.8763373190685966, "eval_runtime": 11.4111, "eval_samples_per_second": 745.412, "eval_steps_per_second": 23.311, "step": 28000 }, { "epoch": 5.64, "learning_rate": 2.1787764799049696e-05, "loss": 1.908, "step": 28500 }, { "epoch": 5.74, "learning_rate": 2.129281330429618e-05, "loss": 1.9369, "step": 29000 }, { "epoch": 5.74, "eval_COMMENT": { "f1": 0.7214330697641872, "number": 6854, "precision": 0.6931558424095737, "recall": 0.7521155529617741 }, "eval_NAME": { "f1": 0.8120292235374073, "number": 8845, "precision": 0.8135497049477984, "recall": 0.8105144149236857 }, "eval_QTY": { "f1": 0.9862020905923344, "number": 7152, "precision": 0.9830508474576272, "recall": 0.9893736017897091 }, "eval_RANGE_END": { "f1": 0.7841409691629957, "number": 105, "precision": 0.7295081967213115, "recall": 0.8476190476190476 }, "eval_UNIT": { "f1": 0.9530419880034275, "number": 5646, "precision": 0.923140770252324, "recall": 0.9849450938717677 }, "eval_loss": 2.152221918106079, "eval_overall_accuracy": 0.8286794316541296, "eval_overall_f1": 0.8608987026376836, "eval_overall_precision": 0.8464839658027237, "eval_overall_recall": 0.8758128802181666, "eval_runtime": 8.8394, "eval_samples_per_second": 962.281, "eval_steps_per_second": 30.093, "step": 29000 }, { "epoch": 5.84, "learning_rate": 2.0797861809542665e-05, "loss": 1.9176, "step": 29500 }, { "epoch": 5.94, "learning_rate": 2.0302910314789152e-05, "loss": 1.8944, "step": 30000 }, { "epoch": 5.94, "eval_COMMENT": { "f1": 0.723598615916955, "number": 6854, "precision": 0.6882569773565034, "recall": 0.762766267872775 }, "eval_NAME": { "f1": 0.8156853881794554, "number": 8845, "precision": 0.8153168417485598, "recall": 0.8160542679479932 }, "eval_QTY": { "f1": 0.9857272157627236, "number": 7152, "precision": 0.9816946331992789, "recall": 0.9897930648769575 }, "eval_RANGE_END": { "f1": 0.7631578947368421, "number": 105, "precision": 0.7073170731707317, "recall": 0.8285714285714286 }, "eval_UNIT": { "f1": 0.9549935705100728, "number": 5646, "precision": 0.9254028908456554, "recall": 0.9865391427559334 }, "eval_loss": 2.128391742706299, "eval_overall_accuracy": 0.8317377099004635, "eval_overall_f1": 0.8623381960139715, "eval_overall_precision": 0.8449768471914637, "eval_overall_recall": 0.880427942101951, "eval_runtime": 11.5016, "eval_samples_per_second": 739.547, "eval_steps_per_second": 23.127, "step": 30000 }, { "epoch": 6.04, "learning_rate": 1.9807958820035638e-05, "loss": 1.837, "step": 30500 }, { "epoch": 6.14, "learning_rate": 1.9313007325282124e-05, "loss": 1.8311, "step": 31000 }, { "epoch": 6.14, "eval_COMMENT": { "f1": 0.7244426318651441, "number": 6854, "precision": 0.6781623822855688, "recall": 0.7775021885030639 }, "eval_NAME": { "f1": 0.818961625282167, "number": 8845, "precision": 0.8175774647887324, "recall": 0.8203504804974562 }, "eval_QTY": { "f1": 0.9856425982715361, "number": 7152, "precision": 0.9826292384658143, "recall": 0.9886744966442953 }, "eval_RANGE_END": { "f1": 0.7896995708154506, "number": 105, "precision": 0.71875, "recall": 0.8761904761904762 }, "eval_UNIT": { "f1": 0.9552008238928938, "number": 5646, "precision": 0.9265734265734266, "recall": 0.9856535600425079 }, "eval_loss": 2.171062469482422, "eval_overall_accuracy": 0.8314527771445939, "eval_overall_f1": 0.8629676979459644, "eval_overall_precision": 0.8419984698799189, "eval_overall_recall": 0.8850080413957065, "eval_runtime": 11.2938, "eval_samples_per_second": 753.154, "eval_steps_per_second": 23.553, "step": 31000 }, { "epoch": 6.24, "learning_rate": 1.8818055830528607e-05, "loss": 1.8426, "step": 31500 }, { "epoch": 6.34, "learning_rate": 1.8323104335775097e-05, "loss": 1.879, "step": 32000 }, { "epoch": 6.34, "eval_COMMENT": { "f1": 0.7243460764587525, "number": 6854, "precision": 0.6905675353882789, "recall": 0.7615990662386928 }, "eval_NAME": { "f1": 0.8148399502318742, "number": 8845, "precision": 0.8152087812606088, "recall": 0.8144714527981911 }, "eval_QTY": { "f1": 0.985952712100139, "number": 7152, "precision": 0.9807692307692307, "recall": 0.9911912751677853 }, "eval_RANGE_END": { "f1": 0.7796610169491526, "number": 105, "precision": 0.7022900763358778, "recall": 0.8761904761904762 }, "eval_UNIT": { "f1": 0.9541174456428694, "number": 5646, "precision": 0.9232935719019219, "recall": 0.9870704923839887 }, "eval_loss": 2.1472506523132324, "eval_overall_accuracy": 0.830635969911101, "eval_overall_f1": 0.8623636394773346, "eval_overall_precision": 0.8451545768856366, "eval_overall_recall": 0.8802880917418362, "eval_runtime": 12.4001, "eval_samples_per_second": 685.964, "eval_steps_per_second": 21.452, "step": 32000 }, { "epoch": 6.43, "learning_rate": 1.782815284102158e-05, "loss": 1.8605, "step": 32500 }, { "epoch": 6.53, "learning_rate": 1.7333201346268066e-05, "loss": 1.8279, "step": 33000 }, { "epoch": 6.53, "eval_COMMENT": { "f1": 0.7266004792879152, "number": 6854, "precision": 0.6845568313765966, "recall": 0.7741464838050773 }, "eval_NAME": { "f1": 0.8171618650279078, "number": 8845, "precision": 0.8150022492127755, "recall": 0.8193329564725834 }, "eval_QTY": { "f1": 0.9857839721254356, "number": 7152, "precision": 0.9826340650180606, "recall": 0.9889541387024608 }, "eval_RANGE_END": { "f1": 0.7860262008733625, "number": 105, "precision": 0.7258064516129032, "recall": 0.8571428571428571 }, "eval_UNIT": { "f1": 0.9554850330216998, "number": 5646, "precision": 0.9263262930317645, "recall": 0.9865391427559334 }, "eval_loss": 2.1636247634887695, "eval_overall_accuracy": 0.83139579059342, "eval_overall_f1": 0.8632980539433255, "eval_overall_precision": 0.8434852224964974, "eval_overall_recall": 0.8840640514649325, "eval_runtime": 11.6243, "eval_samples_per_second": 731.745, "eval_steps_per_second": 22.883, "step": 33000 }, { "epoch": 6.63, "learning_rate": 1.6838249851514553e-05, "loss": 1.8596, "step": 33500 }, { "epoch": 6.73, "learning_rate": 1.634329835676104e-05, "loss": 1.8613, "step": 34000 }, { "epoch": 6.73, "eval_COMMENT": { "f1": 0.7281226369698219, "number": 6854, "precision": 0.6884180423761861, "recall": 0.7726874817624745 }, "eval_NAME": { "f1": 0.8162550161080653, "number": 8845, "precision": 0.8161166365280289, "recall": 0.8163934426229508 }, "eval_QTY": { "f1": 0.9855233853006681, "number": 7152, "precision": 0.9811529933481153, "recall": 0.9899328859060402 }, "eval_RANGE_END": { "f1": 0.7777777777777778, "number": 105, "precision": 0.6666666666666666, "recall": 0.9333333333333333 }, "eval_UNIT": { "f1": 0.9550600343053174, "number": 5646, "precision": 0.9258397073495178, "recall": 0.9861849096705633 }, "eval_loss": 2.119246482849121, "eval_overall_accuracy": 0.8333523288503913, "eval_overall_f1": 0.8633971291866029, "eval_overall_precision": 0.8444080486663547, "eval_overall_recall": 0.8832599118942731, "eval_runtime": 9.0301, "eval_samples_per_second": 941.963, "eval_steps_per_second": 29.457, "step": 34000 }, { "epoch": 6.83, "learning_rate": 1.5848346862007525e-05, "loss": 1.8804, "step": 34500 }, { "epoch": 6.93, "learning_rate": 1.535339536725401e-05, "loss": 1.8604, "step": 35000 }, { "epoch": 6.93, "eval_COMMENT": { "f1": 0.7285265601529427, "number": 6854, "precision": 0.68467659137577, "recall": 0.7783775897286256 }, "eval_NAME": { "f1": 0.8183306055646481, "number": 8845, "precision": 0.8169934640522876, "recall": 0.819672131147541 }, "eval_QTY": { "f1": 0.9865589525732991, "number": 7152, "precision": 0.9827945053420286, "recall": 0.9903523489932886 }, "eval_RANGE_END": { "f1": 0.7818930041152263, "number": 105, "precision": 0.6884057971014492, "recall": 0.9047619047619048 }, "eval_UNIT": { "f1": 0.9555517418911963, "number": 5646, "precision": 0.9267643142476698, "recall": 0.9861849096705633 }, "eval_loss": 2.1069583892822266, "eval_overall_accuracy": 0.834340095737406, "eval_overall_f1": 0.8642295423141878, "eval_overall_precision": 0.8438322395815984, "eval_overall_recall": 0.8856373680162226, "eval_runtime": 11.4858, "eval_samples_per_second": 740.57, "eval_steps_per_second": 23.159, "step": 35000 }, { "epoch": 7.03, "learning_rate": 1.4858443872500496e-05, "loss": 1.7995, "step": 35500 }, { "epoch": 7.13, "learning_rate": 1.4363492377746981e-05, "loss": 1.8026, "step": 36000 }, { "epoch": 7.13, "eval_COMMENT": { "f1": 0.7254587315984092, "number": 6854, "precision": 0.695146409947854, "recall": 0.7585351619492268 }, "eval_NAME": { "f1": 0.8138180584610165, "number": 8845, "precision": 0.8139561185252205, "recall": 0.81368004522329 }, "eval_QTY": { "f1": 0.9861982434127978, "number": 7152, "precision": 0.9833194328607172, "recall": 0.9890939597315436 }, "eval_RANGE_END": { "f1": 0.7692307692307693, "number": 105, "precision": 0.6976744186046512, "recall": 0.8571428571428571 }, "eval_UNIT": { "f1": 0.9548265200961868, "number": 5646, "precision": 0.926808936312104, "recall": 0.9845908607863975 }, "eval_loss": 2.1282002925872803, "eval_overall_accuracy": 0.8295152344046804, "eval_overall_f1": 0.8625437813336996, "eval_overall_precision": 0.8474124552999123, "eval_overall_recall": 0.8782252989301448, "eval_runtime": 9.0618, "eval_samples_per_second": 938.668, "eval_steps_per_second": 29.354, "step": 36000 }, { "epoch": 7.23, "learning_rate": 1.3868540882993467e-05, "loss": 1.7692, "step": 36500 }, { "epoch": 7.33, "learning_rate": 1.3373589388239954e-05, "loss": 1.774, "step": 37000 }, { "epoch": 7.33, "eval_COMMENT": { "f1": 0.7252502780867629, "number": 6854, "precision": 0.6926958831341301, "recall": 0.7610154654216515 }, "eval_NAME": { "f1": 0.8135153429602889, "number": 8845, "precision": 0.8117753011370032, "recall": 0.8152628603730921 }, "eval_QTY": { "f1": 0.9858644941160087, "number": 7152, "precision": 0.9819669857123041, "recall": 0.9897930648769575 }, "eval_RANGE_END": { "f1": 0.7948717948717948, "number": 105, "precision": 0.7209302325581395, "recall": 0.8857142857142857 }, "eval_UNIT": { "f1": 0.953885787891799, "number": 5646, "precision": 0.9258209701616936, "recall": 0.983705278072972 }, "eval_loss": 2.1374754905700684, "eval_overall_accuracy": 0.829952131297014, "eval_overall_f1": 0.8621126953660542, "eval_overall_precision": 0.8454789915966386, "eval_overall_recall": 0.8794140269911195, "eval_runtime": 13.9271, "eval_samples_per_second": 610.751, "eval_steps_per_second": 19.099, "step": 37000 }, { "epoch": 7.42, "learning_rate": 1.287863789348644e-05, "loss": 1.7909, "step": 37500 }, { "epoch": 7.52, "learning_rate": 1.2383686398732925e-05, "loss": 1.8132, "step": 38000 }, { "epoch": 7.52, "eval_COMMENT": { "f1": 0.7251632624704737, "number": 6854, "precision": 0.6921750663129973, "recall": 0.7614531660344325 }, "eval_NAME": { "f1": 0.8144125798970531, "number": 8845, "precision": 0.8149196287072674, "recall": 0.8139061616732617 }, "eval_QTY": { "f1": 0.9862059356276995, "number": 7152, "precision": 0.9827825603998889, "recall": 0.9896532438478747 }, "eval_RANGE_END": { "f1": 0.7966804979253113, "number": 105, "precision": 0.7058823529411765, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9550012856775519, "number": 5646, "precision": 0.9252615844544095, "recall": 0.9867162592986185 }, "eval_loss": 2.1093838214874268, "eval_overall_accuracy": 0.8298571537117241, "eval_overall_f1": 0.8627067798062913, "eval_overall_precision": 0.8462987253220328, "eval_overall_recall": 0.8797636528914062, "eval_runtime": 10.2321, "eval_samples_per_second": 831.306, "eval_steps_per_second": 25.997, "step": 38000 }, { "epoch": 7.62, "learning_rate": 1.1888734903979411e-05, "loss": 1.7708, "step": 38500 }, { "epoch": 7.72, "learning_rate": 1.1393783409225896e-05, "loss": 1.805, "step": 39000 }, { "epoch": 7.72, "eval_COMMENT": { "f1": 0.7264215888751205, "number": 6854, "precision": 0.6876955161626694, "recall": 0.7697694776772688 }, "eval_NAME": { "f1": 0.815460358779922, "number": 8845, "precision": 0.8163380920009065, "recall": 0.814584511023177 }, "eval_QTY": { "f1": 0.9862822923194763, "number": 7152, "precision": 0.9823831321958663, "recall": 0.9902125279642058 }, "eval_RANGE_END": { "f1": 0.7844827586206896, "number": 105, "precision": 0.7165354330708661, "recall": 0.8666666666666667 }, "eval_UNIT": { "f1": 0.9549858526965618, "number": 5646, "precision": 0.9255442911750041, "recall": 0.9863620262132483 }, "eval_loss": 2.1103549003601074, "eval_overall_accuracy": 0.8331053871286377, "eval_overall_f1": 0.8630181513352608, "eval_overall_precision": 0.8449633178117986, "eval_overall_recall": 0.8818614082931263, "eval_runtime": 10.8182, "eval_samples_per_second": 786.27, "eval_steps_per_second": 24.588, "step": 39000 }, { "epoch": 7.82, "learning_rate": 1.0898831914472382e-05, "loss": 1.8185, "step": 39500 }, { "epoch": 7.92, "learning_rate": 1.0403880419718868e-05, "loss": 1.7337, "step": 40000 }, { "epoch": 7.92, "eval_COMMENT": { "f1": 0.7251437677544517, "number": 6854, "precision": 0.6904604829133131, "recall": 0.7634957688940764 }, "eval_NAME": { "f1": 0.8154846001695395, "number": 8845, "precision": 0.8152542372881356, "recall": 0.8157150932730356 }, "eval_QTY": { "f1": 0.9866220735785953, "number": 7152, "precision": 0.9833333333333333, "recall": 0.9899328859060402 }, "eval_RANGE_END": { "f1": 0.8, "number": 105, "precision": 0.7, "recall": 0.9333333333333333 }, "eval_UNIT": { "f1": 0.9544557852302942, "number": 5646, "precision": 0.9253284550141361, "recall": 0.9854764434998229 }, "eval_loss": 2.1034367084503174, "eval_overall_accuracy": 0.830616974394043, "eval_overall_f1": 0.8629076459303919, "eval_overall_precision": 0.8458129071251091, "eval_overall_recall": 0.8807076428221803, "eval_runtime": 10.7303, "eval_samples_per_second": 792.708, "eval_steps_per_second": 24.79, "step": 40000 }, { "epoch": 8.02, "learning_rate": 9.908928924965353e-06, "loss": 1.7519, "step": 40500 }, { "epoch": 8.12, "learning_rate": 9.41397743021184e-06, "loss": 1.7771, "step": 41000 }, { "epoch": 8.12, "eval_COMMENT": { "f1": 0.7258660347110893, "number": 6854, "precision": 0.6949152542372882, "recall": 0.759702363583309 }, "eval_NAME": { "f1": 0.8134750169568167, "number": 8845, "precision": 0.8133830677065672, "recall": 0.8135669869983041 }, "eval_QTY": { "f1": 0.9863395595204906, "number": 7152, "precision": 0.9833240689271817, "recall": 0.9893736017897091 }, "eval_RANGE_END": { "f1": 0.7931034482758621, "number": 105, "precision": 0.7244094488188977, "recall": 0.8761904761904762 }, "eval_UNIT": { "f1": 0.9552213149978513, "number": 5646, "precision": 0.9278677575555184, "recall": 0.9842366277010273 }, "eval_loss": 2.107405424118042, "eval_overall_accuracy": 0.8285654585517818, "eval_overall_f1": 0.8627047069729117, "eval_overall_precision": 0.8474301902063942, "eval_overall_recall": 0.8785399622404028, "eval_runtime": 11.3451, "eval_samples_per_second": 749.75, "eval_steps_per_second": 23.446, "step": 41000 }, { "epoch": 8.22, "learning_rate": 8.919025935458326e-06, "loss": 1.7381, "step": 41500 }, { "epoch": 8.32, "learning_rate": 8.424074440704812e-06, "loss": 1.7179, "step": 42000 }, { "epoch": 8.32, "eval_COMMENT": { "f1": 0.7297001232370259, "number": 6854, "precision": 0.6874355005159959, "recall": 0.7775021885030639 }, "eval_NAME": { "f1": 0.8157106527267589, "number": 8845, "precision": 0.8154802259887005, "recall": 0.8159412097230073 }, "eval_QTY": { "f1": 0.9864158829676071, "number": 7152, "precision": 0.982923781757601, "recall": 0.9899328859060402 }, "eval_RANGE_END": { "f1": 0.8016194331983806, "number": 105, "precision": 0.6971830985915493, "recall": 0.9428571428571428 }, "eval_UNIT": { "f1": 0.954233801851217, "number": 5646, "precision": 0.9244437064098306, "recall": 0.9860077931278781 }, "eval_loss": 2.1069343090057373, "eval_overall_accuracy": 0.8319276650710432, "eval_overall_f1": 0.86363558757747, "eval_overall_precision": 0.8439387366945844, "eval_overall_recall": 0.8842738270051045, "eval_runtime": 11.303, "eval_samples_per_second": 752.544, "eval_steps_per_second": 23.534, "step": 42000 }, { "epoch": 8.41, "learning_rate": 7.929122945951298e-06, "loss": 1.7763, "step": 42500 }, { "epoch": 8.51, "learning_rate": 7.434171451197783e-06, "loss": 1.7005, "step": 43000 }, { "epoch": 8.51, "eval_COMMENT": { "f1": 0.7259434619133825, "number": 6854, "precision": 0.694326052210975, "recall": 0.7605777648088707 }, "eval_NAME": { "f1": 0.8142243328810492, "number": 8845, "precision": 0.8143164084586678, "recall": 0.8141322781232334 }, "eval_QTY": { "f1": 0.9863471719141822, "number": 7152, "precision": 0.9827873403664631, "recall": 0.9899328859060402 }, "eval_RANGE_END": { "f1": 0.7894736842105263, "number": 105, "precision": 0.7317073170731707, "recall": 0.8571428571428571 }, "eval_UNIT": { "f1": 0.9534087016101404, "number": 5646, "precision": 0.9230514096185738, "recall": 0.9858306765851931 }, "eval_loss": 2.1151254177093506, "eval_overall_accuracy": 0.8293252792341007, "eval_overall_f1": 0.8626307665923513, "eval_overall_precision": 0.8465733135855662, "eval_overall_recall": 0.8793091392210335, "eval_runtime": 10.9284, "eval_samples_per_second": 778.339, "eval_steps_per_second": 24.34, "step": 43000 }, { "epoch": 8.61, "learning_rate": 6.939219956444269e-06, "loss": 1.7224, "step": 43500 }, { "epoch": 8.71, "learning_rate": 6.444268461690754e-06, "loss": 1.7078, "step": 44000 }, { "epoch": 8.71, "eval_COMMENT": { "f1": 0.7251940133037693, "number": 6854, "precision": 0.6905515967273687, "recall": 0.7634957688940764 }, "eval_NAME": { "f1": 0.8152167768922051, "number": 8845, "precision": 0.8151706986208456, "recall": 0.8152628603730921 }, "eval_QTY": { "f1": 0.9865495853369572, "number": 7152, "precision": 0.9834653327775462, "recall": 0.9896532438478747 }, "eval_RANGE_END": { "f1": 0.7899159663865547, "number": 105, "precision": 0.706766917293233, "recall": 0.8952380952380953 }, "eval_UNIT": { "f1": 0.9550831476084348, "number": 5646, "precision": 0.9254152823920265, "recall": 0.9867162592986185 }, "eval_loss": 2.1110451221466064, "eval_overall_accuracy": 0.8313008130081301, "eval_overall_f1": 0.8629231190900369, "eval_overall_precision": 0.8459394102236851, "eval_overall_recall": 0.8806027550520943, "eval_runtime": 11.2874, "eval_samples_per_second": 753.583, "eval_steps_per_second": 23.566, "step": 44000 }, { "epoch": 8.81, "learning_rate": 5.949316966937241e-06, "loss": 1.768, "step": 44500 }, { "epoch": 8.91, "learning_rate": 5.4543654721837265e-06, "loss": 1.7494, "step": 45000 }, { "epoch": 8.91, "eval_COMMENT": { "f1": 0.7275605726872247, "number": 6854, "precision": 0.6886890800104248, "recall": 0.7710825795156113 }, "eval_NAME": { "f1": 0.8160244095378009, "number": 8845, "precision": 0.8156557099288377, "recall": 0.8163934426229508 }, "eval_QTY": { "f1": 0.9865552072448623, "number": 7152, "precision": 0.9830626128002221, "recall": 0.9900727069351231 }, "eval_RANGE_END": { "f1": 0.7899159663865547, "number": 105, "precision": 0.706766917293233, "recall": 0.8952380952380953 }, "eval_UNIT": { "f1": 0.9546817441960078, "number": 5646, "precision": 0.924506387921022, "recall": 0.9868933758413035 }, "eval_loss": 2.1094605922698975, "eval_overall_accuracy": 0.8318896740369273, "eval_overall_f1": 0.8634685085139848, "eval_overall_precision": 0.8448645031783205, "eval_overall_recall": 0.8829102859939865, "eval_runtime": 10.8603, "eval_samples_per_second": 783.222, "eval_steps_per_second": 24.493, "step": 45000 }, { "epoch": 9.01, "learning_rate": 4.959413977430212e-06, "loss": 1.7068, "step": 45500 }, { "epoch": 9.11, "learning_rate": 4.4644624826766974e-06, "loss": 1.6805, "step": 46000 }, { "epoch": 9.11, "eval_COMMENT": { "f1": 0.727134881797505, "number": 6854, "precision": 0.6890920966688439, "recall": 0.7696235774730085 }, "eval_NAME": { "f1": 0.8148566905986773, "number": 8845, "precision": 0.8149027589326097, "recall": 0.8148106274731487 }, "eval_QTY": { "f1": 0.9866963850386571, "number": 7152, "precision": 0.9830673143650243, "recall": 0.9903523489932886 }, "eval_RANGE_END": { "f1": 0.7950819672131149, "number": 105, "precision": 0.697841726618705, "recall": 0.9238095238095239 }, "eval_UNIT": { "f1": 0.9543739279588336, "number": 5646, "precision": 0.9251745926172265, "recall": 0.9854764434998229 }, "eval_loss": 2.113201856613159, "eval_overall_accuracy": 0.8326874857533622, "eval_overall_f1": 0.8630322106091448, "eval_overall_precision": 0.8448939947081087, "eval_overall_recall": 0.8819662960632124, "eval_runtime": 9.5944, "eval_samples_per_second": 886.557, "eval_steps_per_second": 27.724, "step": 46000 }, { "epoch": 9.21, "learning_rate": 3.969510987923184e-06, "loss": 1.7258, "step": 46500 }, { "epoch": 9.31, "learning_rate": 3.4745594931696697e-06, "loss": 1.6867, "step": 47000 }, { "epoch": 9.31, "eval_COMMENT": { "f1": 0.7311783679912154, "number": 6854, "precision": 0.6902941557600104, "recall": 0.7772103880945433 }, "eval_NAME": { "f1": 0.8176065092100803, "number": 8845, "precision": 0.8172370947701344, "recall": 0.817976257772753 }, "eval_QTY": { "f1": 0.9865533337978123, "number": 7152, "precision": 0.9831967782252465, "recall": 0.9899328859060402 }, "eval_RANGE_END": { "f1": 0.7932489451476793, "number": 105, "precision": 0.7121212121212122, "recall": 0.8952380952380953 }, "eval_UNIT": { "f1": 0.9545610425240054, "number": 5646, "precision": 0.925058158856763, "recall": 0.9860077931278781 }, "eval_loss": 2.1125941276550293, "eval_overall_accuracy": 0.8326115036851303, "eval_overall_f1": 0.8647198537327205, "eval_overall_precision": 0.8456602386283881, "eval_overall_recall": 0.8846584154954199, "eval_runtime": 11.2863, "eval_samples_per_second": 753.659, "eval_steps_per_second": 23.568, "step": 47000 }, { "epoch": 9.4, "learning_rate": 2.979607998416155e-06, "loss": 1.6794, "step": 47500 }, { "epoch": 9.5, "learning_rate": 2.484656503662641e-06, "loss": 1.7212, "step": 48000 }, { "epoch": 9.5, "eval_COMMENT": { "f1": 0.7277605779153767, "number": 6854, "precision": 0.6885822158573103, "recall": 0.7716661803326524 }, "eval_NAME": { "f1": 0.8148064424978807, "number": 8845, "precision": 0.8145762711864407, "recall": 0.8150367439231204 }, "eval_QTY": { "f1": 0.9864120967179988, "number": 7152, "precision": 0.98319211001528, "recall": 0.9896532438478747 }, "eval_RANGE_END": { "f1": 0.7901234567901234, "number": 105, "precision": 0.6956521739130435, "recall": 0.9142857142857143 }, "eval_UNIT": { "f1": 0.9545104086353122, "number": 5646, "precision": 0.9243404678944749, "recall": 0.9867162592986185 }, "eval_loss": 2.105802297592163, "eval_overall_accuracy": 0.8318706785198693, "eval_overall_f1": 0.86305280612681, "eval_overall_precision": 0.8443886937614986, "eval_overall_recall": 0.8825606600936997, "eval_runtime": 10.3961, "eval_samples_per_second": 818.189, "eval_steps_per_second": 25.586, "step": 48000 }, { "epoch": 9.6, "learning_rate": 1.989705008909127e-06, "loss": 1.6992, "step": 48500 }, { "epoch": 9.7, "learning_rate": 1.4947535141556129e-06, "loss": 1.6952, "step": 49000 }, { "epoch": 9.7, "eval_COMMENT": { "f1": 0.7261049723756906, "number": 6854, "precision": 0.6893522161028062, "recall": 0.7669973737963233 }, "eval_NAME": { "f1": 0.81525854761232, "number": 8845, "precision": 0.8150282485875706, "recall": 0.8154889768230639 }, "eval_QTY": { "f1": 0.9866276640200585, "number": 7152, "precision": 0.9829308909242298, "recall": 0.9903523489932886 }, "eval_RANGE_END": { "f1": 0.7916666666666667, "number": 105, "precision": 0.7037037037037037, "recall": 0.9047619047619048 }, "eval_UNIT": { "f1": 0.9544792113159023, "number": 5646, "precision": 0.9249044691809271, "recall": 0.9860077931278781 }, "eval_loss": 2.1103529930114746, "eval_overall_accuracy": 0.8311488488716663, "eval_overall_f1": 0.8629658783668163, "eval_overall_precision": 0.8451199892747017, "eval_overall_recall": 0.881581707572897, "eval_runtime": 11.1488, "eval_samples_per_second": 762.95, "eval_steps_per_second": 23.859, "step": 49000 }, { "epoch": 9.8, "learning_rate": 9.998020194020988e-07, "loss": 1.7282, "step": 49500 }, { "epoch": 9.9, "learning_rate": 5.048505246485845e-07, "loss": 1.7128, "step": 50000 }, { "epoch": 9.9, "eval_COMMENT": { "f1": 0.7280375120673009, "number": 6854, "precision": 0.6902458158995816, "recall": 0.7702071782900496 }, "eval_NAME": { "f1": 0.8154846001695395, "number": 8845, "precision": 0.8152542372881356, "recall": 0.8157150932730356 }, "eval_QTY": { "f1": 0.9866276640200585, "number": 7152, "precision": 0.9829308909242298, "recall": 0.9903523489932886 }, "eval_RANGE_END": { "f1": 0.7851239669421487, "number": 105, "precision": 0.6934306569343066, "recall": 0.9047619047619048 }, "eval_UNIT": { "f1": 0.9546351084812623, "number": 5646, "precision": 0.9253532834580216, "recall": 0.9858306765851931 }, "eval_loss": 2.104012966156006, "eval_overall_accuracy": 0.8311298533546083, "eval_overall_f1": 0.8634575250607274, "eval_overall_precision": 0.8453242229367631, "eval_overall_recall": 0.8823858471435564, "eval_runtime": 10.6017, "eval_samples_per_second": 802.322, "eval_steps_per_second": 25.09, "step": 50000 }, { "epoch": 10.0, "learning_rate": 9.899029895070283e-09, "loss": 1.7318, "step": 50500 }, { "epoch": 10.0, "step": 50510, "total_flos": 1554473524185192.0, "train_loss": 2.2027091482279917, "train_runtime": 3516.1179, "train_samples_per_second": 459.606, "train_steps_per_second": 14.365 } ], "logging_steps": 500, "max_steps": 50510, "num_train_epochs": 10, "save_steps": 1000, "total_flos": 1554473524185192.0, "trial_name": null, "trial_params": null }