napsternxg's picture
End of training
25ad7c7
raw
history blame contribute delete
No virus
74.7 kB
{
"best_metric": 2.1034367084503174,
"best_model_checkpoint": "nyt_ingredients-crf-tagger-gte-small-L3-ingredient-v2/checkpoint-40000",
"epoch": 10.0,
"eval_steps": 1000,
"global_step": 50510,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.1,
"learning_rate": 4.9505048505246485e-05,
"loss": 6.8194,
"step": 500
},
{
"epoch": 0.2,
"learning_rate": 4.9010097010492975e-05,
"loss": 4.134,
"step": 1000
},
{
"epoch": 0.2,
"eval_COMMENT": {
"f1": 0.5763258721516435,
"number": 6854,
"precision": 0.5343387760189455,
"recall": 0.6254741756638459
},
"eval_NAME": {
"f1": 0.78330041694097,
"number": 8845,
"precision": 0.7608440797186401,
"recall": 0.8071226681741097
},
"eval_QTY": {
"f1": 0.9729431253451132,
"number": 7152,
"precision": 0.960741548527808,
"recall": 0.9854586129753915
},
"eval_RANGE_END": {
"f1": 0.0,
"number": 105,
"precision": 0.0,
"recall": 0.0
},
"eval_UNIT": {
"f1": 0.9476944253269098,
"number": 5646,
"precision": 0.921378387420542,
"recall": 0.975557917109458
},
"eval_loss": 3.7770841121673584,
"eval_overall_accuracy": 0.7948864068079933,
"eval_overall_f1": 0.8085364620208354,
"eval_overall_precision": 0.7806640625,
"eval_overall_recall": 0.8384728340675477,
"eval_runtime": 11.1289,
"eval_samples_per_second": 764.316,
"eval_steps_per_second": 23.902,
"step": 1000
},
{
"epoch": 0.3,
"learning_rate": 4.851514551573946e-05,
"loss": 3.7402,
"step": 1500
},
{
"epoch": 0.4,
"learning_rate": 4.802019402098595e-05,
"loss": 3.5226,
"step": 2000
},
{
"epoch": 0.4,
"eval_COMMENT": {
"f1": 0.6215112776922562,
"number": 6854,
"precision": 0.5741313218746136,
"recall": 0.6774146483805077
},
"eval_NAME": {
"f1": 0.7914056489724146,
"number": 8845,
"precision": 0.7699133967710895,
"recall": 0.8141322781232334
},
"eval_QTY": {
"f1": 0.9796598403332176,
"number": 7152,
"precision": 0.9728388253136633,
"recall": 0.9865771812080537
},
"eval_RANGE_END": {
"f1": 0.6425339366515838,
"number": 105,
"precision": 0.6120689655172413,
"recall": 0.6761904761904762
},
"eval_UNIT": {
"f1": 0.9472432248746921,
"number": 5646,
"precision": 0.9102040816326531,
"recall": 0.9874247254693589
},
"eval_loss": 3.3654797077178955,
"eval_overall_accuracy": 0.8063976901451257,
"eval_overall_f1": 0.8245767266863746,
"eval_overall_precision": 0.7934958298312537,
"eval_overall_recall": 0.8581917348437172,
"eval_runtime": 11.014,
"eval_samples_per_second": 772.292,
"eval_steps_per_second": 24.151,
"step": 2000
},
{
"epoch": 0.49,
"learning_rate": 4.752524252623243e-05,
"loss": 3.3189,
"step": 2500
},
{
"epoch": 0.59,
"learning_rate": 4.703029103147892e-05,
"loss": 3.1948,
"step": 3000
},
{
"epoch": 0.59,
"eval_COMMENT": {
"f1": 0.6503977349332615,
"number": 6854,
"precision": 0.6045112781954888,
"recall": 0.7038225853516195
},
"eval_NAME": {
"f1": 0.8008250181169521,
"number": 8845,
"precision": 0.7898614471079833,
"recall": 0.8120972300734879
},
"eval_QTY": {
"f1": 0.9830792896098447,
"number": 7152,
"precision": 0.9832167832167832,
"recall": 0.9829418344519015
},
"eval_RANGE_END": {
"f1": 0.7035573122529643,
"number": 105,
"precision": 0.6013513513513513,
"recall": 0.8476190476190476
},
"eval_UNIT": {
"f1": 0.9492858975455399,
"number": 5646,
"precision": 0.9178104845377874,
"recall": 0.9829968119022316
},
"eval_loss": 3.1104416847229004,
"eval_overall_accuracy": 0.8160474128105767,
"eval_overall_f1": 0.8361769539655378,
"eval_overall_precision": 0.8112035241132187,
"eval_overall_recall": 0.8627368715474443,
"eval_runtime": 9.4851,
"eval_samples_per_second": 896.774,
"eval_steps_per_second": 28.044,
"step": 3000
},
{
"epoch": 0.69,
"learning_rate": 4.65353395367254e-05,
"loss": 3.1131,
"step": 3500
},
{
"epoch": 0.79,
"learning_rate": 4.6040388041971886e-05,
"loss": 3.0233,
"step": 4000
},
{
"epoch": 0.79,
"eval_COMMENT": {
"f1": 0.6598611678236015,
"number": 6854,
"precision": 0.6183673469387755,
"recall": 0.7073241902538664
},
"eval_NAME": {
"f1": 0.8091748251748251,
"number": 8845,
"precision": 0.8008859357696567,
"recall": 0.8176370830977954
},
"eval_QTY": {
"f1": 0.9835126449629734,
"number": 7152,
"precision": 0.982826026249651,
"recall": 0.9842002237136466
},
"eval_RANGE_END": {
"f1": 0.5851063829787234,
"number": 105,
"precision": 0.6626506024096386,
"recall": 0.5238095238095238
},
"eval_UNIT": {
"f1": 0.9505612201182417,
"number": 5646,
"precision": 0.9206639004149377,
"recall": 0.9824654622741764
},
"eval_loss": 3.005340576171875,
"eval_overall_accuracy": 0.8174150900387509,
"eval_overall_f1": 0.8416805692690068,
"eval_overall_precision": 0.8202057067020571,
"eval_overall_recall": 0.8643101880987344,
"eval_runtime": 11.0513,
"eval_samples_per_second": 769.68,
"eval_steps_per_second": 24.069,
"step": 4000
},
{
"epoch": 0.89,
"learning_rate": 4.5545436547218376e-05,
"loss": 2.9721,
"step": 4500
},
{
"epoch": 0.99,
"learning_rate": 4.505048505246486e-05,
"loss": 2.9567,
"step": 5000
},
{
"epoch": 0.99,
"eval_COMMENT": {
"f1": 0.677434679334917,
"number": 6854,
"precision": 0.633295267098084,
"recall": 0.7281879194630873
},
"eval_NAME": {
"f1": 0.8113767426235933,
"number": 8845,
"precision": 0.8036823425022183,
"recall": 0.8192198982475976
},
"eval_QTY": {
"f1": 0.9826323498639883,
"number": 7152,
"precision": 0.9803757828810021,
"recall": 0.9848993288590604
},
"eval_RANGE_END": {
"f1": 0.6288659793814434,
"number": 105,
"precision": 0.6853932584269663,
"recall": 0.580952380952381
},
"eval_UNIT": {
"f1": 0.9479768786127167,
"number": 5646,
"precision": 0.9114089571755476,
"recall": 0.9876018420120439
},
"eval_loss": 2.910010814666748,
"eval_overall_accuracy": 0.8215941037915052,
"eval_overall_f1": 0.8462413611587509,
"eval_overall_precision": 0.8226748984779954,
"eval_overall_recall": 0.8711978183343823,
"eval_runtime": 11.1963,
"eval_samples_per_second": 759.713,
"eval_steps_per_second": 23.758,
"step": 5000
},
{
"epoch": 1.09,
"learning_rate": 4.455553355771135e-05,
"loss": 2.794,
"step": 5500
},
{
"epoch": 1.19,
"learning_rate": 4.406058206295783e-05,
"loss": 2.738,
"step": 6000
},
{
"epoch": 1.19,
"eval_COMMENT": {
"f1": 0.6844883595018949,
"number": 6854,
"precision": 0.6383489017924766,
"recall": 0.7378173329442661
},
"eval_NAME": {
"f1": 0.809906216656371,
"number": 8845,
"precision": 0.8046195045748716,
"recall": 0.8152628603730921
},
"eval_QTY": {
"f1": 0.9817170663885992,
"number": 7152,
"precision": 0.9762201023088621,
"recall": 0.9872762863534675
},
"eval_RANGE_END": {
"f1": 0.7286821705426357,
"number": 105,
"precision": 0.6143790849673203,
"recall": 0.8952380952380953
},
"eval_UNIT": {
"f1": 0.9514546393527284,
"number": 5646,
"precision": 0.9254855994641661,
"recall": 0.9789231314204747
},
"eval_loss": 2.8514182567596436,
"eval_overall_accuracy": 0.8213471620697516,
"eval_overall_f1": 0.8480048942967846,
"eval_overall_precision": 0.8250115733086436,
"eval_overall_recall": 0.8723166212152996,
"eval_runtime": 8.7005,
"eval_samples_per_second": 977.64,
"eval_steps_per_second": 30.573,
"step": 6000
},
{
"epoch": 1.29,
"learning_rate": 4.356563056820432e-05,
"loss": 2.7896,
"step": 6500
},
{
"epoch": 1.39,
"learning_rate": 4.3070679073450804e-05,
"loss": 2.8132,
"step": 7000
},
{
"epoch": 1.39,
"eval_COMMENT": {
"f1": 0.680542242913871,
"number": 6854,
"precision": 0.641124871001032,
"recall": 0.7251240151736212
},
"eval_NAME": {
"f1": 0.8072829131652661,
"number": 8845,
"precision": 0.8001110494169905,
"recall": 0.814584511023177
},
"eval_QTY": {
"f1": 0.9839452743263996,
"number": 7152,
"precision": 0.9824365765263451,
"recall": 0.9854586129753915
},
"eval_RANGE_END": {
"f1": 0.7421875,
"number": 105,
"precision": 0.6291390728476821,
"recall": 0.9047619047619048
},
"eval_UNIT": {
"f1": 0.9518423307626392,
"number": 5646,
"precision": 0.9219787516600265,
"recall": 0.983705278072972
},
"eval_loss": 2.776045322418213,
"eval_overall_accuracy": 0.8222589468885343,
"eval_overall_f1": 0.8473121210056551,
"eval_overall_precision": 0.8261476117717399,
"eval_overall_recall": 0.8695895391930635,
"eval_runtime": 11.1273,
"eval_samples_per_second": 764.429,
"eval_steps_per_second": 23.905,
"step": 7000
},
{
"epoch": 1.48,
"learning_rate": 4.257572757869729e-05,
"loss": 2.7089,
"step": 7500
},
{
"epoch": 1.58,
"learning_rate": 4.208077608394378e-05,
"loss": 2.6976,
"step": 8000
},
{
"epoch": 1.58,
"eval_COMMENT": {
"f1": 0.6947368421052631,
"number": 6854,
"precision": 0.6535493827160493,
"recall": 0.7414648380507732
},
"eval_NAME": {
"f1": 0.8145306859205775,
"number": 8845,
"precision": 0.8127884723629405,
"recall": 0.8162803843979649
},
"eval_QTY": {
"f1": 0.9840759882665177,
"number": 7152,
"precision": 0.9831147083449623,
"recall": 0.9850391498881432
},
"eval_RANGE_END": {
"f1": 0.75098814229249,
"number": 105,
"precision": 0.6418918918918919,
"recall": 0.9047619047619048
},
"eval_UNIT": {
"f1": 0.9538461538461539,
"number": 5646,
"precision": 0.926531975288028,
"recall": 0.9828196953595466
},
"eval_loss": 2.707292318344116,
"eval_overall_accuracy": 0.826172023402477,
"eval_overall_f1": 0.8534594631514241,
"eval_overall_precision": 0.8340898471397103,
"eval_overall_recall": 0.8737500874064751,
"eval_runtime": 10.8076,
"eval_samples_per_second": 787.041,
"eval_steps_per_second": 24.612,
"step": 8000
},
{
"epoch": 1.68,
"learning_rate": 4.158582458919026e-05,
"loss": 2.6869,
"step": 8500
},
{
"epoch": 1.78,
"learning_rate": 4.109087309443675e-05,
"loss": 2.6347,
"step": 9000
},
{
"epoch": 1.78,
"eval_COMMENT": {
"f1": 0.6949685534591195,
"number": 6854,
"precision": 0.6538461538461539,
"recall": 0.7416107382550335
},
"eval_NAME": {
"f1": 0.8143807055111011,
"number": 8845,
"precision": 0.8118188967531738,
"recall": 0.8169587337478802
},
"eval_QTY": {
"f1": 0.9832394464149107,
"number": 7152,
"precision": 0.9781375397813754,
"recall": 0.9883948545861297
},
"eval_RANGE_END": {
"f1": 0.7588932806324111,
"number": 105,
"precision": 0.6486486486486487,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9523400601116359,
"number": 5646,
"precision": 0.92432072012002,
"recall": 0.9821112291888062
},
"eval_loss": 2.6447880268096924,
"eval_overall_accuracy": 0.8236836106678824,
"eval_overall_f1": 0.8531482839167277,
"eval_overall_precision": 0.832606742320876,
"eval_overall_recall": 0.8747290399272778,
"eval_runtime": 10.4718,
"eval_samples_per_second": 812.274,
"eval_steps_per_second": 25.401,
"step": 9000
},
{
"epoch": 1.88,
"learning_rate": 4.059592159968323e-05,
"loss": 2.5569,
"step": 9500
},
{
"epoch": 1.98,
"learning_rate": 4.010097010492972e-05,
"loss": 2.5847,
"step": 10000
},
{
"epoch": 1.98,
"eval_COMMENT": {
"f1": 0.6963045290358433,
"number": 6854,
"precision": 0.6645452134712277,
"recall": 0.7312518237525533
},
"eval_NAME": {
"f1": 0.8156796390298928,
"number": 8845,
"precision": 0.8138435565559933,
"recall": 0.8175240248728095
},
"eval_QTY": {
"f1": 0.9831476323119777,
"number": 7152,
"precision": 0.9793285238623751,
"recall": 0.986996644295302
},
"eval_RANGE_END": {
"f1": 0.7639484978540773,
"number": 105,
"precision": 0.6953125,
"recall": 0.8476190476190476
},
"eval_UNIT": {
"f1": 0.9530017152658663,
"number": 5646,
"precision": 0.9238443631526438,
"recall": 0.9840595111583422
},
"eval_loss": 2.591038227081299,
"eval_overall_accuracy": 0.8253172251348682,
"eval_overall_f1": 0.8546566402302197,
"eval_overall_precision": 0.8377942707458776,
"eval_overall_recall": 0.8722117334452136,
"eval_runtime": 10.9908,
"eval_samples_per_second": 773.919,
"eval_steps_per_second": 24.202,
"step": 10000
},
{
"epoch": 2.08,
"learning_rate": 3.9606018610176205e-05,
"loss": 2.5001,
"step": 10500
},
{
"epoch": 2.18,
"learning_rate": 3.911106711542269e-05,
"loss": 2.4321,
"step": 11000
},
{
"epoch": 2.18,
"eval_COMMENT": {
"f1": 0.7009998630324613,
"number": 6854,
"precision": 0.660557563242127,
"recall": 0.7467172454041435
},
"eval_NAME": {
"f1": 0.8124085125548924,
"number": 8845,
"precision": 0.8091286307053942,
"recall": 0.8157150932730356
},
"eval_QTY": {
"f1": 0.9833752444816989,
"number": 7152,
"precision": 0.9825516471245115,
"recall": 0.9842002237136466
},
"eval_RANGE_END": {
"f1": 0.7404580152671757,
"number": 105,
"precision": 0.6178343949044586,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9521690767519465,
"number": 5646,
"precision": 0.9210395629862606,
"recall": 0.9854764434998229
},
"eval_loss": 2.5731780529022217,
"eval_overall_accuracy": 0.8255071803054479,
"eval_overall_f1": 0.8539459994200822,
"eval_overall_precision": 0.8336830186165785,
"eval_overall_recall": 0.8752185161876792,
"eval_runtime": 9.4187,
"eval_samples_per_second": 903.101,
"eval_steps_per_second": 28.242,
"step": 11000
},
{
"epoch": 2.28,
"learning_rate": 3.861611562066917e-05,
"loss": 2.5117,
"step": 11500
},
{
"epoch": 2.38,
"learning_rate": 3.812116412591566e-05,
"loss": 2.4326,
"step": 12000
},
{
"epoch": 2.38,
"eval_COMMENT": {
"f1": 0.7086570477247504,
"number": 6854,
"precision": 0.6754826765405977,
"recall": 0.7452582433615407
},
"eval_NAME": {
"f1": 0.8158534516876803,
"number": 8845,
"precision": 0.8159918570459173,
"recall": 0.8157150932730356
},
"eval_QTY": {
"f1": 0.9844993715961456,
"number": 7152,
"precision": 0.9832635983263598,
"recall": 0.985738255033557
},
"eval_RANGE_END": {
"f1": 0.7654320987654321,
"number": 105,
"precision": 0.6739130434782609,
"recall": 0.8857142857142857
},
"eval_UNIT": {
"f1": 0.9534265374388883,
"number": 5646,
"precision": 0.9243306169965075,
"recall": 0.9844137442437123
},
"eval_loss": 2.5278468132019043,
"eval_overall_accuracy": 0.8280525795912165,
"eval_overall_f1": 0.8580588749635675,
"eval_overall_precision": 0.8418502943650126,
"eval_overall_recall": 0.8749038528774211,
"eval_runtime": 11.4233,
"eval_samples_per_second": 744.616,
"eval_steps_per_second": 23.286,
"step": 12000
},
{
"epoch": 2.47,
"learning_rate": 3.762621263116215e-05,
"loss": 2.3983,
"step": 12500
},
{
"epoch": 2.57,
"learning_rate": 3.7131261136408633e-05,
"loss": 2.3705,
"step": 13000
},
{
"epoch": 2.57,
"eval_COMMENT": {
"f1": 0.7056559686619477,
"number": 6854,
"precision": 0.6670131219955827,
"recall": 0.7490516486723081
},
"eval_NAME": {
"f1": 0.8140058545372664,
"number": 8845,
"precision": 0.8106289942818702,
"recall": 0.8174109666478236
},
"eval_QTY": {
"f1": 0.9845080251221213,
"number": 7152,
"precision": 0.9827249930342714,
"recall": 0.9862975391498882
},
"eval_RANGE_END": {
"f1": 0.7415730337078652,
"number": 105,
"precision": 0.6111111111111112,
"recall": 0.9428571428571428
},
"eval_UNIT": {
"f1": 0.952819725279413,
"number": 5646,
"precision": 0.9191769547325103,
"recall": 0.9890187743535246
},
"eval_loss": 2.4818899631500244,
"eval_overall_accuracy": 0.8270458171871439,
"eval_overall_f1": 0.8562072552999164,
"eval_overall_precision": 0.8358363024874297,
"eval_overall_recall": 0.8775959723096287,
"eval_runtime": 9.7776,
"eval_samples_per_second": 869.945,
"eval_steps_per_second": 27.205,
"step": 13000
},
{
"epoch": 2.67,
"learning_rate": 3.663630964165512e-05,
"loss": 2.4183,
"step": 13500
},
{
"epoch": 2.77,
"learning_rate": 3.6141358146901606e-05,
"loss": 2.364,
"step": 14000
},
{
"epoch": 2.77,
"eval_COMMENT": {
"f1": 0.7068350260774088,
"number": 6854,
"precision": 0.6672713138118683,
"recall": 0.7513860519404727
},
"eval_NAME": {
"f1": 0.8130456824198727,
"number": 8845,
"precision": 0.8101706331387517,
"recall": 0.8159412097230073
},
"eval_QTY": {
"f1": 0.9847269684078387,
"number": 7152,
"precision": 0.9823292055099485,
"recall": 0.9871364653243848
},
"eval_RANGE_END": {
"f1": 0.7729083665338645,
"number": 105,
"precision": 0.6643835616438356,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9542999228328902,
"number": 5646,
"precision": 0.9248795080604952,
"recall": 0.9856535600425079
},
"eval_loss": 2.4206130504608154,
"eval_overall_accuracy": 0.8284704809664919,
"eval_overall_f1": 0.8566014544709617,
"eval_overall_precision": 0.8369695756605284,
"eval_overall_recall": 0.8771764212292846,
"eval_runtime": 10.6958,
"eval_samples_per_second": 795.265,
"eval_steps_per_second": 24.87,
"step": 14000
},
{
"epoch": 2.87,
"learning_rate": 3.564640665214809e-05,
"loss": 2.3089,
"step": 14500
},
{
"epoch": 2.97,
"learning_rate": 3.515145515739457e-05,
"loss": 2.3349,
"step": 15000
},
{
"epoch": 2.97,
"eval_COMMENT": {
"f1": 0.7115305703734099,
"number": 6854,
"precision": 0.6696704428424305,
"recall": 0.7589728625620076
},
"eval_NAME": {
"f1": 0.8152284263959392,
"number": 8845,
"precision": 0.8133933595948227,
"recall": 0.8170717919728661
},
"eval_QTY": {
"f1": 0.9854223338215806,
"number": 7152,
"precision": 0.9831593597773138,
"recall": 0.9876957494407159
},
"eval_RANGE_END": {
"f1": 0.7320754716981133,
"number": 105,
"precision": 0.60625,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.954592186429061,
"number": 5646,
"precision": 0.9244938599402589,
"recall": 0.9867162592986185
},
"eval_loss": 2.390350103378296,
"eval_overall_accuracy": 0.8285084720006078,
"eval_overall_f1": 0.8583563606590933,
"eval_overall_precision": 0.8380295763389288,
"eval_overall_recall": 0.8796937277113489,
"eval_runtime": 13.4662,
"eval_samples_per_second": 631.657,
"eval_steps_per_second": 19.753,
"step": 15000
},
{
"epoch": 3.07,
"learning_rate": 3.465650366264107e-05,
"loss": 2.251,
"step": 15500
},
{
"epoch": 3.17,
"learning_rate": 3.416155216788755e-05,
"loss": 2.253,
"step": 16000
},
{
"epoch": 3.17,
"eval_COMMENT": {
"f1": 0.7120891136472357,
"number": 6854,
"precision": 0.669751896130608,
"recall": 0.7601400641960899
},
"eval_NAME": {
"f1": 0.8165914221218961,
"number": 8845,
"precision": 0.8152112676056338,
"recall": 0.817976257772753
},
"eval_QTY": {
"f1": 0.9850704618389843,
"number": 7152,
"precision": 0.9830130882762461,
"recall": 0.9871364653243848
},
"eval_RANGE_END": {
"f1": 0.7529411764705883,
"number": 105,
"precision": 0.64,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9538013199622868,
"number": 5646,
"precision": 0.924098986879256,
"recall": 0.9854764434998229
},
"eval_loss": 2.3770651817321777,
"eval_overall_accuracy": 0.8302180685358256,
"eval_overall_f1": 0.8587418314593322,
"eval_overall_precision": 0.8386376512147166,
"eval_overall_recall": 0.8798335780714636,
"eval_runtime": 11.0556,
"eval_samples_per_second": 769.382,
"eval_steps_per_second": 24.06,
"step": 16000
},
{
"epoch": 3.27,
"learning_rate": 3.3666600673134034e-05,
"loss": 2.1955,
"step": 16500
},
{
"epoch": 3.37,
"learning_rate": 3.317164917838052e-05,
"loss": 2.2137,
"step": 17000
},
{
"epoch": 3.37,
"eval_COMMENT": {
"f1": 0.7152373022481265,
"number": 6854,
"precision": 0.6819264355649642,
"recall": 0.7519696527575138
},
"eval_NAME": {
"f1": 0.816918906708832,
"number": 8845,
"precision": 0.8160893602617624,
"recall": 0.8177501413227812
},
"eval_QTY": {
"f1": 0.9852099902330124,
"number": 7152,
"precision": 0.9831523252575884,
"recall": 0.9872762863534675
},
"eval_RANGE_END": {
"f1": 0.7619047619047618,
"number": 105,
"precision": 0.6530612244897959,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9529855868222373,
"number": 5646,
"precision": 0.924126455906822,
"recall": 0.983705278072972
},
"eval_loss": 2.378207206726074,
"eval_overall_accuracy": 0.8285464630347238,
"eval_overall_f1": 0.8600801891641822,
"eval_overall_precision": 0.8433467741935484,
"eval_overall_recall": 0.8774910845395427,
"eval_runtime": 10.7102,
"eval_samples_per_second": 794.197,
"eval_steps_per_second": 24.836,
"step": 17000
},
{
"epoch": 3.46,
"learning_rate": 3.267669768362701e-05,
"loss": 2.2027,
"step": 17500
},
{
"epoch": 3.56,
"learning_rate": 3.218174618887349e-05,
"loss": 2.2065,
"step": 18000
},
{
"epoch": 3.56,
"eval_COMMENT": {
"f1": 0.715327462850853,
"number": 6854,
"precision": 0.6767768810205675,
"recall": 0.7585351619492268
},
"eval_NAME": {
"f1": 0.8111738148984199,
"number": 8845,
"precision": 0.8098028169014084,
"recall": 0.8125494629734313
},
"eval_QTY": {
"f1": 0.9852766729467587,
"number": 7152,
"precision": 0.9834238751915308,
"recall": 0.9871364653243848
},
"eval_RANGE_END": {
"f1": 0.751937984496124,
"number": 105,
"precision": 0.6339869281045751,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9542920847268673,
"number": 5646,
"precision": 0.9250207813798836,
"recall": 0.9854764434998229
},
"eval_loss": 2.3392648696899414,
"eval_overall_accuracy": 0.829154319580579,
"eval_overall_f1": 0.8582709465695826,
"eval_overall_precision": 0.8395866773675762,
"eval_overall_recall": 0.8778057478498007,
"eval_runtime": 10.643,
"eval_samples_per_second": 799.209,
"eval_steps_per_second": 24.993,
"step": 18000
},
{
"epoch": 3.66,
"learning_rate": 3.168679469411997e-05,
"loss": 2.17,
"step": 18500
},
{
"epoch": 3.76,
"learning_rate": 3.119184319936647e-05,
"loss": 2.1758,
"step": 19000
},
{
"epoch": 3.76,
"eval_COMMENT": {
"f1": 0.7196268093572066,
"number": 6854,
"precision": 0.6791402304803833,
"recall": 0.7652465713451999
},
"eval_NAME": {
"f1": 0.8154011420817548,
"number": 8845,
"precision": 0.8155394707079846,
"recall": 0.8152628603730921
},
"eval_QTY": {
"f1": 0.9850017439832579,
"number": 7152,
"precision": 0.9828762355561743,
"recall": 0.9871364653243848
},
"eval_RANGE_END": {
"f1": 0.7637795275590552,
"number": 105,
"precision": 0.6510067114093959,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9544714052988081,
"number": 5646,
"precision": 0.9250457038391224,
"recall": 0.9858306765851931
},
"eval_loss": 2.306312322616577,
"eval_overall_accuracy": 0.827710660284173,
"eval_overall_f1": 0.8605851391072529,
"eval_overall_precision": 0.8417129103429832,
"eval_overall_recall": 0.8803230543318649,
"eval_runtime": 11.977,
"eval_samples_per_second": 710.192,
"eval_steps_per_second": 22.209,
"step": 19000
},
{
"epoch": 3.86,
"learning_rate": 3.069689170461295e-05,
"loss": 2.2238,
"step": 19500
},
{
"epoch": 3.96,
"learning_rate": 3.0201940209859435e-05,
"loss": 2.1417,
"step": 20000
},
{
"epoch": 3.96,
"eval_COMMENT": {
"f1": 0.7152720243026789,
"number": 6854,
"precision": 0.6788990825688074,
"recall": 0.7557630580682813
},
"eval_NAME": {
"f1": 0.815481242573417,
"number": 8845,
"precision": 0.8162664250113276,
"recall": 0.8146975692481628
},
"eval_QTY": {
"f1": 0.9854263998326477,
"number": 7152,
"precision": 0.9828905271943247,
"recall": 0.9879753914988815
},
"eval_RANGE_END": {
"f1": 0.7634854771784232,
"number": 105,
"precision": 0.6764705882352942,
"recall": 0.8761904761904762
},
"eval_UNIT": {
"f1": 0.9533384893013664,
"number": 5646,
"precision": 0.9258888332498748,
"recall": 0.9824654622741764
},
"eval_loss": 2.288215398788452,
"eval_overall_accuracy": 0.8285084720006078,
"eval_overall_f1": 0.8596340962039195,
"eval_overall_precision": 0.8427151205749983,
"eval_overall_recall": 0.877246346409342,
"eval_runtime": 9.5122,
"eval_samples_per_second": 894.221,
"eval_steps_per_second": 27.964,
"step": 20000
},
{
"epoch": 4.06,
"learning_rate": 2.970698871510592e-05,
"loss": 2.1114,
"step": 20500
},
{
"epoch": 4.16,
"learning_rate": 2.9212037220352405e-05,
"loss": 2.0271,
"step": 21000
},
{
"epoch": 4.16,
"eval_COMMENT": {
"f1": 0.7168075752451809,
"number": 6854,
"precision": 0.6681376875551632,
"recall": 0.7731251823752553
},
"eval_NAME": {
"f1": 0.8170380818053596,
"number": 8845,
"precision": 0.815427927927928,
"recall": 0.8186546071226681
},
"eval_QTY": {
"f1": 0.9858546442756603,
"number": 7152,
"precision": 0.9826364772885123,
"recall": 0.9890939597315436
},
"eval_RANGE_END": {
"f1": 0.7717842323651452,
"number": 105,
"precision": 0.6838235294117647,
"recall": 0.8857142857142857
},
"eval_UNIT": {
"f1": 0.9534565366187543,
"number": 5646,
"precision": 0.922211188348229,
"recall": 0.9868933758413035
},
"eval_loss": 2.350003242492676,
"eval_overall_accuracy": 0.82989514474584,
"eval_overall_f1": 0.859976186426263,
"eval_overall_precision": 0.837385716178614,
"eval_overall_recall": 0.8838193133347318,
"eval_runtime": 11.0178,
"eval_samples_per_second": 772.02,
"eval_steps_per_second": 24.143,
"step": 21000
},
{
"epoch": 4.26,
"learning_rate": 2.871708572559889e-05,
"loss": 2.0589,
"step": 21500
},
{
"epoch": 4.36,
"learning_rate": 2.8222134230845377e-05,
"loss": 2.0488,
"step": 22000
},
{
"epoch": 4.36,
"eval_COMMENT": {
"f1": 0.7173793103448276,
"number": 6854,
"precision": 0.6802249542244311,
"recall": 0.7588269623577473
},
"eval_NAME": {
"f1": 0.814222122048797,
"number": 8845,
"precision": 0.8116153673331835,
"recall": 0.8168456755228943
},
"eval_QTY": {
"f1": 0.9854284319877291,
"number": 7152,
"precision": 0.9827562230565985,
"recall": 0.9881152125279642
},
"eval_RANGE_END": {
"f1": 0.7686274509803921,
"number": 105,
"precision": 0.6533333333333333,
"recall": 0.9333333333333333
},
"eval_UNIT": {
"f1": 0.9529190207156308,
"number": 5646,
"precision": 0.9221338634857521,
"recall": 0.9858306765851931
},
"eval_loss": 2.2779643535614014,
"eval_overall_accuracy": 0.8274067320112454,
"eval_overall_f1": 0.8596716045585798,
"eval_overall_precision": 0.8406683375104428,
"eval_overall_recall": 0.8795538773512341,
"eval_runtime": 10.9882,
"eval_samples_per_second": 774.104,
"eval_steps_per_second": 24.208,
"step": 22000
},
{
"epoch": 4.45,
"learning_rate": 2.7727182736091867e-05,
"loss": 2.0377,
"step": 22500
},
{
"epoch": 4.55,
"learning_rate": 2.7232231241338353e-05,
"loss": 2.0403,
"step": 23000
},
{
"epoch": 4.55,
"eval_COMMENT": {
"f1": 0.7213069552629764,
"number": 6854,
"precision": 0.6836534692277538,
"recall": 0.7633498686898161
},
"eval_NAME": {
"f1": 0.8175446529504862,
"number": 8845,
"precision": 0.8174522436984288,
"recall": 0.8176370830977954
},
"eval_QTY": {
"f1": 0.9858447806986962,
"number": 7152,
"precision": 0.9833078314090973,
"recall": 0.9883948545861297
},
"eval_RANGE_END": {
"f1": 0.7868852459016393,
"number": 105,
"precision": 0.6906474820143885,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9541991267870901,
"number": 5646,
"precision": 0.9234465617232809,
"recall": 0.9870704923839887
},
"eval_loss": 2.255697250366211,
"eval_overall_accuracy": 0.8292303016488108,
"eval_overall_f1": 0.8621226374754127,
"eval_overall_precision": 0.8439205706057663,
"eval_overall_recall": 0.8811271939025243,
"eval_runtime": 11.1445,
"eval_samples_per_second": 763.249,
"eval_steps_per_second": 23.868,
"step": 23000
},
{
"epoch": 4.65,
"learning_rate": 2.6737279746584836e-05,
"loss": 2.0887,
"step": 23500
},
{
"epoch": 4.75,
"learning_rate": 2.6242328251831323e-05,
"loss": 2.0443,
"step": 24000
},
{
"epoch": 4.75,
"eval_COMMENT": {
"f1": 0.7226055754899255,
"number": 6854,
"precision": 0.6855197695731867,
"recall": 0.7639334695068573
},
"eval_NAME": {
"f1": 0.8165780843605112,
"number": 8845,
"precision": 0.8167628096369189,
"recall": 0.8163934426229508
},
"eval_QTY": {
"f1": 0.9852161785216179,
"number": 7152,
"precision": 0.9827490261547023,
"recall": 0.9876957494407159
},
"eval_RANGE_END": {
"f1": 0.7854251012145749,
"number": 105,
"precision": 0.6830985915492958,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9537354352296092,
"number": 5646,
"precision": 0.9236641221374046,
"recall": 0.9858306765851931
},
"eval_loss": 2.228408098220825,
"eval_overall_accuracy": 0.829097333029405,
"eval_overall_f1": 0.8619196741790305,
"eval_overall_precision": 0.8441092676386794,
"eval_overall_recall": 0.8804978672820083,
"eval_runtime": 10.5005,
"eval_samples_per_second": 810.058,
"eval_steps_per_second": 25.332,
"step": 24000
},
{
"epoch": 4.85,
"learning_rate": 2.5747376757077806e-05,
"loss": 2.068,
"step": 24500
},
{
"epoch": 4.95,
"learning_rate": 2.5252425262324292e-05,
"loss": 2.0214,
"step": 25000
},
{
"epoch": 4.95,
"eval_COMMENT": {
"f1": 0.7221103783408538,
"number": 6854,
"precision": 0.6887829426566018,
"recall": 0.7588269623577473
},
"eval_NAME": {
"f1": 0.8139863300005649,
"number": 8845,
"precision": 0.8133890268683676,
"recall": 0.814584511023177
},
"eval_QTY": {
"f1": 0.9864751812604574,
"number": 7152,
"precision": 0.9837319243604005,
"recall": 0.9892337807606264
},
"eval_RANGE_END": {
"f1": 0.7713004484304932,
"number": 105,
"precision": 0.7288135593220338,
"recall": 0.819047619047619
},
"eval_UNIT": {
"f1": 0.9553288176283975,
"number": 5646,
"precision": 0.9258766827322586,
"recall": 0.9867162592986185
},
"eval_loss": 2.2036967277526855,
"eval_overall_accuracy": 0.8304270192234633,
"eval_overall_f1": 0.8618053412869828,
"eval_overall_precision": 0.8453726123217649,
"eval_overall_recall": 0.8788895881406895,
"eval_runtime": 10.7118,
"eval_samples_per_second": 794.075,
"eval_steps_per_second": 24.832,
"step": 25000
},
{
"epoch": 5.05,
"learning_rate": 2.4757473767570778e-05,
"loss": 2.0164,
"step": 25500
},
{
"epoch": 5.15,
"learning_rate": 2.4262522272817265e-05,
"loss": 2.0081,
"step": 26000
},
{
"epoch": 5.15,
"eval_COMMENT": {
"f1": 0.719671201814059,
"number": 6854,
"precision": 0.6996417745935519,
"recall": 0.7408812372337321
},
"eval_NAME": {
"f1": 0.8098846414838272,
"number": 8845,
"precision": 0.8101595203077271,
"recall": 0.8096099491237988
},
"eval_QTY": {
"f1": 0.9862001672706997,
"number": 7152,
"precision": 0.9831851028349082,
"recall": 0.9892337807606264
},
"eval_RANGE_END": {
"f1": 0.7918367346938776,
"number": 105,
"precision": 0.6928571428571428,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9546235819869371,
"number": 5646,
"precision": 0.927212020033389,
"recall": 0.983705278072972
},
"eval_loss": 2.2013936042785645,
"eval_overall_accuracy": 0.8273117544259555,
"eval_overall_f1": 0.8604911676001723,
"eval_overall_precision": 0.8484858783944533,
"eval_overall_recall": 0.8728410600657297,
"eval_runtime": 11.2303,
"eval_samples_per_second": 757.413,
"eval_steps_per_second": 23.686,
"step": 26000
},
{
"epoch": 5.25,
"learning_rate": 2.376757077806375e-05,
"loss": 1.9905,
"step": 26500
},
{
"epoch": 5.35,
"learning_rate": 2.3272619283310237e-05,
"loss": 1.9138,
"step": 27000
},
{
"epoch": 5.35,
"eval_COMMENT": {
"f1": 0.7232730263157895,
"number": 6854,
"precision": 0.6819591625743086,
"recall": 0.7699153778815291
},
"eval_NAME": {
"f1": 0.8175660419959357,
"number": 8845,
"precision": 0.8163679404802164,
"recall": 0.818767665347654
},
"eval_QTY": {
"f1": 0.9861333704968295,
"number": 7152,
"precision": 0.9829142936518961,
"recall": 0.9893736017897091
},
"eval_RANGE_END": {
"f1": 0.7679324894514767,
"number": 105,
"precision": 0.6893939393939394,
"recall": 0.8666666666666667
},
"eval_UNIT": {
"f1": 0.9538567493112948,
"number": 5646,
"precision": 0.9279731993299832,
"recall": 0.9812256464753808
},
"eval_loss": 2.1838574409484863,
"eval_overall_accuracy": 0.8322695843780867,
"eval_overall_f1": 0.8622504785343178,
"eval_overall_precision": 0.8433968572383818,
"eval_overall_recall": 0.8819662960632124,
"eval_runtime": 10.2972,
"eval_samples_per_second": 826.053,
"eval_steps_per_second": 25.832,
"step": 27000
},
{
"epoch": 5.44,
"learning_rate": 2.2777667788556724e-05,
"loss": 1.9236,
"step": 27500
},
{
"epoch": 5.54,
"learning_rate": 2.2282716293803206e-05,
"loss": 1.9304,
"step": 28000
},
{
"epoch": 5.54,
"eval_COMMENT": {
"f1": 0.7215675336447948,
"number": 6854,
"precision": 0.6910645118204889,
"recall": 0.7548876568427196
},
"eval_NAME": {
"f1": 0.8127016471387332,
"number": 8845,
"precision": 0.8137610519156654,
"recall": 0.8116449971735443
},
"eval_QTY": {
"f1": 0.9857760423929716,
"number": 7152,
"precision": 0.9831710709318497,
"recall": 0.9883948545861297
},
"eval_RANGE_END": {
"f1": 0.776,
"number": 105,
"precision": 0.6689655172413793,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9539864109400533,
"number": 5646,
"precision": 0.9272696873432537,
"recall": 0.9822883457314914
},
"eval_loss": 2.1557235717773438,
"eval_overall_accuracy": 0.8287364182053035,
"eval_overall_f1": 0.860940800659488,
"eval_overall_precision": 0.8460759493670886,
"eval_overall_recall": 0.8763373190685966,
"eval_runtime": 11.4111,
"eval_samples_per_second": 745.412,
"eval_steps_per_second": 23.311,
"step": 28000
},
{
"epoch": 5.64,
"learning_rate": 2.1787764799049696e-05,
"loss": 1.908,
"step": 28500
},
{
"epoch": 5.74,
"learning_rate": 2.129281330429618e-05,
"loss": 1.9369,
"step": 29000
},
{
"epoch": 5.74,
"eval_COMMENT": {
"f1": 0.7214330697641872,
"number": 6854,
"precision": 0.6931558424095737,
"recall": 0.7521155529617741
},
"eval_NAME": {
"f1": 0.8120292235374073,
"number": 8845,
"precision": 0.8135497049477984,
"recall": 0.8105144149236857
},
"eval_QTY": {
"f1": 0.9862020905923344,
"number": 7152,
"precision": 0.9830508474576272,
"recall": 0.9893736017897091
},
"eval_RANGE_END": {
"f1": 0.7841409691629957,
"number": 105,
"precision": 0.7295081967213115,
"recall": 0.8476190476190476
},
"eval_UNIT": {
"f1": 0.9530419880034275,
"number": 5646,
"precision": 0.923140770252324,
"recall": 0.9849450938717677
},
"eval_loss": 2.152221918106079,
"eval_overall_accuracy": 0.8286794316541296,
"eval_overall_f1": 0.8608987026376836,
"eval_overall_precision": 0.8464839658027237,
"eval_overall_recall": 0.8758128802181666,
"eval_runtime": 8.8394,
"eval_samples_per_second": 962.281,
"eval_steps_per_second": 30.093,
"step": 29000
},
{
"epoch": 5.84,
"learning_rate": 2.0797861809542665e-05,
"loss": 1.9176,
"step": 29500
},
{
"epoch": 5.94,
"learning_rate": 2.0302910314789152e-05,
"loss": 1.8944,
"step": 30000
},
{
"epoch": 5.94,
"eval_COMMENT": {
"f1": 0.723598615916955,
"number": 6854,
"precision": 0.6882569773565034,
"recall": 0.762766267872775
},
"eval_NAME": {
"f1": 0.8156853881794554,
"number": 8845,
"precision": 0.8153168417485598,
"recall": 0.8160542679479932
},
"eval_QTY": {
"f1": 0.9857272157627236,
"number": 7152,
"precision": 0.9816946331992789,
"recall": 0.9897930648769575
},
"eval_RANGE_END": {
"f1": 0.7631578947368421,
"number": 105,
"precision": 0.7073170731707317,
"recall": 0.8285714285714286
},
"eval_UNIT": {
"f1": 0.9549935705100728,
"number": 5646,
"precision": 0.9254028908456554,
"recall": 0.9865391427559334
},
"eval_loss": 2.128391742706299,
"eval_overall_accuracy": 0.8317377099004635,
"eval_overall_f1": 0.8623381960139715,
"eval_overall_precision": 0.8449768471914637,
"eval_overall_recall": 0.880427942101951,
"eval_runtime": 11.5016,
"eval_samples_per_second": 739.547,
"eval_steps_per_second": 23.127,
"step": 30000
},
{
"epoch": 6.04,
"learning_rate": 1.9807958820035638e-05,
"loss": 1.837,
"step": 30500
},
{
"epoch": 6.14,
"learning_rate": 1.9313007325282124e-05,
"loss": 1.8311,
"step": 31000
},
{
"epoch": 6.14,
"eval_COMMENT": {
"f1": 0.7244426318651441,
"number": 6854,
"precision": 0.6781623822855688,
"recall": 0.7775021885030639
},
"eval_NAME": {
"f1": 0.818961625282167,
"number": 8845,
"precision": 0.8175774647887324,
"recall": 0.8203504804974562
},
"eval_QTY": {
"f1": 0.9856425982715361,
"number": 7152,
"precision": 0.9826292384658143,
"recall": 0.9886744966442953
},
"eval_RANGE_END": {
"f1": 0.7896995708154506,
"number": 105,
"precision": 0.71875,
"recall": 0.8761904761904762
},
"eval_UNIT": {
"f1": 0.9552008238928938,
"number": 5646,
"precision": 0.9265734265734266,
"recall": 0.9856535600425079
},
"eval_loss": 2.171062469482422,
"eval_overall_accuracy": 0.8314527771445939,
"eval_overall_f1": 0.8629676979459644,
"eval_overall_precision": 0.8419984698799189,
"eval_overall_recall": 0.8850080413957065,
"eval_runtime": 11.2938,
"eval_samples_per_second": 753.154,
"eval_steps_per_second": 23.553,
"step": 31000
},
{
"epoch": 6.24,
"learning_rate": 1.8818055830528607e-05,
"loss": 1.8426,
"step": 31500
},
{
"epoch": 6.34,
"learning_rate": 1.8323104335775097e-05,
"loss": 1.879,
"step": 32000
},
{
"epoch": 6.34,
"eval_COMMENT": {
"f1": 0.7243460764587525,
"number": 6854,
"precision": 0.6905675353882789,
"recall": 0.7615990662386928
},
"eval_NAME": {
"f1": 0.8148399502318742,
"number": 8845,
"precision": 0.8152087812606088,
"recall": 0.8144714527981911
},
"eval_QTY": {
"f1": 0.985952712100139,
"number": 7152,
"precision": 0.9807692307692307,
"recall": 0.9911912751677853
},
"eval_RANGE_END": {
"f1": 0.7796610169491526,
"number": 105,
"precision": 0.7022900763358778,
"recall": 0.8761904761904762
},
"eval_UNIT": {
"f1": 0.9541174456428694,
"number": 5646,
"precision": 0.9232935719019219,
"recall": 0.9870704923839887
},
"eval_loss": 2.1472506523132324,
"eval_overall_accuracy": 0.830635969911101,
"eval_overall_f1": 0.8623636394773346,
"eval_overall_precision": 0.8451545768856366,
"eval_overall_recall": 0.8802880917418362,
"eval_runtime": 12.4001,
"eval_samples_per_second": 685.964,
"eval_steps_per_second": 21.452,
"step": 32000
},
{
"epoch": 6.43,
"learning_rate": 1.782815284102158e-05,
"loss": 1.8605,
"step": 32500
},
{
"epoch": 6.53,
"learning_rate": 1.7333201346268066e-05,
"loss": 1.8279,
"step": 33000
},
{
"epoch": 6.53,
"eval_COMMENT": {
"f1": 0.7266004792879152,
"number": 6854,
"precision": 0.6845568313765966,
"recall": 0.7741464838050773
},
"eval_NAME": {
"f1": 0.8171618650279078,
"number": 8845,
"precision": 0.8150022492127755,
"recall": 0.8193329564725834
},
"eval_QTY": {
"f1": 0.9857839721254356,
"number": 7152,
"precision": 0.9826340650180606,
"recall": 0.9889541387024608
},
"eval_RANGE_END": {
"f1": 0.7860262008733625,
"number": 105,
"precision": 0.7258064516129032,
"recall": 0.8571428571428571
},
"eval_UNIT": {
"f1": 0.9554850330216998,
"number": 5646,
"precision": 0.9263262930317645,
"recall": 0.9865391427559334
},
"eval_loss": 2.1636247634887695,
"eval_overall_accuracy": 0.83139579059342,
"eval_overall_f1": 0.8632980539433255,
"eval_overall_precision": 0.8434852224964974,
"eval_overall_recall": 0.8840640514649325,
"eval_runtime": 11.6243,
"eval_samples_per_second": 731.745,
"eval_steps_per_second": 22.883,
"step": 33000
},
{
"epoch": 6.63,
"learning_rate": 1.6838249851514553e-05,
"loss": 1.8596,
"step": 33500
},
{
"epoch": 6.73,
"learning_rate": 1.634329835676104e-05,
"loss": 1.8613,
"step": 34000
},
{
"epoch": 6.73,
"eval_COMMENT": {
"f1": 0.7281226369698219,
"number": 6854,
"precision": 0.6884180423761861,
"recall": 0.7726874817624745
},
"eval_NAME": {
"f1": 0.8162550161080653,
"number": 8845,
"precision": 0.8161166365280289,
"recall": 0.8163934426229508
},
"eval_QTY": {
"f1": 0.9855233853006681,
"number": 7152,
"precision": 0.9811529933481153,
"recall": 0.9899328859060402
},
"eval_RANGE_END": {
"f1": 0.7777777777777778,
"number": 105,
"precision": 0.6666666666666666,
"recall": 0.9333333333333333
},
"eval_UNIT": {
"f1": 0.9550600343053174,
"number": 5646,
"precision": 0.9258397073495178,
"recall": 0.9861849096705633
},
"eval_loss": 2.119246482849121,
"eval_overall_accuracy": 0.8333523288503913,
"eval_overall_f1": 0.8633971291866029,
"eval_overall_precision": 0.8444080486663547,
"eval_overall_recall": 0.8832599118942731,
"eval_runtime": 9.0301,
"eval_samples_per_second": 941.963,
"eval_steps_per_second": 29.457,
"step": 34000
},
{
"epoch": 6.83,
"learning_rate": 1.5848346862007525e-05,
"loss": 1.8804,
"step": 34500
},
{
"epoch": 6.93,
"learning_rate": 1.535339536725401e-05,
"loss": 1.8604,
"step": 35000
},
{
"epoch": 6.93,
"eval_COMMENT": {
"f1": 0.7285265601529427,
"number": 6854,
"precision": 0.68467659137577,
"recall": 0.7783775897286256
},
"eval_NAME": {
"f1": 0.8183306055646481,
"number": 8845,
"precision": 0.8169934640522876,
"recall": 0.819672131147541
},
"eval_QTY": {
"f1": 0.9865589525732991,
"number": 7152,
"precision": 0.9827945053420286,
"recall": 0.9903523489932886
},
"eval_RANGE_END": {
"f1": 0.7818930041152263,
"number": 105,
"precision": 0.6884057971014492,
"recall": 0.9047619047619048
},
"eval_UNIT": {
"f1": 0.9555517418911963,
"number": 5646,
"precision": 0.9267643142476698,
"recall": 0.9861849096705633
},
"eval_loss": 2.1069583892822266,
"eval_overall_accuracy": 0.834340095737406,
"eval_overall_f1": 0.8642295423141878,
"eval_overall_precision": 0.8438322395815984,
"eval_overall_recall": 0.8856373680162226,
"eval_runtime": 11.4858,
"eval_samples_per_second": 740.57,
"eval_steps_per_second": 23.159,
"step": 35000
},
{
"epoch": 7.03,
"learning_rate": 1.4858443872500496e-05,
"loss": 1.7995,
"step": 35500
},
{
"epoch": 7.13,
"learning_rate": 1.4363492377746981e-05,
"loss": 1.8026,
"step": 36000
},
{
"epoch": 7.13,
"eval_COMMENT": {
"f1": 0.7254587315984092,
"number": 6854,
"precision": 0.695146409947854,
"recall": 0.7585351619492268
},
"eval_NAME": {
"f1": 0.8138180584610165,
"number": 8845,
"precision": 0.8139561185252205,
"recall": 0.81368004522329
},
"eval_QTY": {
"f1": 0.9861982434127978,
"number": 7152,
"precision": 0.9833194328607172,
"recall": 0.9890939597315436
},
"eval_RANGE_END": {
"f1": 0.7692307692307693,
"number": 105,
"precision": 0.6976744186046512,
"recall": 0.8571428571428571
},
"eval_UNIT": {
"f1": 0.9548265200961868,
"number": 5646,
"precision": 0.926808936312104,
"recall": 0.9845908607863975
},
"eval_loss": 2.1282002925872803,
"eval_overall_accuracy": 0.8295152344046804,
"eval_overall_f1": 0.8625437813336996,
"eval_overall_precision": 0.8474124552999123,
"eval_overall_recall": 0.8782252989301448,
"eval_runtime": 9.0618,
"eval_samples_per_second": 938.668,
"eval_steps_per_second": 29.354,
"step": 36000
},
{
"epoch": 7.23,
"learning_rate": 1.3868540882993467e-05,
"loss": 1.7692,
"step": 36500
},
{
"epoch": 7.33,
"learning_rate": 1.3373589388239954e-05,
"loss": 1.774,
"step": 37000
},
{
"epoch": 7.33,
"eval_COMMENT": {
"f1": 0.7252502780867629,
"number": 6854,
"precision": 0.6926958831341301,
"recall": 0.7610154654216515
},
"eval_NAME": {
"f1": 0.8135153429602889,
"number": 8845,
"precision": 0.8117753011370032,
"recall": 0.8152628603730921
},
"eval_QTY": {
"f1": 0.9858644941160087,
"number": 7152,
"precision": 0.9819669857123041,
"recall": 0.9897930648769575
},
"eval_RANGE_END": {
"f1": 0.7948717948717948,
"number": 105,
"precision": 0.7209302325581395,
"recall": 0.8857142857142857
},
"eval_UNIT": {
"f1": 0.953885787891799,
"number": 5646,
"precision": 0.9258209701616936,
"recall": 0.983705278072972
},
"eval_loss": 2.1374754905700684,
"eval_overall_accuracy": 0.829952131297014,
"eval_overall_f1": 0.8621126953660542,
"eval_overall_precision": 0.8454789915966386,
"eval_overall_recall": 0.8794140269911195,
"eval_runtime": 13.9271,
"eval_samples_per_second": 610.751,
"eval_steps_per_second": 19.099,
"step": 37000
},
{
"epoch": 7.42,
"learning_rate": 1.287863789348644e-05,
"loss": 1.7909,
"step": 37500
},
{
"epoch": 7.52,
"learning_rate": 1.2383686398732925e-05,
"loss": 1.8132,
"step": 38000
},
{
"epoch": 7.52,
"eval_COMMENT": {
"f1": 0.7251632624704737,
"number": 6854,
"precision": 0.6921750663129973,
"recall": 0.7614531660344325
},
"eval_NAME": {
"f1": 0.8144125798970531,
"number": 8845,
"precision": 0.8149196287072674,
"recall": 0.8139061616732617
},
"eval_QTY": {
"f1": 0.9862059356276995,
"number": 7152,
"precision": 0.9827825603998889,
"recall": 0.9896532438478747
},
"eval_RANGE_END": {
"f1": 0.7966804979253113,
"number": 105,
"precision": 0.7058823529411765,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9550012856775519,
"number": 5646,
"precision": 0.9252615844544095,
"recall": 0.9867162592986185
},
"eval_loss": 2.1093838214874268,
"eval_overall_accuracy": 0.8298571537117241,
"eval_overall_f1": 0.8627067798062913,
"eval_overall_precision": 0.8462987253220328,
"eval_overall_recall": 0.8797636528914062,
"eval_runtime": 10.2321,
"eval_samples_per_second": 831.306,
"eval_steps_per_second": 25.997,
"step": 38000
},
{
"epoch": 7.62,
"learning_rate": 1.1888734903979411e-05,
"loss": 1.7708,
"step": 38500
},
{
"epoch": 7.72,
"learning_rate": 1.1393783409225896e-05,
"loss": 1.805,
"step": 39000
},
{
"epoch": 7.72,
"eval_COMMENT": {
"f1": 0.7264215888751205,
"number": 6854,
"precision": 0.6876955161626694,
"recall": 0.7697694776772688
},
"eval_NAME": {
"f1": 0.815460358779922,
"number": 8845,
"precision": 0.8163380920009065,
"recall": 0.814584511023177
},
"eval_QTY": {
"f1": 0.9862822923194763,
"number": 7152,
"precision": 0.9823831321958663,
"recall": 0.9902125279642058
},
"eval_RANGE_END": {
"f1": 0.7844827586206896,
"number": 105,
"precision": 0.7165354330708661,
"recall": 0.8666666666666667
},
"eval_UNIT": {
"f1": 0.9549858526965618,
"number": 5646,
"precision": 0.9255442911750041,
"recall": 0.9863620262132483
},
"eval_loss": 2.1103549003601074,
"eval_overall_accuracy": 0.8331053871286377,
"eval_overall_f1": 0.8630181513352608,
"eval_overall_precision": 0.8449633178117986,
"eval_overall_recall": 0.8818614082931263,
"eval_runtime": 10.8182,
"eval_samples_per_second": 786.27,
"eval_steps_per_second": 24.588,
"step": 39000
},
{
"epoch": 7.82,
"learning_rate": 1.0898831914472382e-05,
"loss": 1.8185,
"step": 39500
},
{
"epoch": 7.92,
"learning_rate": 1.0403880419718868e-05,
"loss": 1.7337,
"step": 40000
},
{
"epoch": 7.92,
"eval_COMMENT": {
"f1": 0.7251437677544517,
"number": 6854,
"precision": 0.6904604829133131,
"recall": 0.7634957688940764
},
"eval_NAME": {
"f1": 0.8154846001695395,
"number": 8845,
"precision": 0.8152542372881356,
"recall": 0.8157150932730356
},
"eval_QTY": {
"f1": 0.9866220735785953,
"number": 7152,
"precision": 0.9833333333333333,
"recall": 0.9899328859060402
},
"eval_RANGE_END": {
"f1": 0.8,
"number": 105,
"precision": 0.7,
"recall": 0.9333333333333333
},
"eval_UNIT": {
"f1": 0.9544557852302942,
"number": 5646,
"precision": 0.9253284550141361,
"recall": 0.9854764434998229
},
"eval_loss": 2.1034367084503174,
"eval_overall_accuracy": 0.830616974394043,
"eval_overall_f1": 0.8629076459303919,
"eval_overall_precision": 0.8458129071251091,
"eval_overall_recall": 0.8807076428221803,
"eval_runtime": 10.7303,
"eval_samples_per_second": 792.708,
"eval_steps_per_second": 24.79,
"step": 40000
},
{
"epoch": 8.02,
"learning_rate": 9.908928924965353e-06,
"loss": 1.7519,
"step": 40500
},
{
"epoch": 8.12,
"learning_rate": 9.41397743021184e-06,
"loss": 1.7771,
"step": 41000
},
{
"epoch": 8.12,
"eval_COMMENT": {
"f1": 0.7258660347110893,
"number": 6854,
"precision": 0.6949152542372882,
"recall": 0.759702363583309
},
"eval_NAME": {
"f1": 0.8134750169568167,
"number": 8845,
"precision": 0.8133830677065672,
"recall": 0.8135669869983041
},
"eval_QTY": {
"f1": 0.9863395595204906,
"number": 7152,
"precision": 0.9833240689271817,
"recall": 0.9893736017897091
},
"eval_RANGE_END": {
"f1": 0.7931034482758621,
"number": 105,
"precision": 0.7244094488188977,
"recall": 0.8761904761904762
},
"eval_UNIT": {
"f1": 0.9552213149978513,
"number": 5646,
"precision": 0.9278677575555184,
"recall": 0.9842366277010273
},
"eval_loss": 2.107405424118042,
"eval_overall_accuracy": 0.8285654585517818,
"eval_overall_f1": 0.8627047069729117,
"eval_overall_precision": 0.8474301902063942,
"eval_overall_recall": 0.8785399622404028,
"eval_runtime": 11.3451,
"eval_samples_per_second": 749.75,
"eval_steps_per_second": 23.446,
"step": 41000
},
{
"epoch": 8.22,
"learning_rate": 8.919025935458326e-06,
"loss": 1.7381,
"step": 41500
},
{
"epoch": 8.32,
"learning_rate": 8.424074440704812e-06,
"loss": 1.7179,
"step": 42000
},
{
"epoch": 8.32,
"eval_COMMENT": {
"f1": 0.7297001232370259,
"number": 6854,
"precision": 0.6874355005159959,
"recall": 0.7775021885030639
},
"eval_NAME": {
"f1": 0.8157106527267589,
"number": 8845,
"precision": 0.8154802259887005,
"recall": 0.8159412097230073
},
"eval_QTY": {
"f1": 0.9864158829676071,
"number": 7152,
"precision": 0.982923781757601,
"recall": 0.9899328859060402
},
"eval_RANGE_END": {
"f1": 0.8016194331983806,
"number": 105,
"precision": 0.6971830985915493,
"recall": 0.9428571428571428
},
"eval_UNIT": {
"f1": 0.954233801851217,
"number": 5646,
"precision": 0.9244437064098306,
"recall": 0.9860077931278781
},
"eval_loss": 2.1069343090057373,
"eval_overall_accuracy": 0.8319276650710432,
"eval_overall_f1": 0.86363558757747,
"eval_overall_precision": 0.8439387366945844,
"eval_overall_recall": 0.8842738270051045,
"eval_runtime": 11.303,
"eval_samples_per_second": 752.544,
"eval_steps_per_second": 23.534,
"step": 42000
},
{
"epoch": 8.41,
"learning_rate": 7.929122945951298e-06,
"loss": 1.7763,
"step": 42500
},
{
"epoch": 8.51,
"learning_rate": 7.434171451197783e-06,
"loss": 1.7005,
"step": 43000
},
{
"epoch": 8.51,
"eval_COMMENT": {
"f1": 0.7259434619133825,
"number": 6854,
"precision": 0.694326052210975,
"recall": 0.7605777648088707
},
"eval_NAME": {
"f1": 0.8142243328810492,
"number": 8845,
"precision": 0.8143164084586678,
"recall": 0.8141322781232334
},
"eval_QTY": {
"f1": 0.9863471719141822,
"number": 7152,
"precision": 0.9827873403664631,
"recall": 0.9899328859060402
},
"eval_RANGE_END": {
"f1": 0.7894736842105263,
"number": 105,
"precision": 0.7317073170731707,
"recall": 0.8571428571428571
},
"eval_UNIT": {
"f1": 0.9534087016101404,
"number": 5646,
"precision": 0.9230514096185738,
"recall": 0.9858306765851931
},
"eval_loss": 2.1151254177093506,
"eval_overall_accuracy": 0.8293252792341007,
"eval_overall_f1": 0.8626307665923513,
"eval_overall_precision": 0.8465733135855662,
"eval_overall_recall": 0.8793091392210335,
"eval_runtime": 10.9284,
"eval_samples_per_second": 778.339,
"eval_steps_per_second": 24.34,
"step": 43000
},
{
"epoch": 8.61,
"learning_rate": 6.939219956444269e-06,
"loss": 1.7224,
"step": 43500
},
{
"epoch": 8.71,
"learning_rate": 6.444268461690754e-06,
"loss": 1.7078,
"step": 44000
},
{
"epoch": 8.71,
"eval_COMMENT": {
"f1": 0.7251940133037693,
"number": 6854,
"precision": 0.6905515967273687,
"recall": 0.7634957688940764
},
"eval_NAME": {
"f1": 0.8152167768922051,
"number": 8845,
"precision": 0.8151706986208456,
"recall": 0.8152628603730921
},
"eval_QTY": {
"f1": 0.9865495853369572,
"number": 7152,
"precision": 0.9834653327775462,
"recall": 0.9896532438478747
},
"eval_RANGE_END": {
"f1": 0.7899159663865547,
"number": 105,
"precision": 0.706766917293233,
"recall": 0.8952380952380953
},
"eval_UNIT": {
"f1": 0.9550831476084348,
"number": 5646,
"precision": 0.9254152823920265,
"recall": 0.9867162592986185
},
"eval_loss": 2.1110451221466064,
"eval_overall_accuracy": 0.8313008130081301,
"eval_overall_f1": 0.8629231190900369,
"eval_overall_precision": 0.8459394102236851,
"eval_overall_recall": 0.8806027550520943,
"eval_runtime": 11.2874,
"eval_samples_per_second": 753.583,
"eval_steps_per_second": 23.566,
"step": 44000
},
{
"epoch": 8.81,
"learning_rate": 5.949316966937241e-06,
"loss": 1.768,
"step": 44500
},
{
"epoch": 8.91,
"learning_rate": 5.4543654721837265e-06,
"loss": 1.7494,
"step": 45000
},
{
"epoch": 8.91,
"eval_COMMENT": {
"f1": 0.7275605726872247,
"number": 6854,
"precision": 0.6886890800104248,
"recall": 0.7710825795156113
},
"eval_NAME": {
"f1": 0.8160244095378009,
"number": 8845,
"precision": 0.8156557099288377,
"recall": 0.8163934426229508
},
"eval_QTY": {
"f1": 0.9865552072448623,
"number": 7152,
"precision": 0.9830626128002221,
"recall": 0.9900727069351231
},
"eval_RANGE_END": {
"f1": 0.7899159663865547,
"number": 105,
"precision": 0.706766917293233,
"recall": 0.8952380952380953
},
"eval_UNIT": {
"f1": 0.9546817441960078,
"number": 5646,
"precision": 0.924506387921022,
"recall": 0.9868933758413035
},
"eval_loss": 2.1094605922698975,
"eval_overall_accuracy": 0.8318896740369273,
"eval_overall_f1": 0.8634685085139848,
"eval_overall_precision": 0.8448645031783205,
"eval_overall_recall": 0.8829102859939865,
"eval_runtime": 10.8603,
"eval_samples_per_second": 783.222,
"eval_steps_per_second": 24.493,
"step": 45000
},
{
"epoch": 9.01,
"learning_rate": 4.959413977430212e-06,
"loss": 1.7068,
"step": 45500
},
{
"epoch": 9.11,
"learning_rate": 4.4644624826766974e-06,
"loss": 1.6805,
"step": 46000
},
{
"epoch": 9.11,
"eval_COMMENT": {
"f1": 0.727134881797505,
"number": 6854,
"precision": 0.6890920966688439,
"recall": 0.7696235774730085
},
"eval_NAME": {
"f1": 0.8148566905986773,
"number": 8845,
"precision": 0.8149027589326097,
"recall": 0.8148106274731487
},
"eval_QTY": {
"f1": 0.9866963850386571,
"number": 7152,
"precision": 0.9830673143650243,
"recall": 0.9903523489932886
},
"eval_RANGE_END": {
"f1": 0.7950819672131149,
"number": 105,
"precision": 0.697841726618705,
"recall": 0.9238095238095239
},
"eval_UNIT": {
"f1": 0.9543739279588336,
"number": 5646,
"precision": 0.9251745926172265,
"recall": 0.9854764434998229
},
"eval_loss": 2.113201856613159,
"eval_overall_accuracy": 0.8326874857533622,
"eval_overall_f1": 0.8630322106091448,
"eval_overall_precision": 0.8448939947081087,
"eval_overall_recall": 0.8819662960632124,
"eval_runtime": 9.5944,
"eval_samples_per_second": 886.557,
"eval_steps_per_second": 27.724,
"step": 46000
},
{
"epoch": 9.21,
"learning_rate": 3.969510987923184e-06,
"loss": 1.7258,
"step": 46500
},
{
"epoch": 9.31,
"learning_rate": 3.4745594931696697e-06,
"loss": 1.6867,
"step": 47000
},
{
"epoch": 9.31,
"eval_COMMENT": {
"f1": 0.7311783679912154,
"number": 6854,
"precision": 0.6902941557600104,
"recall": 0.7772103880945433
},
"eval_NAME": {
"f1": 0.8176065092100803,
"number": 8845,
"precision": 0.8172370947701344,
"recall": 0.817976257772753
},
"eval_QTY": {
"f1": 0.9865533337978123,
"number": 7152,
"precision": 0.9831967782252465,
"recall": 0.9899328859060402
},
"eval_RANGE_END": {
"f1": 0.7932489451476793,
"number": 105,
"precision": 0.7121212121212122,
"recall": 0.8952380952380953
},
"eval_UNIT": {
"f1": 0.9545610425240054,
"number": 5646,
"precision": 0.925058158856763,
"recall": 0.9860077931278781
},
"eval_loss": 2.1125941276550293,
"eval_overall_accuracy": 0.8326115036851303,
"eval_overall_f1": 0.8647198537327205,
"eval_overall_precision": 0.8456602386283881,
"eval_overall_recall": 0.8846584154954199,
"eval_runtime": 11.2863,
"eval_samples_per_second": 753.659,
"eval_steps_per_second": 23.568,
"step": 47000
},
{
"epoch": 9.4,
"learning_rate": 2.979607998416155e-06,
"loss": 1.6794,
"step": 47500
},
{
"epoch": 9.5,
"learning_rate": 2.484656503662641e-06,
"loss": 1.7212,
"step": 48000
},
{
"epoch": 9.5,
"eval_COMMENT": {
"f1": 0.7277605779153767,
"number": 6854,
"precision": 0.6885822158573103,
"recall": 0.7716661803326524
},
"eval_NAME": {
"f1": 0.8148064424978807,
"number": 8845,
"precision": 0.8145762711864407,
"recall": 0.8150367439231204
},
"eval_QTY": {
"f1": 0.9864120967179988,
"number": 7152,
"precision": 0.98319211001528,
"recall": 0.9896532438478747
},
"eval_RANGE_END": {
"f1": 0.7901234567901234,
"number": 105,
"precision": 0.6956521739130435,
"recall": 0.9142857142857143
},
"eval_UNIT": {
"f1": 0.9545104086353122,
"number": 5646,
"precision": 0.9243404678944749,
"recall": 0.9867162592986185
},
"eval_loss": 2.105802297592163,
"eval_overall_accuracy": 0.8318706785198693,
"eval_overall_f1": 0.86305280612681,
"eval_overall_precision": 0.8443886937614986,
"eval_overall_recall": 0.8825606600936997,
"eval_runtime": 10.3961,
"eval_samples_per_second": 818.189,
"eval_steps_per_second": 25.586,
"step": 48000
},
{
"epoch": 9.6,
"learning_rate": 1.989705008909127e-06,
"loss": 1.6992,
"step": 48500
},
{
"epoch": 9.7,
"learning_rate": 1.4947535141556129e-06,
"loss": 1.6952,
"step": 49000
},
{
"epoch": 9.7,
"eval_COMMENT": {
"f1": 0.7261049723756906,
"number": 6854,
"precision": 0.6893522161028062,
"recall": 0.7669973737963233
},
"eval_NAME": {
"f1": 0.81525854761232,
"number": 8845,
"precision": 0.8150282485875706,
"recall": 0.8154889768230639
},
"eval_QTY": {
"f1": 0.9866276640200585,
"number": 7152,
"precision": 0.9829308909242298,
"recall": 0.9903523489932886
},
"eval_RANGE_END": {
"f1": 0.7916666666666667,
"number": 105,
"precision": 0.7037037037037037,
"recall": 0.9047619047619048
},
"eval_UNIT": {
"f1": 0.9544792113159023,
"number": 5646,
"precision": 0.9249044691809271,
"recall": 0.9860077931278781
},
"eval_loss": 2.1103529930114746,
"eval_overall_accuracy": 0.8311488488716663,
"eval_overall_f1": 0.8629658783668163,
"eval_overall_precision": 0.8451199892747017,
"eval_overall_recall": 0.881581707572897,
"eval_runtime": 11.1488,
"eval_samples_per_second": 762.95,
"eval_steps_per_second": 23.859,
"step": 49000
},
{
"epoch": 9.8,
"learning_rate": 9.998020194020988e-07,
"loss": 1.7282,
"step": 49500
},
{
"epoch": 9.9,
"learning_rate": 5.048505246485845e-07,
"loss": 1.7128,
"step": 50000
},
{
"epoch": 9.9,
"eval_COMMENT": {
"f1": 0.7280375120673009,
"number": 6854,
"precision": 0.6902458158995816,
"recall": 0.7702071782900496
},
"eval_NAME": {
"f1": 0.8154846001695395,
"number": 8845,
"precision": 0.8152542372881356,
"recall": 0.8157150932730356
},
"eval_QTY": {
"f1": 0.9866276640200585,
"number": 7152,
"precision": 0.9829308909242298,
"recall": 0.9903523489932886
},
"eval_RANGE_END": {
"f1": 0.7851239669421487,
"number": 105,
"precision": 0.6934306569343066,
"recall": 0.9047619047619048
},
"eval_UNIT": {
"f1": 0.9546351084812623,
"number": 5646,
"precision": 0.9253532834580216,
"recall": 0.9858306765851931
},
"eval_loss": 2.104012966156006,
"eval_overall_accuracy": 0.8311298533546083,
"eval_overall_f1": 0.8634575250607274,
"eval_overall_precision": 0.8453242229367631,
"eval_overall_recall": 0.8823858471435564,
"eval_runtime": 10.6017,
"eval_samples_per_second": 802.322,
"eval_steps_per_second": 25.09,
"step": 50000
},
{
"epoch": 10.0,
"learning_rate": 9.899029895070283e-09,
"loss": 1.7318,
"step": 50500
},
{
"epoch": 10.0,
"step": 50510,
"total_flos": 1554473524185192.0,
"train_loss": 2.2027091482279917,
"train_runtime": 3516.1179,
"train_samples_per_second": 459.606,
"train_steps_per_second": 14.365
}
],
"logging_steps": 500,
"max_steps": 50510,
"num_train_epochs": 10,
"save_steps": 1000,
"total_flos": 1554473524185192.0,
"trial_name": null,
"trial_params": null
}