napsternxg's picture
End of training
05ed773
{
"best_metric": 0.474032998085022,
"best_model_checkpoint": "nyt_ingredients-tagger-gte-small-L3-ingredient-v2/checkpoint-24000",
"epoch": 10.0,
"eval_steps": 1000,
"global_step": 50510,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.1,
"learning_rate": 4.9505048505246485e-05,
"loss": 1.1293,
"step": 500
},
{
"epoch": 0.2,
"learning_rate": 4.9010097010492975e-05,
"loss": 0.6931,
"step": 1000
},
{
"epoch": 0.2,
"eval_COMMENT": {
"f1": 0.5770606987183658,
"number": 6901,
"precision": 0.5236127508854782,
"recall": 0.6426604839878278
},
"eval_NAME": {
"f1": 0.7875208913649026,
"number": 8857,
"precision": 0.7773012207192346,
"recall": 0.7980128711753416
},
"eval_QTY": {
"f1": 0.9780634343998882,
"number": 7189,
"precision": 0.9824561403508771,
"recall": 0.9737098344693281
},
"eval_RANGE_END": {
"f1": 0.0,
"number": 92,
"precision": 0.0,
"recall": 0.0
},
"eval_UNIT": {
"f1": 0.9434346865975879,
"number": 5732,
"precision": 0.9192320423700762,
"recall": 0.9689462665736218
},
"eval_loss": 0.6230219006538391,
"eval_overall_accuracy": 0.7985813450669499,
"eval_overall_f1": 0.8086250651249558,
"eval_overall_precision": 0.7828506345590628,
"eval_overall_recall": 0.8361544610892913,
"eval_runtime": 7.9128,
"eval_samples_per_second": 1074.967,
"eval_steps_per_second": 33.616,
"step": 1000
},
{
"epoch": 0.3,
"learning_rate": 4.851514551573946e-05,
"loss": 0.6087,
"step": 1500
},
{
"epoch": 0.4,
"learning_rate": 4.802019402098595e-05,
"loss": 0.5826,
"step": 2000
},
{
"epoch": 0.4,
"eval_COMMENT": {
"f1": 0.602454780361757,
"number": 6901,
"precision": 0.5435365427205968,
"recall": 0.6756991740327489
},
"eval_NAME": {
"f1": 0.7907440212577502,
"number": 8857,
"precision": 0.7757141305528402,
"recall": 0.8063678446426555
},
"eval_QTY": {
"f1": 0.9754149163280765,
"number": 7189,
"precision": 0.9659028914348063,
"recall": 0.9851161496731117
},
"eval_RANGE_END": {
"f1": 0.6567164179104478,
"number": 92,
"precision": 0.6055045871559633,
"recall": 0.717391304347826
},
"eval_UNIT": {
"f1": 0.9462474645030426,
"number": 5732,
"precision": 0.9177049180327869,
"recall": 0.9766224703419399
},
"eval_loss": 0.5530511736869812,
"eval_overall_accuracy": 0.8078557068618898,
"eval_overall_f1": 0.8170321807714068,
"eval_overall_precision": 0.7837009608325087,
"eval_overall_recall": 0.8533245281707275,
"eval_runtime": 6.3157,
"eval_samples_per_second": 1346.806,
"eval_steps_per_second": 42.117,
"step": 2000
},
{
"epoch": 0.49,
"learning_rate": 4.752524252623243e-05,
"loss": 0.5569,
"step": 2500
},
{
"epoch": 0.59,
"learning_rate": 4.703029103147892e-05,
"loss": 0.5435,
"step": 3000
},
{
"epoch": 0.59,
"eval_COMMENT": {
"f1": 0.6313494946826079,
"number": 6901,
"precision": 0.5801165331391115,
"recall": 0.6925083321257789
},
"eval_NAME": {
"f1": 0.7944305207463102,
"number": 8857,
"precision": 0.7839085513299626,
"recall": 0.8052387941740996
},
"eval_QTY": {
"f1": 0.9791782343142699,
"number": 7189,
"precision": 0.9771436487048067,
"recall": 0.9812213103352344
},
"eval_RANGE_END": {
"f1": 0.7109004739336493,
"number": 92,
"precision": 0.6302521008403361,
"recall": 0.8152173913043478
},
"eval_UNIT": {
"f1": 0.9472093999160722,
"number": 5732,
"precision": 0.9126637554585153,
"recall": 0.9844731332868109
},
"eval_loss": 0.5327398180961609,
"eval_overall_accuracy": 0.8150438114023442,
"eval_overall_f1": 0.827899644462333,
"eval_overall_precision": 0.7999157403506497,
"eval_overall_recall": 0.8579124813179938,
"eval_runtime": 8.1233,
"eval_samples_per_second": 1047.112,
"eval_steps_per_second": 32.745,
"step": 3000
},
{
"epoch": 0.69,
"learning_rate": 4.65353395367254e-05,
"loss": 0.5324,
"step": 3500
},
{
"epoch": 0.79,
"learning_rate": 4.6040388041971886e-05,
"loss": 0.5333,
"step": 4000
},
{
"epoch": 0.79,
"eval_COMMENT": {
"f1": 0.6446886446886447,
"number": 6901,
"precision": 0.5875760104924288,
"recall": 0.7140994058832053
},
"eval_NAME": {
"f1": 0.7953999888349244,
"number": 8857,
"precision": 0.786660777385159,
"recall": 0.8043355537992548
},
"eval_QTY": {
"f1": 0.9809583594894328,
"number": 7189,
"precision": 0.9837716843872412,
"recall": 0.9781610794269022
},
"eval_RANGE_END": {
"f1": 0.7555555555555556,
"number": 92,
"precision": 0.6390977443609023,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9506497918967128,
"number": 5732,
"precision": 0.9263366992219831,
"recall": 0.9762735519888346
},
"eval_loss": 0.5212323665618896,
"eval_overall_accuracy": 0.8183059591093578,
"eval_overall_f1": 0.831933619994625,
"eval_overall_precision": 0.8049731838127743,
"eval_overall_recall": 0.8607625734246289,
"eval_runtime": 8.6379,
"eval_samples_per_second": 984.732,
"eval_steps_per_second": 30.795,
"step": 4000
},
{
"epoch": 0.89,
"learning_rate": 4.5545436547218376e-05,
"loss": 0.5285,
"step": 4500
},
{
"epoch": 0.99,
"learning_rate": 4.505048505246486e-05,
"loss": 0.5199,
"step": 5000
},
{
"epoch": 0.99,
"eval_COMMENT": {
"f1": 0.6402057097646205,
"number": 6901,
"precision": 0.5873457536898137,
"recall": 0.7035212288074192
},
"eval_NAME": {
"f1": 0.8005563282336579,
"number": 8857,
"precision": 0.7890984865101996,
"recall": 0.812351812126002
},
"eval_QTY": {
"f1": 0.9803540437348144,
"number": 7189,
"precision": 0.978519955654102,
"recall": 0.9821950201697037
},
"eval_RANGE_END": {
"f1": 0.7747747747747747,
"number": 92,
"precision": 0.6615384615384615,
"recall": 0.9347826086956522
},
"eval_UNIT": {
"f1": 0.9499704716105627,
"number": 5732,
"precision": 0.9197843489625878,
"recall": 0.9822051639916259
},
"eval_loss": 0.5120549201965332,
"eval_overall_accuracy": 0.8185525167848879,
"eval_overall_f1": 0.8328133910301567,
"eval_overall_precision": 0.804738906356358,
"eval_overall_recall": 0.8629175211150116,
"eval_runtime": 6.4358,
"eval_samples_per_second": 1321.664,
"eval_steps_per_second": 41.331,
"step": 5000
},
{
"epoch": 1.09,
"learning_rate": 4.455553355771135e-05,
"loss": 0.5127,
"step": 5500
},
{
"epoch": 1.19,
"learning_rate": 4.406058206295783e-05,
"loss": 0.4983,
"step": 6000
},
{
"epoch": 1.19,
"eval_COMMENT": {
"f1": 0.6476600322754169,
"number": 6901,
"precision": 0.6041901894367081,
"recall": 0.6978698739313143
},
"eval_NAME": {
"f1": 0.7935644937586686,
"number": 8857,
"precision": 0.7801047120418848,
"recall": 0.8074968951112115
},
"eval_QTY": {
"f1": 0.9824293353705119,
"number": 7189,
"precision": 0.980998613037448,
"recall": 0.983864237028794
},
"eval_RANGE_END": {
"f1": 0.7601809954751132,
"number": 92,
"precision": 0.6511627906976745,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9500843170320405,
"number": 5732,
"precision": 0.9193864229765013,
"recall": 0.9829030006978368
},
"eval_loss": 0.5088106393814087,
"eval_overall_accuracy": 0.8192163259113151,
"eval_overall_f1": 0.8339592771611903,
"eval_overall_precision": 0.8089590276416389,
"eval_overall_recall": 0.8605540300997532,
"eval_runtime": 8.5928,
"eval_samples_per_second": 989.902,
"eval_steps_per_second": 30.956,
"step": 6000
},
{
"epoch": 1.29,
"learning_rate": 4.356563056820432e-05,
"loss": 0.5102,
"step": 6500
},
{
"epoch": 1.39,
"learning_rate": 4.3070679073450804e-05,
"loss": 0.5031,
"step": 7000
},
{
"epoch": 1.39,
"eval_COMMENT": {
"f1": 0.6483065113460373,
"number": 6901,
"precision": 0.6055345911949686,
"recall": 0.6975800608607449
},
"eval_NAME": {
"f1": 0.797360248447205,
"number": 8857,
"precision": 0.7835422343324251,
"recall": 0.8116743818448685
},
"eval_QTY": {
"f1": 0.9815493055075669,
"number": 7189,
"precision": 0.9752815160670145,
"recall": 0.9878981777715955
},
"eval_RANGE_END": {
"f1": 0.7706422018348623,
"number": 92,
"precision": 0.6666666666666666,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9498936622713738,
"number": 5732,
"precision": 0.9269467043001827,
"recall": 0.9740055826936497
},
"eval_loss": 0.5030972361564636,
"eval_overall_accuracy": 0.8199370329628646,
"eval_overall_f1": 0.8351003758828189,
"eval_overall_precision": 0.8107082078806126,
"eval_overall_recall": 0.8610058739703174,
"eval_runtime": 7.9063,
"eval_samples_per_second": 1075.848,
"eval_steps_per_second": 33.644,
"step": 7000
},
{
"epoch": 1.48,
"learning_rate": 4.257572757869729e-05,
"loss": 0.5027,
"step": 7500
},
{
"epoch": 1.58,
"learning_rate": 4.208077608394378e-05,
"loss": 0.492,
"step": 8000
},
{
"epoch": 1.58,
"eval_COMMENT": {
"f1": 0.6769068494956819,
"number": 6901,
"precision": 0.6209482341557814,
"recall": 0.743950152151862
},
"eval_NAME": {
"f1": 0.7926012072880323,
"number": 8857,
"precision": 0.7778260869565218,
"recall": 0.8079485152986339
},
"eval_QTY": {
"f1": 0.9821801475706529,
"number": 7189,
"precision": 0.983001254005852,
"recall": 0.9813604117401585
},
"eval_RANGE_END": {
"f1": 0.7685589519650656,
"number": 92,
"precision": 0.6423357664233577,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9496828752642706,
"number": 5732,
"precision": 0.9215493188905302,
"recall": 0.9795882763433357
},
"eval_loss": 0.5041355490684509,
"eval_overall_accuracy": 0.8246216287979365,
"eval_overall_f1": 0.8398886765248299,
"eval_overall_precision": 0.8112712550607287,
"eval_overall_recall": 0.8705988669146015,
"eval_runtime": 9.0062,
"eval_samples_per_second": 944.457,
"eval_steps_per_second": 29.535,
"step": 8000
},
{
"epoch": 1.68,
"learning_rate": 4.158582458919026e-05,
"loss": 0.4939,
"step": 8500
},
{
"epoch": 1.78,
"learning_rate": 4.109087309443675e-05,
"loss": 0.4817,
"step": 9000
},
{
"epoch": 1.78,
"eval_COMMENT": {
"f1": 0.6750676255195619,
"number": 6901,
"precision": 0.6196705426356589,
"recall": 0.7413418345167367
},
"eval_NAME": {
"f1": 0.8006897702620014,
"number": 8857,
"precision": 0.7891447368421053,
"recall": 0.8125776222197132
},
"eval_QTY": {
"f1": 0.9833679833679833,
"number": 7189,
"precision": 0.9798370390829996,
"recall": 0.9869244679371262
},
"eval_RANGE_END": {
"f1": 0.7792207792207793,
"number": 92,
"precision": 0.6474820143884892,
"recall": 0.9782608695652174
},
"eval_UNIT": {
"f1": 0.9505083606419629,
"number": 5732,
"precision": 0.9168422758956071,
"recall": 0.9867411025819958
},
"eval_loss": 0.4901449382305145,
"eval_overall_accuracy": 0.8292872586579676,
"eval_overall_f1": 0.8427365317609219,
"eval_overall_precision": 0.8133872271624899,
"eval_overall_recall": 0.8742831323207396,
"eval_runtime": 9.1291,
"eval_samples_per_second": 931.746,
"eval_steps_per_second": 29.138,
"step": 9000
},
{
"epoch": 1.88,
"learning_rate": 4.059592159968323e-05,
"loss": 0.4903,
"step": 9500
},
{
"epoch": 1.98,
"learning_rate": 4.010097010492972e-05,
"loss": 0.4905,
"step": 10000
},
{
"epoch": 1.98,
"eval_COMMENT": {
"f1": 0.6778359049069598,
"number": 6901,
"precision": 0.6241463414634146,
"recall": 0.7416316475873062
},
"eval_NAME": {
"f1": 0.8002232142857143,
"number": 8857,
"precision": 0.7911287653095002,
"recall": 0.8095291859546122
},
"eval_QTY": {
"f1": 0.9842749791260784,
"number": 7189,
"precision": 0.9846860643185299,
"recall": 0.983864237028794
},
"eval_RANGE_END": {
"f1": 0.789237668161435,
"number": 92,
"precision": 0.6717557251908397,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9502270052127123,
"number": 5732,
"precision": 0.9170723790976956,
"recall": 0.9858688066992324
},
"eval_loss": 0.4891791045665741,
"eval_overall_accuracy": 0.8287751773318667,
"eval_overall_f1": 0.8435557049235421,
"eval_overall_precision": 0.8165522625980025,
"eval_overall_recall": 0.8724062423968579,
"eval_runtime": 6.9634,
"eval_samples_per_second": 1221.536,
"eval_steps_per_second": 38.2,
"step": 10000
},
{
"epoch": 2.08,
"learning_rate": 3.9606018610176205e-05,
"loss": 0.4804,
"step": 10500
},
{
"epoch": 2.18,
"learning_rate": 3.911106711542269e-05,
"loss": 0.4757,
"step": 11000
},
{
"epoch": 2.18,
"eval_COMMENT": {
"f1": 0.6788539520042544,
"number": 6901,
"precision": 0.6271186440677966,
"recall": 0.7398927691638892
},
"eval_NAME": {
"f1": 0.802429240026744,
"number": 8857,
"precision": 0.7921020789792103,
"recall": 0.8130292424071356
},
"eval_QTY": {
"f1": 0.9835042971998891,
"number": 7189,
"precision": 0.9801077496891836,
"recall": 0.9869244679371262
},
"eval_RANGE_END": {
"f1": 0.7758620689655172,
"number": 92,
"precision": 0.6428571428571429,
"recall": 0.9782608695652174
},
"eval_UNIT": {
"f1": 0.9515842839036756,
"number": 5732,
"precision": 0.9226609864001311,
"recall": 0.9823796231681786
},
"eval_loss": 0.4953509271144867,
"eval_overall_accuracy": 0.8274285931039714,
"eval_overall_f1": 0.844669333960932,
"eval_overall_precision": 0.8179391176949373,
"eval_overall_recall": 0.8732056584755483,
"eval_runtime": 8.0512,
"eval_samples_per_second": 1056.487,
"eval_steps_per_second": 33.039,
"step": 11000
},
{
"epoch": 2.28,
"learning_rate": 3.861611562066917e-05,
"loss": 0.4856,
"step": 11500
},
{
"epoch": 2.38,
"learning_rate": 3.812116412591566e-05,
"loss": 0.4691,
"step": 12000
},
{
"epoch": 2.38,
"eval_COMMENT": {
"f1": 0.6842557693579316,
"number": 6901,
"precision": 0.6292872780345414,
"recall": 0.7497464135632517
},
"eval_NAME": {
"f1": 0.803944509443423,
"number": 8857,
"precision": 0.7935547734271887,
"recall": 0.8146099130631139
},
"eval_QTY": {
"f1": 0.984621778886118,
"number": 7189,
"precision": 0.9806816613771215,
"recall": 0.9885936847962165
},
"eval_RANGE_END": {
"f1": 0.780701754385965,
"number": 92,
"precision": 0.6544117647058824,
"recall": 0.967391304347826
},
"eval_UNIT": {
"f1": 0.9528556944913822,
"number": 5732,
"precision": 0.9238204456094364,
"recall": 0.9837752965806001
},
"eval_loss": 0.4902682304382324,
"eval_overall_accuracy": 0.8301407275348026,
"eval_overall_f1": 0.84684079769019,
"eval_overall_precision": 0.818934450180189,
"eval_overall_recall": 0.8767161377776233,
"eval_runtime": 8.9123,
"eval_samples_per_second": 954.413,
"eval_steps_per_second": 29.846,
"step": 12000
},
{
"epoch": 2.47,
"learning_rate": 3.762621263116215e-05,
"loss": 0.4806,
"step": 12500
},
{
"epoch": 2.57,
"learning_rate": 3.7131261136408633e-05,
"loss": 0.4765,
"step": 13000
},
{
"epoch": 2.57,
"eval_COMMENT": {
"f1": 0.6893633899649634,
"number": 6901,
"precision": 0.6338439095550693,
"recall": 0.7555426749746413
},
"eval_NAME": {
"f1": 0.805656475322788,
"number": 8857,
"precision": 0.7977640026566305,
"recall": 0.8137066726882691
},
"eval_QTY": {
"f1": 0.9841977027497391,
"number": 7189,
"precision": 0.9850891861761427,
"recall": 0.9833078314090973
},
"eval_RANGE_END": {
"f1": 0.7777777777777777,
"number": 92,
"precision": 0.6774193548387096,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9518021440027011,
"number": 5732,
"precision": 0.9219950940310712,
"recall": 0.9836008374040475
},
"eval_loss": 0.4845636188983917,
"eval_overall_accuracy": 0.8307097067860258,
"eval_overall_f1": 0.8482320088820106,
"eval_overall_precision": 0.8219070904645477,
"eval_overall_recall": 0.8762990511278718,
"eval_runtime": 6.7092,
"eval_samples_per_second": 1267.814,
"eval_steps_per_second": 39.647,
"step": 13000
},
{
"epoch": 2.67,
"learning_rate": 3.663630964165512e-05,
"loss": 0.4715,
"step": 13500
},
{
"epoch": 2.77,
"learning_rate": 3.6141358146901606e-05,
"loss": 0.4747,
"step": 14000
},
{
"epoch": 2.77,
"eval_COMMENT": {
"f1": 0.6842317515795134,
"number": 6901,
"precision": 0.6380844929171368,
"recall": 0.7375742645993334
},
"eval_NAME": {
"f1": 0.8026484170700496,
"number": 8857,
"precision": 0.791246160596753,
"recall": 0.8143841029694028
},
"eval_QTY": {
"f1": 0.9847090569431951,
"number": 7189,
"precision": 0.9796255506607929,
"recall": 0.9898455974405341
},
"eval_RANGE_END": {
"f1": 0.7878787878787878,
"number": 92,
"precision": 0.6546762589928058,
"recall": 0.9891304347826086
},
"eval_UNIT": {
"f1": 0.9519481612387444,
"number": 5732,
"precision": 0.9195252804422045,
"recall": 0.9867411025819958
},
"eval_loss": 0.4844052493572235,
"eval_overall_accuracy": 0.8314304138375754,
"eval_overall_f1": 0.8470833754081255,
"eval_overall_precision": 0.8211570463666917,
"eval_overall_recall": 0.8747002189704911,
"eval_runtime": 8.8562,
"eval_samples_per_second": 960.458,
"eval_steps_per_second": 30.035,
"step": 14000
},
{
"epoch": 2.87,
"learning_rate": 3.564640665214809e-05,
"loss": 0.4673,
"step": 14500
},
{
"epoch": 2.97,
"learning_rate": 3.515145515739457e-05,
"loss": 0.4654,
"step": 15000
},
{
"epoch": 2.97,
"eval_COMMENT": {
"f1": 0.6951928862739855,
"number": 6901,
"precision": 0.6453574975173784,
"recall": 0.7533690769453703
},
"eval_NAME": {
"f1": 0.8027195720017833,
"number": 8857,
"precision": 0.7925608011444921,
"recall": 0.8131421474539912
},
"eval_QTY": {
"f1": 0.9852237252861602,
"number": 7189,
"precision": 0.9827013562136728,
"recall": 0.9877590763666713
},
"eval_RANGE_END": {
"f1": 0.7802690582959643,
"number": 92,
"precision": 0.6641221374045801,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9533801506049582,
"number": 5732,
"precision": 0.9255791030064071,
"recall": 0.9829030006978368
},
"eval_loss": 0.48082008957862854,
"eval_overall_accuracy": 0.8331752835413269,
"eval_overall_f1": 0.8498601704909194,
"eval_overall_precision": 0.8246313793441659,
"eval_overall_recall": 0.8766813805568107,
"eval_runtime": 7.2911,
"eval_samples_per_second": 1166.621,
"eval_steps_per_second": 36.483,
"step": 15000
},
{
"epoch": 3.07,
"learning_rate": 3.465650366264107e-05,
"loss": 0.4573,
"step": 15500
},
{
"epoch": 3.17,
"learning_rate": 3.416155216788755e-05,
"loss": 0.4586,
"step": 16000
},
{
"epoch": 3.17,
"eval_COMMENT": {
"f1": 0.6976900801400768,
"number": 6901,
"precision": 0.6517362858580775,
"recall": 0.7506158527749601
},
"eval_NAME": {
"f1": 0.8010911317708622,
"number": 8857,
"precision": 0.7901383703052932,
"recall": 0.812351812126002
},
"eval_QTY": {
"f1": 0.9851262538913871,
"number": 7189,
"precision": 0.979906413432425,
"recall": 0.990402003060231
},
"eval_RANGE_END": {
"f1": 0.7802690582959643,
"number": 92,
"precision": 0.6641221374045801,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9516034003871727,
"number": 5732,
"precision": 0.9193364774760123,
"recall": 0.9862177250523377
},
"eval_loss": 0.48265689611434937,
"eval_overall_accuracy": 0.8316959374881463,
"eval_overall_f1": 0.8500783210658401,
"eval_overall_precision": 0.824673202614379,
"eval_overall_recall": 0.8770984672065621,
"eval_runtime": 9.1659,
"eval_samples_per_second": 928.008,
"eval_steps_per_second": 29.021,
"step": 16000
},
{
"epoch": 3.27,
"learning_rate": 3.3666600673134034e-05,
"loss": 0.4591,
"step": 16500
},
{
"epoch": 3.37,
"learning_rate": 3.317164917838052e-05,
"loss": 0.4612,
"step": 17000
},
{
"epoch": 3.37,
"eval_COMMENT": {
"f1": 0.6966127636920211,
"number": 6901,
"precision": 0.6441053408811224,
"recall": 0.7584408056803362
},
"eval_NAME": {
"f1": 0.7990913120567377,
"number": 8857,
"precision": 0.7845718637797846,
"recall": 0.8141582928756915
},
"eval_QTY": {
"f1": 0.9846325012168833,
"number": 7189,
"precision": 0.9844271412680756,
"recall": 0.9848379468632633
},
"eval_RANGE_END": {
"f1": 0.7802690582959643,
"number": 92,
"precision": 0.6641221374045801,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9502140878179833,
"number": 5732,
"precision": 0.9158439877002751,
"recall": 0.9872644801116539
},
"eval_loss": 0.4868798851966858,
"eval_overall_accuracy": 0.8307666047111482,
"eval_overall_f1": 0.8481624433629804,
"eval_overall_precision": 0.8199811804406373,
"eval_overall_recall": 0.8783497271558166,
"eval_runtime": 7.3722,
"eval_samples_per_second": 1153.794,
"eval_steps_per_second": 36.081,
"step": 17000
},
{
"epoch": 3.46,
"learning_rate": 3.267669768362701e-05,
"loss": 0.4592,
"step": 17500
},
{
"epoch": 3.56,
"learning_rate": 3.218174618887349e-05,
"loss": 0.4546,
"step": 18000
},
{
"epoch": 3.56,
"eval_COMMENT": {
"f1": 0.6903326332904275,
"number": 6901,
"precision": 0.6482188295165394,
"recall": 0.7382987972757571
},
"eval_NAME": {
"f1": 0.8029488387561666,
"number": 8857,
"precision": 0.788654181184669,
"recall": 0.8177712543750706
},
"eval_QTY": {
"f1": 0.9853083853083853,
"number": 7189,
"precision": 0.9817704736914791,
"recall": 0.9888718876060648
},
"eval_RANGE_END": {
"f1": 0.787037037037037,
"number": 92,
"precision": 0.6854838709677419,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9534019922336655,
"number": 5732,
"precision": 0.9236179260713118,
"recall": 0.9851709699930217
},
"eval_loss": 0.480613112449646,
"eval_overall_accuracy": 0.8314683457876569,
"eval_overall_f1": 0.8492933517725234,
"eval_overall_precision": 0.8249189136061331,
"eval_overall_recall": 0.8751520628410552,
"eval_runtime": 8.0402,
"eval_samples_per_second": 1057.931,
"eval_steps_per_second": 33.084,
"step": 18000
},
{
"epoch": 3.66,
"learning_rate": 3.168679469411997e-05,
"loss": 0.4609,
"step": 18500
},
{
"epoch": 3.76,
"learning_rate": 3.119184319936647e-05,
"loss": 0.4471,
"step": 19000
},
{
"epoch": 3.76,
"eval_COMMENT": {
"f1": 0.6993611924407772,
"number": 6901,
"precision": 0.6466100652147164,
"recall": 0.7614838429213158
},
"eval_NAME": {
"f1": 0.8037861915367484,
"number": 8857,
"precision": 0.7929254092057564,
"recall": 0.8149486282036807
},
"eval_QTY": {
"f1": 0.9852052510939778,
"number": 7189,
"precision": 0.983906770255272,
"recall": 0.9865071637223536
},
"eval_RANGE_END": {
"f1": 0.7927927927927929,
"number": 92,
"precision": 0.676923076923077,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9520276536548351,
"number": 5732,
"precision": 0.9211943220753793,
"recall": 0.984996510816469
},
"eval_loss": 0.4822600483894348,
"eval_overall_accuracy": 0.8327769980654706,
"eval_overall_f1": 0.8508441514764242,
"eval_overall_precision": 0.8241521972831222,
"eval_overall_recall": 0.87932292933857,
"eval_runtime": 8.7949,
"eval_samples_per_second": 967.151,
"eval_steps_per_second": 30.245,
"step": 19000
},
{
"epoch": 3.86,
"learning_rate": 3.069689170461295e-05,
"loss": 0.4581,
"step": 19500
},
{
"epoch": 3.96,
"learning_rate": 3.0201940209859435e-05,
"loss": 0.4542,
"step": 20000
},
{
"epoch": 3.96,
"eval_COMMENT": {
"f1": 0.6950766529344229,
"number": 6901,
"precision": 0.6508980521123198,
"recall": 0.7456890305752789
},
"eval_NAME": {
"f1": 0.7992666259236624,
"number": 8857,
"precision": 0.7868081382629621,
"recall": 0.8121260020322908
},
"eval_QTY": {
"f1": 0.9853604384930272,
"number": 7189,
"precision": 0.9829734219269103,
"recall": 0.9877590763666713
},
"eval_RANGE_END": {
"f1": 0.7873303167420815,
"number": 92,
"precision": 0.6744186046511628,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9524210526315788,
"number": 5732,
"precision": 0.920559986977047,
"recall": 0.9865666434054431
},
"eval_loss": 0.47578319907188416,
"eval_overall_accuracy": 0.832568372340022,
"eval_overall_f1": 0.8490938211245047,
"eval_overall_precision": 0.8244499738082766,
"eval_overall_recall": 0.875256334503493,
"eval_runtime": 6.7831,
"eval_samples_per_second": 1253.998,
"eval_steps_per_second": 39.215,
"step": 20000
},
{
"epoch": 4.06,
"learning_rate": 2.970698871510592e-05,
"loss": 0.4454,
"step": 20500
},
{
"epoch": 4.16,
"learning_rate": 2.9212037220352405e-05,
"loss": 0.4452,
"step": 21000
},
{
"epoch": 4.16,
"eval_COMMENT": {
"f1": 0.6982899022801302,
"number": 6901,
"precision": 0.6566687938736439,
"recall": 0.7455441240399941
},
"eval_NAME": {
"f1": 0.7992468294844105,
"number": 8857,
"precision": 0.7843478260869565,
"recall": 0.8147228181099695
},
"eval_QTY": {
"f1": 0.9847455276660656,
"number": 7189,
"precision": 0.981750311074243,
"recall": 0.9877590763666713
},
"eval_RANGE_END": {
"f1": 0.787037037037037,
"number": 92,
"precision": 0.6854838709677419,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9537733457280487,
"number": 5732,
"precision": 0.9249303392886412,
"recall": 0.9844731332868109
},
"eval_loss": 0.48325347900390625,
"eval_overall_accuracy": 0.8338959905928763,
"eval_overall_f1": 0.8500944924406048,
"eval_overall_precision": 0.8260912340537172,
"eval_overall_recall": 0.8755343922699941,
"eval_runtime": 9.0461,
"eval_samples_per_second": 940.291,
"eval_steps_per_second": 29.405,
"step": 21000
},
{
"epoch": 4.26,
"learning_rate": 2.871708572559889e-05,
"loss": 0.4217,
"step": 21500
},
{
"epoch": 4.36,
"learning_rate": 2.8222134230845377e-05,
"loss": 0.4412,
"step": 22000
},
{
"epoch": 4.36,
"eval_COMMENT": {
"f1": 0.6974386700006758,
"number": 6901,
"precision": 0.6534954407294833,
"recall": 0.7477177220692653
},
"eval_NAME": {
"f1": 0.8008429926238145,
"number": 8857,
"precision": 0.7870067582297798,
"recall": 0.8151744382973919
},
"eval_QTY": {
"f1": 0.9858392336526447,
"number": 7189,
"precision": 0.9839268394069558,
"recall": 0.9877590763666713
},
"eval_RANGE_END": {
"f1": 0.789237668161435,
"number": 92,
"precision": 0.6717557251908397,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9540462916033113,
"number": 5732,
"precision": 0.9248280379954144,
"recall": 0.9851709699930217
},
"eval_loss": 0.4888293445110321,
"eval_overall_accuracy": 0.8325494063649812,
"eval_overall_f1": 0.8505270258875117,
"eval_overall_precision": 0.8261040492727034,
"eval_overall_recall": 0.8764380800111223,
"eval_runtime": 6.5585,
"eval_samples_per_second": 1296.944,
"eval_steps_per_second": 40.558,
"step": 22000
},
{
"epoch": 4.45,
"learning_rate": 2.7727182736091867e-05,
"loss": 0.4481,
"step": 22500
},
{
"epoch": 4.55,
"learning_rate": 2.7232231241338353e-05,
"loss": 0.4423,
"step": 23000
},
{
"epoch": 4.55,
"eval_COMMENT": {
"f1": 0.6981985021253626,
"number": 6901,
"precision": 0.6532828282828282,
"recall": 0.7497464135632517
},
"eval_NAME": {
"f1": 0.8019725177304966,
"number": 8857,
"precision": 0.7874007180937874,
"recall": 0.817093824093937
},
"eval_QTY": {
"f1": 0.9857043719639139,
"number": 7189,
"precision": 0.9835202880487467,
"recall": 0.9878981777715955
},
"eval_RANGE_END": {
"f1": 0.7999999999999999,
"number": 92,
"precision": 0.6766917293233082,
"recall": 0.9782608695652174
},
"eval_UNIT": {
"f1": 0.9548452562151193,
"number": 5732,
"precision": 0.9264850672792911,
"recall": 0.984996510816469
},
"eval_loss": 0.4827423095703125,
"eval_overall_accuracy": 0.8337821947426317,
"eval_overall_f1": 0.8511377043654138,
"eval_overall_precision": 0.8262377695605223,
"eval_overall_recall": 0.8775850682979389,
"eval_runtime": 8.9572,
"eval_samples_per_second": 949.629,
"eval_steps_per_second": 29.697,
"step": 23000
},
{
"epoch": 4.65,
"learning_rate": 2.6737279746584836e-05,
"loss": 0.4519,
"step": 23500
},
{
"epoch": 4.75,
"learning_rate": 2.6242328251831323e-05,
"loss": 0.4507,
"step": 24000
},
{
"epoch": 4.75,
"eval_COMMENT": {
"f1": 0.69833923223523,
"number": 6901,
"precision": 0.6584520600693108,
"recall": 0.7433705260107231
},
"eval_NAME": {
"f1": 0.8048291977300545,
"number": 8857,
"precision": 0.7933530766699572,
"recall": 0.8166422039065147
},
"eval_QTY": {
"f1": 0.9856135011758197,
"number": 7189,
"precision": 0.9801898472967395,
"recall": 0.9910975100848518
},
"eval_RANGE_END": {
"f1": 0.7837837837837838,
"number": 92,
"precision": 0.6692307692307692,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9537942664418213,
"number": 5732,
"precision": 0.922976501305483,
"recall": 0.9867411025819958
},
"eval_loss": 0.474032998085022,
"eval_overall_accuracy": 0.8347115275196297,
"eval_overall_f1": 0.8523122656487518,
"eval_overall_precision": 0.8290126499096435,
"eval_overall_recall": 0.8769594383233117,
"eval_runtime": 7.5421,
"eval_samples_per_second": 1127.8,
"eval_steps_per_second": 35.269,
"step": 24000
},
{
"epoch": 4.85,
"learning_rate": 2.5747376757077806e-05,
"loss": 0.4377,
"step": 24500
},
{
"epoch": 4.95,
"learning_rate": 2.5252425262324292e-05,
"loss": 0.4452,
"step": 25000
},
{
"epoch": 4.95,
"eval_COMMENT": {
"f1": 0.7040598290598291,
"number": 6901,
"precision": 0.6528792569659443,
"recall": 0.7639472540211564
},
"eval_NAME": {
"f1": 0.8012646292084975,
"number": 8857,
"precision": 0.7875054513737462,
"recall": 0.8155131534379587
},
"eval_QTY": {
"f1": 0.9855775897933713,
"number": 7189,
"precision": 0.9825798423890502,
"recall": 0.9885936847962165
},
"eval_RANGE_END": {
"f1": 0.7727272727272728,
"number": 92,
"precision": 0.6640625,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.953449148254343,
"number": 5732,
"precision": 0.9227881162259223,
"recall": 0.9862177250523377
},
"eval_loss": 0.4791179597377777,
"eval_overall_accuracy": 0.8352236088457308,
"eval_overall_f1": 0.8516931350306697,
"eval_overall_precision": 0.8244940456823062,
"eval_overall_recall": 0.8807479753918876,
"eval_runtime": 6.5842,
"eval_samples_per_second": 1291.88,
"eval_steps_per_second": 40.4,
"step": 25000
},
{
"epoch": 5.05,
"learning_rate": 2.4757473767570778e-05,
"loss": 0.4442,
"step": 25500
},
{
"epoch": 5.15,
"learning_rate": 2.4262522272817265e-05,
"loss": 0.4274,
"step": 26000
},
{
"epoch": 5.15,
"eval_COMMENT": {
"f1": 0.7096947333109694,
"number": 6901,
"precision": 0.6607946026986506,
"recall": 0.766410665120997
},
"eval_NAME": {
"f1": 0.8056639536180176,
"number": 8857,
"precision": 0.795727342803656,
"recall": 0.8158518685785254
},
"eval_QTY": {
"f1": 0.9859017987360232,
"number": 7189,
"precision": 0.9844660194174757,
"recall": 0.9873417721518988
},
"eval_RANGE_END": {
"f1": 0.7962962962962964,
"number": 92,
"precision": 0.6935483870967742,
"recall": 0.9347826086956522
},
"eval_UNIT": {
"f1": 0.9532647207693606,
"number": 5732,
"precision": 0.9229010127409344,
"recall": 0.9856943475226797
},
"eval_loss": 0.48070788383483887,
"eval_overall_accuracy": 0.836058111747525,
"eval_overall_f1": 0.854768006474238,
"eval_overall_precision": 0.8299990177138928,
"eval_overall_recall": 0.8810607903792013,
"eval_runtime": 9.3326,
"eval_samples_per_second": 911.433,
"eval_steps_per_second": 28.502,
"step": 26000
},
{
"epoch": 5.25,
"learning_rate": 2.376757077806375e-05,
"loss": 0.432,
"step": 26500
},
{
"epoch": 5.35,
"learning_rate": 2.3272619283310237e-05,
"loss": 0.4312,
"step": 27000
},
{
"epoch": 5.35,
"eval_COMMENT": {
"f1": 0.7056545830829829,
"number": 6901,
"precision": 0.6542461005199307,
"recall": 0.7658310389798579
},
"eval_NAME": {
"f1": 0.8019135562107137,
"number": 8857,
"precision": 0.7903508771929825,
"recall": 0.8138195777351248
},
"eval_QTY": {
"f1": 0.9852421533984619,
"number": 7189,
"precision": 0.981501932633904,
"recall": 0.989010989010989
},
"eval_RANGE_END": {
"f1": 0.789237668161435,
"number": 92,
"precision": 0.6717557251908397,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9502391541495343,
"number": 5732,
"precision": 0.9154405820533549,
"recall": 0.9877878576413119
},
"eval_loss": 0.48605257272720337,
"eval_overall_accuracy": 0.83349770511702,
"eval_overall_f1": 0.8517865242150884,
"eval_overall_precision": 0.8242733597763183,
"eval_overall_recall": 0.8811998192624517,
"eval_runtime": 7.0035,
"eval_samples_per_second": 1214.536,
"eval_steps_per_second": 37.981,
"step": 27000
},
{
"epoch": 5.44,
"learning_rate": 2.2777667788556724e-05,
"loss": 0.4321,
"step": 27500
},
{
"epoch": 5.54,
"learning_rate": 2.2282716293803206e-05,
"loss": 0.4315,
"step": 28000
},
{
"epoch": 5.54,
"eval_COMMENT": {
"f1": 0.7045745469244761,
"number": 6901,
"precision": 0.6583983883152859,
"recall": 0.7577162730039124
},
"eval_NAME": {
"f1": 0.8038757099899767,
"number": 8857,
"precision": 0.7930996593780903,
"recall": 0.8149486282036807
},
"eval_QTY": {
"f1": 0.9861322978782415,
"number": 7189,
"precision": 0.9831328632655882,
"recall": 0.9891500904159132
},
"eval_RANGE_END": {
"f1": 0.7909090909090909,
"number": 92,
"precision": 0.6796875,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9528698872243729,
"number": 5732,
"precision": 0.9204878048780488,
"recall": 0.9876133984647593
},
"eval_loss": 0.481955349445343,
"eval_overall_accuracy": 0.8341235822933657,
"eval_overall_f1": 0.8531310577328276,
"eval_overall_precision": 0.8282385285069058,
"eval_overall_recall": 0.8795662298842585,
"eval_runtime": 8.4264,
"eval_samples_per_second": 1009.444,
"eval_steps_per_second": 31.567,
"step": 28000
},
{
"epoch": 5.64,
"learning_rate": 2.1787764799049696e-05,
"loss": 0.4328,
"step": 28500
},
{
"epoch": 5.74,
"learning_rate": 2.129281330429618e-05,
"loss": 0.4316,
"step": 29000
},
{
"epoch": 5.74,
"eval_COMMENT": {
"f1": 0.7066999527697188,
"number": 6901,
"precision": 0.6612373737373738,
"recall": 0.7588755252861904
},
"eval_NAME": {
"f1": 0.8088874039425326,
"number": 8857,
"precision": 0.7980441709702231,
"recall": 0.8200293553121825
},
"eval_QTY": {
"f1": 0.9862747816442535,
"number": 7189,
"precision": 0.9830040071852978,
"recall": 0.9895673946306858
},
"eval_RANGE_END": {
"f1": 0.7741935483870968,
"number": 92,
"precision": 0.672,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.955117910573916,
"number": 5732,
"precision": 0.9263813739957371,
"recall": 0.9856943475226797
},
"eval_loss": 0.4761992394924164,
"eval_overall_accuracy": 0.836987444524523,
"eval_overall_f1": 0.8555853712048336,
"eval_overall_precision": 0.8315727314480678,
"eval_overall_recall": 0.8810260331583887,
"eval_runtime": 8.3244,
"eval_samples_per_second": 1021.82,
"eval_steps_per_second": 31.954,
"step": 29000
},
{
"epoch": 5.84,
"learning_rate": 2.0797861809542665e-05,
"loss": 0.4429,
"step": 29500
},
{
"epoch": 5.94,
"learning_rate": 2.0302910314789152e-05,
"loss": 0.4278,
"step": 30000
},
{
"epoch": 5.94,
"eval_COMMENT": {
"f1": 0.7081487447979596,
"number": 6901,
"precision": 0.6596223583843942,
"recall": 0.7643819736270105
},
"eval_NAME": {
"f1": 0.8039357385068653,
"number": 8857,
"precision": 0.7918309242225142,
"recall": 0.8164163938128034
},
"eval_QTY": {
"f1": 0.9861265260821309,
"number": 7189,
"precision": 0.9835339698353397,
"recall": 0.9887327862011406
},
"eval_RANGE_END": {
"f1": 0.783410138248848,
"number": 92,
"precision": 0.68,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9540695710908478,
"number": 5732,
"precision": 0.9244109947643979,
"recall": 0.9856943475226797
},
"eval_loss": 0.4822809398174286,
"eval_overall_accuracy": 0.8347684254447522,
"eval_overall_f1": 0.8540192709386161,
"eval_overall_precision": 0.8285882391396725,
"eval_overall_recall": 0.8810607903792013,
"eval_runtime": 6.5281,
"eval_samples_per_second": 1302.987,
"eval_steps_per_second": 40.747,
"step": 30000
},
{
"epoch": 6.04,
"learning_rate": 1.9807958820035638e-05,
"loss": 0.4251,
"step": 30500
},
{
"epoch": 6.14,
"learning_rate": 1.9313007325282124e-05,
"loss": 0.4211,
"step": 31000
},
{
"epoch": 6.14,
"eval_COMMENT": {
"f1": 0.705458989679522,
"number": 6901,
"precision": 0.6637281206081512,
"recall": 0.7527894508042313
},
"eval_NAME": {
"f1": 0.7998453978245265,
"number": 8857,
"precision": 0.7826885671061162,
"recall": 0.8177712543750706
},
"eval_QTY": {
"f1": 0.9858901646147462,
"number": 7189,
"precision": 0.9804649883065071,
"recall": 0.9913757128947003
},
"eval_RANGE_END": {
"f1": 0.787037037037037,
"number": 92,
"precision": 0.6854838709677419,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9548103724976772,
"number": 5732,
"precision": 0.925495333224169,
"recall": 0.9860432658757851
},
"eval_loss": 0.47935572266578674,
"eval_overall_accuracy": 0.8356218943215871,
"eval_overall_f1": 0.8526081682167409,
"eval_overall_precision": 0.8273764755894183,
"eval_overall_recall": 0.8794272010010079,
"eval_runtime": 9.2091,
"eval_samples_per_second": 923.653,
"eval_steps_per_second": 28.885,
"step": 31000
},
{
"epoch": 6.24,
"learning_rate": 1.8818055830528607e-05,
"loss": 0.4113,
"step": 31500
},
{
"epoch": 6.34,
"learning_rate": 1.8323104335775097e-05,
"loss": 0.4231,
"step": 32000
},
{
"epoch": 6.34,
"eval_COMMENT": {
"f1": 0.7081927385612093,
"number": 6901,
"precision": 0.6627510420613869,
"recall": 0.7603245906390378
},
"eval_NAME": {
"f1": 0.8008871638480732,
"number": 8857,
"precision": 0.7868816735672259,
"recall": 0.815400248391103
},
"eval_QTY": {
"f1": 0.9866055937261433,
"number": 7189,
"precision": 0.9844875346260388,
"recall": 0.9887327862011406
},
"eval_RANGE_END": {
"f1": 0.8018433179723502,
"number": 92,
"precision": 0.696,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9542042675212956,
"number": 5732,
"precision": 0.9235918367346939,
"recall": 0.9869155617585486
},
"eval_loss": 0.4756552577018738,
"eval_overall_accuracy": 0.8364374312483405,
"eval_overall_f1": 0.8534784953485236,
"eval_overall_precision": 0.8284312121707835,
"eval_overall_recall": 0.8800875881964478,
"eval_runtime": 6.7948,
"eval_samples_per_second": 1251.831,
"eval_steps_per_second": 39.147,
"step": 32000
},
{
"epoch": 6.43,
"learning_rate": 1.782815284102158e-05,
"loss": 0.4209,
"step": 32500
},
{
"epoch": 6.53,
"learning_rate": 1.7333201346268066e-05,
"loss": 0.4302,
"step": 33000
},
{
"epoch": 6.53,
"eval_COMMENT": {
"f1": 0.706057529610829,
"number": 6901,
"precision": 0.6624333248666497,
"recall": 0.7558324880452109
},
"eval_NAME": {
"f1": 0.8062360801781736,
"number": 8857,
"precision": 0.7953421948808085,
"recall": 0.8174325392345038
},
"eval_QTY": {
"f1": 0.986130374479889,
"number": 7189,
"precision": 0.9832664914949523,
"recall": 0.989010989010989
},
"eval_RANGE_END": {
"f1": 0.7766990291262136,
"number": 92,
"precision": 0.7017543859649122,
"recall": 0.8695652173913043
},
"eval_UNIT": {
"f1": 0.9544303797468354,
"number": 5732,
"precision": 0.9243216737495914,
"recall": 0.9865666434054431
},
"eval_loss": 0.4785662591457367,
"eval_overall_accuracy": 0.8354891324963016,
"eval_overall_f1": 0.8546047187178056,
"eval_overall_precision": 0.8311760840998685,
"eval_overall_recall": 0.8793924437801953,
"eval_runtime": 8.3624,
"eval_samples_per_second": 1017.166,
"eval_steps_per_second": 31.809,
"step": 33000
},
{
"epoch": 6.63,
"learning_rate": 1.6838249851514553e-05,
"loss": 0.4309,
"step": 33500
},
{
"epoch": 6.73,
"learning_rate": 1.634329835676104e-05,
"loss": 0.4223,
"step": 34000
},
{
"epoch": 6.73,
"eval_COMMENT": {
"f1": 0.703981612925032,
"number": 6901,
"precision": 0.6597820577800304,
"recall": 0.7545283292276481
},
"eval_NAME": {
"f1": 0.8044022011005503,
"number": 8857,
"precision": 0.7922049485439019,
"recall": 0.8169809190470814
},
"eval_QTY": {
"f1": 0.986130374479889,
"number": 7189,
"precision": 0.9832664914949523,
"recall": 0.989010989010989
},
"eval_RANGE_END": {
"f1": 0.7981651376146789,
"number": 92,
"precision": 0.6904761904761905,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9541965415436525,
"number": 5732,
"precision": 0.923730197615548,
"recall": 0.9867411025819958
},
"eval_loss": 0.4795403480529785,
"eval_overall_accuracy": 0.836304669423055,
"eval_overall_f1": 0.8534844880813807,
"eval_overall_precision": 0.8292139251294828,
"eval_overall_recall": 0.8792186576761322,
"eval_runtime": 8.6534,
"eval_samples_per_second": 982.967,
"eval_steps_per_second": 30.739,
"step": 34000
},
{
"epoch": 6.83,
"learning_rate": 1.5848346862007525e-05,
"loss": 0.4119,
"step": 34500
},
{
"epoch": 6.93,
"learning_rate": 1.535339536725401e-05,
"loss": 0.4184,
"step": 35000
},
{
"epoch": 6.93,
"eval_COMMENT": {
"f1": 0.7059539095762654,
"number": 6901,
"precision": 0.6614741641337386,
"recall": 0.7568468337922041
},
"eval_NAME": {
"f1": 0.8020405899966729,
"number": 8857,
"precision": 0.788057099269914,
"recall": 0.8165292988596591
},
"eval_QTY": {
"f1": 0.9865650969529086,
"number": 7189,
"precision": 0.9823472624465591,
"recall": 0.9908193072750034
},
"eval_RANGE_END": {
"f1": 0.7963800904977375,
"number": 92,
"precision": 0.6821705426356589,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9530710253601821,
"number": 5732,
"precision": 0.9216229428059313,
"recall": 0.9867411025819958
},
"eval_loss": 0.4803193211555481,
"eval_overall_accuracy": 0.8355839623715056,
"eval_overall_f1": 0.8531527433837031,
"eval_overall_precision": 0.8277868584504741,
"eval_overall_recall": 0.8801223454172604,
"eval_runtime": 7.0311,
"eval_samples_per_second": 1209.766,
"eval_steps_per_second": 37.832,
"step": 35000
},
{
"epoch": 7.03,
"learning_rate": 1.4858443872500496e-05,
"loss": 0.4189,
"step": 35500
},
{
"epoch": 7.13,
"learning_rate": 1.4363492377746981e-05,
"loss": 0.4071,
"step": 36000
},
{
"epoch": 7.13,
"eval_COMMENT": {
"f1": 0.7068977142471848,
"number": 6901,
"precision": 0.6610340479192938,
"recall": 0.7596000579626141
},
"eval_NAME": {
"f1": 0.8058371393561323,
"number": 8857,
"precision": 0.7952072111685171,
"recall": 0.8167551089533702
},
"eval_QTY": {
"f1": 0.9864247125640672,
"number": 7189,
"precision": 0.9823423920540765,
"recall": 0.9905411044651551
},
"eval_RANGE_END": {
"f1": 0.7981651376146789,
"number": 92,
"precision": 0.6904761904761905,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9542881284326151,
"number": 5732,
"precision": 0.9252826478780928,
"recall": 0.9851709699930217
},
"eval_loss": 0.48823681473731995,
"eval_overall_accuracy": 0.8358115540719948,
"eval_overall_f1": 0.8546798029556651,
"eval_overall_precision": 0.8303884609080479,
"eval_overall_recall": 0.880435160404574,
"eval_runtime": 9.3911,
"eval_samples_per_second": 905.75,
"eval_steps_per_second": 28.325,
"step": 36000
},
{
"epoch": 7.23,
"learning_rate": 1.3868540882993467e-05,
"loss": 0.4066,
"step": 36500
},
{
"epoch": 7.33,
"learning_rate": 1.3373589388239954e-05,
"loss": 0.4093,
"step": 37000
},
{
"epoch": 7.33,
"eval_COMMENT": {
"f1": 0.7065691471515801,
"number": 6901,
"precision": 0.6579605098725319,
"recall": 0.7629329082741632
},
"eval_NAME": {
"f1": 0.8055648302726766,
"number": 8857,
"precision": 0.794249972566663,
"recall": 0.8172067291407926
},
"eval_QTY": {
"f1": 0.9863412604867227,
"number": 7189,
"precision": 0.9832734310201825,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.7924528301886793,
"number": 92,
"precision": 0.7,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9535530641490347,
"number": 5732,
"precision": 0.9225248735932148,
"recall": 0.9867411025819958
},
"eval_loss": 0.48563364148139954,
"eval_overall_accuracy": 0.8367219208739521,
"eval_overall_f1": 0.8541543851375251,
"eval_overall_precision": 0.8286274509803921,
"eval_overall_recall": 0.8813040909248896,
"eval_runtime": 6.6204,
"eval_samples_per_second": 1284.823,
"eval_steps_per_second": 40.179,
"step": 37000
},
{
"epoch": 7.42,
"learning_rate": 1.287863789348644e-05,
"loss": 0.4197,
"step": 37500
},
{
"epoch": 7.52,
"learning_rate": 1.2383686398732925e-05,
"loss": 0.4124,
"step": 38000
},
{
"epoch": 7.52,
"eval_COMMENT": {
"f1": 0.7066407036862955,
"number": 6901,
"precision": 0.6584084084084084,
"recall": 0.762498188668309
},
"eval_NAME": {
"f1": 0.8056977520587582,
"number": 8857,
"precision": 0.7942951179374658,
"recall": 0.8174325392345038
},
"eval_QTY": {
"f1": 0.9862728785357736,
"number": 7189,
"precision": 0.9831375259156876,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.7963800904977375,
"number": 92,
"precision": 0.6821705426356589,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9536647009267059,
"number": 5732,
"precision": 0.9221244705115673,
"recall": 0.9874389392882066
},
"eval_loss": 0.4802015423774719,
"eval_overall_accuracy": 0.8361908735728104,
"eval_overall_f1": 0.8542606938363086,
"eval_overall_precision": 0.8286124995916234,
"eval_overall_recall": 0.881547391470578,
"eval_runtime": 9.142,
"eval_samples_per_second": 930.428,
"eval_steps_per_second": 29.096,
"step": 38000
},
{
"epoch": 7.62,
"learning_rate": 1.1888734903979411e-05,
"loss": 0.4071,
"step": 38500
},
{
"epoch": 7.72,
"learning_rate": 1.1393783409225896e-05,
"loss": 0.414,
"step": 39000
},
{
"epoch": 7.72,
"eval_COMMENT": {
"f1": 0.7048144163528779,
"number": 6901,
"precision": 0.6575084681972149,
"recall": 0.7594551514273293
},
"eval_NAME": {
"f1": 0.8015089315433264,
"number": 8857,
"precision": 0.7878721779910568,
"recall": 0.8156260584848143
},
"eval_QTY": {
"f1": 0.9858686616791354,
"number": 7189,
"precision": 0.9819235545743066,
"recall": 0.9898455974405341
},
"eval_RANGE_END": {
"f1": 0.7945205479452054,
"number": 92,
"precision": 0.6850393700787402,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9549138804457953,
"number": 5732,
"precision": 0.925229057591623,
"recall": 0.9865666434054431
},
"eval_loss": 0.483047753572464,
"eval_overall_accuracy": 0.8365701930736259,
"eval_overall_f1": 0.8526693267336735,
"eval_overall_precision": 0.8268464703193366,
"eval_overall_recall": 0.880157102638073,
"eval_runtime": 7.5994,
"eval_samples_per_second": 1119.299,
"eval_steps_per_second": 35.003,
"step": 39000
},
{
"epoch": 7.82,
"learning_rate": 1.0898831914472382e-05,
"loss": 0.4196,
"step": 39500
},
{
"epoch": 7.92,
"learning_rate": 1.0403880419718868e-05,
"loss": 0.4212,
"step": 40000
},
{
"epoch": 7.92,
"eval_COMMENT": {
"f1": 0.7108280254777071,
"number": 6901,
"precision": 0.6614674319940105,
"recall": 0.7681495435444139
},
"eval_NAME": {
"f1": 0.8036936084997496,
"number": 8857,
"precision": 0.7921052631578948,
"recall": 0.8156260584848143
},
"eval_QTY": {
"f1": 0.9861815151725575,
"number": 7189,
"precision": 0.9846089850249584,
"recall": 0.9877590763666713
},
"eval_RANGE_END": {
"f1": 0.787037037037037,
"number": 92,
"precision": 0.6854838709677419,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9544457567065969,
"number": 5732,
"precision": 0.9240444299248611,
"recall": 0.9869155617585486
},
"eval_loss": 0.4802730679512024,
"eval_overall_accuracy": 0.8373477980502978,
"eval_overall_f1": 0.8546737867021544,
"eval_overall_precision": 0.8292364016736402,
"eval_overall_recall": 0.8817211775746411,
"eval_runtime": 8.1983,
"eval_samples_per_second": 1037.537,
"eval_steps_per_second": 32.446,
"step": 40000
},
{
"epoch": 8.02,
"learning_rate": 9.908928924965353e-06,
"loss": 0.4135,
"step": 40500
},
{
"epoch": 8.12,
"learning_rate": 9.41397743021184e-06,
"loss": 0.3994,
"step": 41000
},
{
"epoch": 8.12,
"eval_COMMENT": {
"f1": 0.7058981774161006,
"number": 6901,
"precision": 0.6586345381526104,
"recall": 0.7604694971743226
},
"eval_NAME": {
"f1": 0.8033988670443185,
"number": 8857,
"precision": 0.7905782052683353,
"recall": 0.8166422039065147
},
"eval_QTY": {
"f1": 0.9862045060658579,
"number": 7189,
"precision": 0.9830016583747927,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.7963800904977375,
"number": 92,
"precision": 0.6821705426356589,
"recall": 0.9565217391304348
},
"eval_UNIT": {
"f1": 0.9540433426089888,
"number": 5732,
"precision": 0.9232903541700669,
"recall": 0.9869155617585486
},
"eval_loss": 0.4922930598258972,
"eval_overall_accuracy": 0.8354701665212608,
"eval_overall_f1": 0.8534523408555069,
"eval_overall_precision": 0.8278284164788134,
"eval_overall_recall": 0.8807132181710751,
"eval_runtime": 7.4213,
"eval_samples_per_second": 1146.156,
"eval_steps_per_second": 35.843,
"step": 41000
},
{
"epoch": 8.22,
"learning_rate": 8.919025935458326e-06,
"loss": 0.4167,
"step": 41500
},
{
"epoch": 8.32,
"learning_rate": 8.424074440704812e-06,
"loss": 0.4052,
"step": 42000
},
{
"epoch": 8.32,
"eval_COMMENT": {
"f1": 0.7033915447373744,
"number": 6901,
"precision": 0.6577553593947036,
"recall": 0.7558324880452109
},
"eval_NAME": {
"f1": 0.8042463317029791,
"number": 8857,
"precision": 0.7920087575259989,
"recall": 0.8168680140002258
},
"eval_QTY": {
"f1": 0.9861438270749618,
"number": 7189,
"precision": 0.9823326432022084,
"recall": 0.9899846988454584
},
"eval_RANGE_END": {
"f1": 0.8018018018018018,
"number": 92,
"precision": 0.6846153846153846,
"recall": 0.967391304347826
},
"eval_UNIT": {
"f1": 0.9546567592670776,
"number": 5732,
"precision": 0.9250531827851416,
"recall": 0.9862177250523377
},
"eval_loss": 0.4865518808364868,
"eval_overall_accuracy": 0.8359822478473619,
"eval_overall_f1": 0.8533090590337481,
"eval_overall_precision": 0.8284507872082747,
"eval_overall_recall": 0.8797052587675089,
"eval_runtime": 7.4797,
"eval_samples_per_second": 1137.217,
"eval_steps_per_second": 35.563,
"step": 42000
},
{
"epoch": 8.41,
"learning_rate": 7.929122945951298e-06,
"loss": 0.4042,
"step": 42500
},
{
"epoch": 8.51,
"learning_rate": 7.434171451197783e-06,
"loss": 0.4042,
"step": 43000
},
{
"epoch": 8.51,
"eval_COMMENT": {
"f1": 0.7073401950162513,
"number": 6901,
"precision": 0.663912546078556,
"recall": 0.7568468337922041
},
"eval_NAME": {
"f1": 0.8030025020850708,
"number": 8857,
"precision": 0.7910823838737949,
"recall": 0.8152873433442475
},
"eval_QTY": {
"f1": 0.9858200179843675,
"number": 7189,
"precision": 0.980462300495322,
"recall": 0.991236611489776
},
"eval_RANGE_END": {
"f1": 0.7909090909090909,
"number": 92,
"precision": 0.6796875,
"recall": 0.9456521739130435
},
"eval_UNIT": {
"f1": 0.9534962089300758,
"number": 5732,
"precision": 0.921961550993809,
"recall": 0.9872644801116539
},
"eval_loss": 0.48657840490341187,
"eval_overall_accuracy": 0.8364563972233813,
"eval_overall_f1": 0.8538279932546375,
"eval_overall_precision": 0.8292443250679682,
"eval_overall_recall": 0.8799138020923847,
"eval_runtime": 9.0804,
"eval_samples_per_second": 936.741,
"eval_steps_per_second": 29.294,
"step": 43000
},
{
"epoch": 8.61,
"learning_rate": 6.939219956444269e-06,
"loss": 0.4036,
"step": 43500
},
{
"epoch": 8.71,
"learning_rate": 6.444268461690754e-06,
"loss": 0.4135,
"step": 44000
},
{
"epoch": 8.71,
"eval_COMMENT": {
"f1": 0.7091805715057758,
"number": 6901,
"precision": 0.664262212098203,
"recall": 0.7606144037096073
},
"eval_NAME": {
"f1": 0.802937576499388,
"number": 8857,
"precision": 0.7914884282110344,
"recall": 0.8147228181099695
},
"eval_QTY": {
"f1": 0.985878443859892,
"number": 7189,
"precision": 0.9812594736116853,
"recall": 0.9905411044651551
},
"eval_RANGE_END": {
"f1": 0.7813953488372093,
"number": 92,
"precision": 0.6829268292682927,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9540588384051252,
"number": 5732,
"precision": 0.9230141901810471,
"recall": 0.9872644801116539
},
"eval_loss": 0.48304322361946106,
"eval_overall_accuracy": 0.8367977847741153,
"eval_overall_f1": 0.8542520362219861,
"eval_overall_precision": 0.8296429741238126,
"eval_overall_recall": 0.8803656459629488,
"eval_runtime": 6.5688,
"eval_samples_per_second": 1294.905,
"eval_steps_per_second": 40.494,
"step": 44000
},
{
"epoch": 8.81,
"learning_rate": 5.949316966937241e-06,
"loss": 0.4078,
"step": 44500
},
{
"epoch": 8.91,
"learning_rate": 5.4543654721837265e-06,
"loss": 0.3958,
"step": 45000
},
{
"epoch": 8.91,
"eval_COMMENT": {
"f1": 0.7085999057175567,
"number": 6901,
"precision": 0.6619275289380976,
"recall": 0.7623532821330242
},
"eval_NAME": {
"f1": 0.8035773802910788,
"number": 8857,
"precision": 0.7909240021869874,
"recall": 0.8166422039065147
},
"eval_QTY": {
"f1": 0.9864836764400082,
"number": 7189,
"precision": 0.9831445150594087,
"recall": 0.9898455974405341
},
"eval_RANGE_END": {
"f1": 0.7906976744186046,
"number": 92,
"precision": 0.6910569105691057,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.9539395984477813,
"number": 5732,
"precision": 0.9235543939888925,
"recall": 0.9863921842288904
},
"eval_loss": 0.4859357178211212,
"eval_overall_accuracy": 0.8370822743997269,
"eval_overall_f1": 0.8542639055049118,
"eval_overall_precision": 0.829048927263213,
"eval_overall_recall": 0.8810607903792013,
"eval_runtime": 9.1351,
"eval_samples_per_second": 931.131,
"eval_steps_per_second": 29.118,
"step": 45000
},
{
"epoch": 9.01,
"learning_rate": 4.959413977430212e-06,
"loss": 0.4071,
"step": 45500
},
{
"epoch": 9.11,
"learning_rate": 4.4644624826766974e-06,
"loss": 0.3985,
"step": 46000
},
{
"epoch": 9.11,
"eval_COMMENT": {
"f1": 0.7050125483280201,
"number": 6901,
"precision": 0.6627135934710533,
"recall": 0.7530792638748007
},
"eval_NAME": {
"f1": 0.8021064301552105,
"number": 8857,
"precision": 0.7878688881629097,
"recall": 0.8168680140002258
},
"eval_QTY": {
"f1": 0.9866093110386457,
"number": 7189,
"precision": 0.9842192691029901,
"recall": 0.989010989010989
},
"eval_RANGE_END": {
"f1": 0.7853881278538813,
"number": 92,
"precision": 0.6771653543307087,
"recall": 0.9347826086956522
},
"eval_UNIT": {
"f1": 0.9550875412331895,
"number": 5732,
"precision": 0.9269413889344935,
"recall": 0.984996510816469
},
"eval_loss": 0.4896639585494995,
"eval_overall_accuracy": 0.8351856768956492,
"eval_overall_f1": 0.8533036226746344,
"eval_overall_precision": 0.8295532871631601,
"eval_overall_recall": 0.8784539988182545,
"eval_runtime": 6.8177,
"eval_samples_per_second": 1247.642,
"eval_steps_per_second": 39.016,
"step": 46000
},
{
"epoch": 9.21,
"learning_rate": 3.969510987923184e-06,
"loss": 0.3989,
"step": 46500
},
{
"epoch": 9.31,
"learning_rate": 3.4745594931696697e-06,
"loss": 0.3944,
"step": 47000
},
{
"epoch": 9.31,
"eval_COMMENT": {
"f1": 0.709349593495935,
"number": 6901,
"precision": 0.6661152818424736,
"recall": 0.7585857122156209
},
"eval_NAME": {
"f1": 0.8033533200088829,
"number": 8857,
"precision": 0.7902785363189514,
"recall": 0.8168680140002258
},
"eval_QTY": {
"f1": 0.9866833125260092,
"number": 7189,
"precision": 0.9839535205422604,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.787037037037037,
"number": 92,
"precision": 0.6854838709677419,
"recall": 0.9239130434782609
},
"eval_UNIT": {
"f1": 0.954649100582721,
"number": 5732,
"precision": 0.9251923391717138,
"recall": 0.9860432658757851
},
"eval_loss": 0.48901429772377014,
"eval_overall_accuracy": 0.8369495125744415,
"eval_overall_f1": 0.8547268216112208,
"eval_overall_precision": 0.8308176926105788,
"eval_overall_recall": 0.8800528309756351,
"eval_runtime": 9.5285,
"eval_samples_per_second": 892.692,
"eval_steps_per_second": 27.916,
"step": 47000
},
{
"epoch": 9.4,
"learning_rate": 2.979607998416155e-06,
"loss": 0.397,
"step": 47500
},
{
"epoch": 9.5,
"learning_rate": 2.484656503662641e-06,
"loss": 0.3959,
"step": 48000
},
{
"epoch": 9.5,
"eval_COMMENT": {
"f1": 0.7106236964273699,
"number": 6901,
"precision": 0.6632755589047978,
"recall": 0.765251412838719
},
"eval_NAME": {
"f1": 0.8044214853080043,
"number": 8857,
"precision": 0.7917122239230264,
"recall": 0.8175454442813593
},
"eval_QTY": {
"f1": 0.9865483289418943,
"number": 7189,
"precision": 0.9835476289229919,
"recall": 0.9895673946306858
},
"eval_RANGE_END": {
"f1": 0.7926267281105991,
"number": 92,
"precision": 0.688,
"recall": 0.9347826086956522
},
"eval_UNIT": {
"f1": 0.9542693216334796,
"number": 5732,
"precision": 0.9240196078431373,
"recall": 0.9865666434054431
},
"eval_loss": 0.4869215190410614,
"eval_overall_accuracy": 0.8368736486742784,
"eval_overall_f1": 0.8550634297555469,
"eval_overall_precision": 0.829693323742889,
"eval_overall_recall": 0.8820339925619547,
"eval_runtime": 6.6612,
"eval_samples_per_second": 1276.945,
"eval_steps_per_second": 39.933,
"step": 48000
},
{
"epoch": 9.6,
"learning_rate": 1.989705008909127e-06,
"loss": 0.3916,
"step": 48500
},
{
"epoch": 9.7,
"learning_rate": 1.4947535141556129e-06,
"loss": 0.3979,
"step": 49000
},
{
"epoch": 9.7,
"eval_COMMENT": {
"f1": 0.7113812901046943,
"number": 6901,
"precision": 0.666244939271255,
"recall": 0.7630778148094479
},
"eval_NAME": {
"f1": 0.8035317636605953,
"number": 8857,
"precision": 0.7906239755218009,
"recall": 0.8168680140002258
},
"eval_QTY": {
"f1": 0.9864780528396089,
"number": 7189,
"precision": 0.9835453539823009,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.7813953488372093,
"number": 92,
"precision": 0.6829268292682927,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9541810817652518,
"number": 5732,
"precision": 0.9240071907174375,
"recall": 0.9863921842288904
},
"eval_loss": 0.48777857422828674,
"eval_overall_accuracy": 0.8369115806243599,
"eval_overall_f1": 0.8550421585160202,
"eval_overall_precision": 0.8304235317239346,
"eval_overall_recall": 0.8811650620416391,
"eval_runtime": 8.6569,
"eval_samples_per_second": 982.572,
"eval_steps_per_second": 30.727,
"step": 49000
},
{
"epoch": 9.8,
"learning_rate": 9.998020194020988e-07,
"loss": 0.4088,
"step": 49500
},
{
"epoch": 9.9,
"learning_rate": 5.048505246485845e-07,
"loss": 0.4095,
"step": 50000
},
{
"epoch": 9.9,
"eval_COMMENT": {
"f1": 0.7118095366561004,
"number": 6901,
"precision": 0.665783497350492,
"recall": 0.7646717866975801
},
"eval_NAME": {
"f1": 0.80368950380619,
"number": 8857,
"precision": 0.7912472647702407,
"recall": 0.8165292988596591
},
"eval_QTY": {
"f1": 0.9863412604867227,
"number": 7189,
"precision": 0.9832734310201825,
"recall": 0.9894282932257615
},
"eval_RANGE_END": {
"f1": 0.7813953488372093,
"number": 92,
"precision": 0.6829268292682927,
"recall": 0.9130434782608695
},
"eval_UNIT": {
"f1": 0.9544226873733964,
"number": 5732,
"precision": 0.9244604316546763,
"recall": 0.9863921842288904
},
"eval_loss": 0.48620378971099854,
"eval_overall_accuracy": 0.8372719341501347,
"eval_overall_f1": 0.855167762603271,
"eval_overall_precision": 0.8304135695340384,
"eval_overall_recall": 0.8814431198081402,
"eval_runtime": 8.2871,
"eval_samples_per_second": 1026.42,
"eval_steps_per_second": 32.098,
"step": 50000
},
{
"epoch": 10.0,
"learning_rate": 9.899029895070283e-09,
"loss": 0.3994,
"step": 50500
},
{
"epoch": 10.0,
"step": 50510,
"total_flos": 1555191327435270.0,
"train_loss": 0.45639907907811844,
"train_runtime": 1954.9419,
"train_samples_per_second": 826.638,
"train_steps_per_second": 25.837
}
],
"logging_steps": 500,
"max_steps": 50510,
"num_train_epochs": 10,
"save_steps": 1000,
"total_flos": 1555191327435270.0,
"trial_name": null,
"trial_params": null
}