|
{ |
|
"best_metric": 0.474032998085022, |
|
"best_model_checkpoint": "nyt_ingredients-tagger-gte-small-L3-ingredient-v2/checkpoint-24000", |
|
"epoch": 10.0, |
|
"eval_steps": 1000, |
|
"global_step": 50510, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 4.9505048505246485e-05, |
|
"loss": 1.1293, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 4.9010097010492975e-05, |
|
"loss": 0.6931, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_COMMENT": { |
|
"f1": 0.5770606987183658, |
|
"number": 6901, |
|
"precision": 0.5236127508854782, |
|
"recall": 0.6426604839878278 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7875208913649026, |
|
"number": 8857, |
|
"precision": 0.7773012207192346, |
|
"recall": 0.7980128711753416 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9780634343998882, |
|
"number": 7189, |
|
"precision": 0.9824561403508771, |
|
"recall": 0.9737098344693281 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.0, |
|
"number": 92, |
|
"precision": 0.0, |
|
"recall": 0.0 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9434346865975879, |
|
"number": 5732, |
|
"precision": 0.9192320423700762, |
|
"recall": 0.9689462665736218 |
|
}, |
|
"eval_loss": 0.6230219006538391, |
|
"eval_overall_accuracy": 0.7985813450669499, |
|
"eval_overall_f1": 0.8086250651249558, |
|
"eval_overall_precision": 0.7828506345590628, |
|
"eval_overall_recall": 0.8361544610892913, |
|
"eval_runtime": 7.9128, |
|
"eval_samples_per_second": 1074.967, |
|
"eval_steps_per_second": 33.616, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 4.851514551573946e-05, |
|
"loss": 0.6087, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 4.802019402098595e-05, |
|
"loss": 0.5826, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_COMMENT": { |
|
"f1": 0.602454780361757, |
|
"number": 6901, |
|
"precision": 0.5435365427205968, |
|
"recall": 0.6756991740327489 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7907440212577502, |
|
"number": 8857, |
|
"precision": 0.7757141305528402, |
|
"recall": 0.8063678446426555 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9754149163280765, |
|
"number": 7189, |
|
"precision": 0.9659028914348063, |
|
"recall": 0.9851161496731117 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.6567164179104478, |
|
"number": 92, |
|
"precision": 0.6055045871559633, |
|
"recall": 0.717391304347826 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9462474645030426, |
|
"number": 5732, |
|
"precision": 0.9177049180327869, |
|
"recall": 0.9766224703419399 |
|
}, |
|
"eval_loss": 0.5530511736869812, |
|
"eval_overall_accuracy": 0.8078557068618898, |
|
"eval_overall_f1": 0.8170321807714068, |
|
"eval_overall_precision": 0.7837009608325087, |
|
"eval_overall_recall": 0.8533245281707275, |
|
"eval_runtime": 6.3157, |
|
"eval_samples_per_second": 1346.806, |
|
"eval_steps_per_second": 42.117, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 4.752524252623243e-05, |
|
"loss": 0.5569, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"learning_rate": 4.703029103147892e-05, |
|
"loss": 0.5435, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_COMMENT": { |
|
"f1": 0.6313494946826079, |
|
"number": 6901, |
|
"precision": 0.5801165331391115, |
|
"recall": 0.6925083321257789 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7944305207463102, |
|
"number": 8857, |
|
"precision": 0.7839085513299626, |
|
"recall": 0.8052387941740996 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9791782343142699, |
|
"number": 7189, |
|
"precision": 0.9771436487048067, |
|
"recall": 0.9812213103352344 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7109004739336493, |
|
"number": 92, |
|
"precision": 0.6302521008403361, |
|
"recall": 0.8152173913043478 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9472093999160722, |
|
"number": 5732, |
|
"precision": 0.9126637554585153, |
|
"recall": 0.9844731332868109 |
|
}, |
|
"eval_loss": 0.5327398180961609, |
|
"eval_overall_accuracy": 0.8150438114023442, |
|
"eval_overall_f1": 0.827899644462333, |
|
"eval_overall_precision": 0.7999157403506497, |
|
"eval_overall_recall": 0.8579124813179938, |
|
"eval_runtime": 8.1233, |
|
"eval_samples_per_second": 1047.112, |
|
"eval_steps_per_second": 32.745, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"learning_rate": 4.65353395367254e-05, |
|
"loss": 0.5324, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 4.6040388041971886e-05, |
|
"loss": 0.5333, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"eval_COMMENT": { |
|
"f1": 0.6446886446886447, |
|
"number": 6901, |
|
"precision": 0.5875760104924288, |
|
"recall": 0.7140994058832053 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7953999888349244, |
|
"number": 8857, |
|
"precision": 0.786660777385159, |
|
"recall": 0.8043355537992548 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9809583594894328, |
|
"number": 7189, |
|
"precision": 0.9837716843872412, |
|
"recall": 0.9781610794269022 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7555555555555556, |
|
"number": 92, |
|
"precision": 0.6390977443609023, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9506497918967128, |
|
"number": 5732, |
|
"precision": 0.9263366992219831, |
|
"recall": 0.9762735519888346 |
|
}, |
|
"eval_loss": 0.5212323665618896, |
|
"eval_overall_accuracy": 0.8183059591093578, |
|
"eval_overall_f1": 0.831933619994625, |
|
"eval_overall_precision": 0.8049731838127743, |
|
"eval_overall_recall": 0.8607625734246289, |
|
"eval_runtime": 8.6379, |
|
"eval_samples_per_second": 984.732, |
|
"eval_steps_per_second": 30.795, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"learning_rate": 4.5545436547218376e-05, |
|
"loss": 0.5285, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 4.505048505246486e-05, |
|
"loss": 0.5199, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_COMMENT": { |
|
"f1": 0.6402057097646205, |
|
"number": 6901, |
|
"precision": 0.5873457536898137, |
|
"recall": 0.7035212288074192 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8005563282336579, |
|
"number": 8857, |
|
"precision": 0.7890984865101996, |
|
"recall": 0.812351812126002 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9803540437348144, |
|
"number": 7189, |
|
"precision": 0.978519955654102, |
|
"recall": 0.9821950201697037 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7747747747747747, |
|
"number": 92, |
|
"precision": 0.6615384615384615, |
|
"recall": 0.9347826086956522 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9499704716105627, |
|
"number": 5732, |
|
"precision": 0.9197843489625878, |
|
"recall": 0.9822051639916259 |
|
}, |
|
"eval_loss": 0.5120549201965332, |
|
"eval_overall_accuracy": 0.8185525167848879, |
|
"eval_overall_f1": 0.8328133910301567, |
|
"eval_overall_precision": 0.804738906356358, |
|
"eval_overall_recall": 0.8629175211150116, |
|
"eval_runtime": 6.4358, |
|
"eval_samples_per_second": 1321.664, |
|
"eval_steps_per_second": 41.331, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 4.455553355771135e-05, |
|
"loss": 0.5127, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"learning_rate": 4.406058206295783e-05, |
|
"loss": 0.4983, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"eval_COMMENT": { |
|
"f1": 0.6476600322754169, |
|
"number": 6901, |
|
"precision": 0.6041901894367081, |
|
"recall": 0.6978698739313143 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7935644937586686, |
|
"number": 8857, |
|
"precision": 0.7801047120418848, |
|
"recall": 0.8074968951112115 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9824293353705119, |
|
"number": 7189, |
|
"precision": 0.980998613037448, |
|
"recall": 0.983864237028794 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7601809954751132, |
|
"number": 92, |
|
"precision": 0.6511627906976745, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9500843170320405, |
|
"number": 5732, |
|
"precision": 0.9193864229765013, |
|
"recall": 0.9829030006978368 |
|
}, |
|
"eval_loss": 0.5088106393814087, |
|
"eval_overall_accuracy": 0.8192163259113151, |
|
"eval_overall_f1": 0.8339592771611903, |
|
"eval_overall_precision": 0.8089590276416389, |
|
"eval_overall_recall": 0.8605540300997532, |
|
"eval_runtime": 8.5928, |
|
"eval_samples_per_second": 989.902, |
|
"eval_steps_per_second": 30.956, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 1.29, |
|
"learning_rate": 4.356563056820432e-05, |
|
"loss": 0.5102, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"learning_rate": 4.3070679073450804e-05, |
|
"loss": 0.5031, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_COMMENT": { |
|
"f1": 0.6483065113460373, |
|
"number": 6901, |
|
"precision": 0.6055345911949686, |
|
"recall": 0.6975800608607449 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.797360248447205, |
|
"number": 8857, |
|
"precision": 0.7835422343324251, |
|
"recall": 0.8116743818448685 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9815493055075669, |
|
"number": 7189, |
|
"precision": 0.9752815160670145, |
|
"recall": 0.9878981777715955 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7706422018348623, |
|
"number": 92, |
|
"precision": 0.6666666666666666, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9498936622713738, |
|
"number": 5732, |
|
"precision": 0.9269467043001827, |
|
"recall": 0.9740055826936497 |
|
}, |
|
"eval_loss": 0.5030972361564636, |
|
"eval_overall_accuracy": 0.8199370329628646, |
|
"eval_overall_f1": 0.8351003758828189, |
|
"eval_overall_precision": 0.8107082078806126, |
|
"eval_overall_recall": 0.8610058739703174, |
|
"eval_runtime": 7.9063, |
|
"eval_samples_per_second": 1075.848, |
|
"eval_steps_per_second": 33.644, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"learning_rate": 4.257572757869729e-05, |
|
"loss": 0.5027, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 4.208077608394378e-05, |
|
"loss": 0.492, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_COMMENT": { |
|
"f1": 0.6769068494956819, |
|
"number": 6901, |
|
"precision": 0.6209482341557814, |
|
"recall": 0.743950152151862 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7926012072880323, |
|
"number": 8857, |
|
"precision": 0.7778260869565218, |
|
"recall": 0.8079485152986339 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9821801475706529, |
|
"number": 7189, |
|
"precision": 0.983001254005852, |
|
"recall": 0.9813604117401585 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7685589519650656, |
|
"number": 92, |
|
"precision": 0.6423357664233577, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9496828752642706, |
|
"number": 5732, |
|
"precision": 0.9215493188905302, |
|
"recall": 0.9795882763433357 |
|
}, |
|
"eval_loss": 0.5041355490684509, |
|
"eval_overall_accuracy": 0.8246216287979365, |
|
"eval_overall_f1": 0.8398886765248299, |
|
"eval_overall_precision": 0.8112712550607287, |
|
"eval_overall_recall": 0.8705988669146015, |
|
"eval_runtime": 9.0062, |
|
"eval_samples_per_second": 944.457, |
|
"eval_steps_per_second": 29.535, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"learning_rate": 4.158582458919026e-05, |
|
"loss": 0.4939, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"learning_rate": 4.109087309443675e-05, |
|
"loss": 0.4817, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_COMMENT": { |
|
"f1": 0.6750676255195619, |
|
"number": 6901, |
|
"precision": 0.6196705426356589, |
|
"recall": 0.7413418345167367 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8006897702620014, |
|
"number": 8857, |
|
"precision": 0.7891447368421053, |
|
"recall": 0.8125776222197132 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9833679833679833, |
|
"number": 7189, |
|
"precision": 0.9798370390829996, |
|
"recall": 0.9869244679371262 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7792207792207793, |
|
"number": 92, |
|
"precision": 0.6474820143884892, |
|
"recall": 0.9782608695652174 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9505083606419629, |
|
"number": 5732, |
|
"precision": 0.9168422758956071, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.4901449382305145, |
|
"eval_overall_accuracy": 0.8292872586579676, |
|
"eval_overall_f1": 0.8427365317609219, |
|
"eval_overall_precision": 0.8133872271624899, |
|
"eval_overall_recall": 0.8742831323207396, |
|
"eval_runtime": 9.1291, |
|
"eval_samples_per_second": 931.746, |
|
"eval_steps_per_second": 29.138, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 4.059592159968323e-05, |
|
"loss": 0.4903, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 4.010097010492972e-05, |
|
"loss": 0.4905, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_COMMENT": { |
|
"f1": 0.6778359049069598, |
|
"number": 6901, |
|
"precision": 0.6241463414634146, |
|
"recall": 0.7416316475873062 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8002232142857143, |
|
"number": 8857, |
|
"precision": 0.7911287653095002, |
|
"recall": 0.8095291859546122 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9842749791260784, |
|
"number": 7189, |
|
"precision": 0.9846860643185299, |
|
"recall": 0.983864237028794 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.789237668161435, |
|
"number": 92, |
|
"precision": 0.6717557251908397, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9502270052127123, |
|
"number": 5732, |
|
"precision": 0.9170723790976956, |
|
"recall": 0.9858688066992324 |
|
}, |
|
"eval_loss": 0.4891791045665741, |
|
"eval_overall_accuracy": 0.8287751773318667, |
|
"eval_overall_f1": 0.8435557049235421, |
|
"eval_overall_precision": 0.8165522625980025, |
|
"eval_overall_recall": 0.8724062423968579, |
|
"eval_runtime": 6.9634, |
|
"eval_samples_per_second": 1221.536, |
|
"eval_steps_per_second": 38.2, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 2.08, |
|
"learning_rate": 3.9606018610176205e-05, |
|
"loss": 0.4804, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 2.18, |
|
"learning_rate": 3.911106711542269e-05, |
|
"loss": 0.4757, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 2.18, |
|
"eval_COMMENT": { |
|
"f1": 0.6788539520042544, |
|
"number": 6901, |
|
"precision": 0.6271186440677966, |
|
"recall": 0.7398927691638892 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.802429240026744, |
|
"number": 8857, |
|
"precision": 0.7921020789792103, |
|
"recall": 0.8130292424071356 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9835042971998891, |
|
"number": 7189, |
|
"precision": 0.9801077496891836, |
|
"recall": 0.9869244679371262 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7758620689655172, |
|
"number": 92, |
|
"precision": 0.6428571428571429, |
|
"recall": 0.9782608695652174 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9515842839036756, |
|
"number": 5732, |
|
"precision": 0.9226609864001311, |
|
"recall": 0.9823796231681786 |
|
}, |
|
"eval_loss": 0.4953509271144867, |
|
"eval_overall_accuracy": 0.8274285931039714, |
|
"eval_overall_f1": 0.844669333960932, |
|
"eval_overall_precision": 0.8179391176949373, |
|
"eval_overall_recall": 0.8732056584755483, |
|
"eval_runtime": 8.0512, |
|
"eval_samples_per_second": 1056.487, |
|
"eval_steps_per_second": 33.039, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"learning_rate": 3.861611562066917e-05, |
|
"loss": 0.4856, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 2.38, |
|
"learning_rate": 3.812116412591566e-05, |
|
"loss": 0.4691, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 2.38, |
|
"eval_COMMENT": { |
|
"f1": 0.6842557693579316, |
|
"number": 6901, |
|
"precision": 0.6292872780345414, |
|
"recall": 0.7497464135632517 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.803944509443423, |
|
"number": 8857, |
|
"precision": 0.7935547734271887, |
|
"recall": 0.8146099130631139 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.984621778886118, |
|
"number": 7189, |
|
"precision": 0.9806816613771215, |
|
"recall": 0.9885936847962165 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.780701754385965, |
|
"number": 92, |
|
"precision": 0.6544117647058824, |
|
"recall": 0.967391304347826 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9528556944913822, |
|
"number": 5732, |
|
"precision": 0.9238204456094364, |
|
"recall": 0.9837752965806001 |
|
}, |
|
"eval_loss": 0.4902682304382324, |
|
"eval_overall_accuracy": 0.8301407275348026, |
|
"eval_overall_f1": 0.84684079769019, |
|
"eval_overall_precision": 0.818934450180189, |
|
"eval_overall_recall": 0.8767161377776233, |
|
"eval_runtime": 8.9123, |
|
"eval_samples_per_second": 954.413, |
|
"eval_steps_per_second": 29.846, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 2.47, |
|
"learning_rate": 3.762621263116215e-05, |
|
"loss": 0.4806, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 2.57, |
|
"learning_rate": 3.7131261136408633e-05, |
|
"loss": 0.4765, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 2.57, |
|
"eval_COMMENT": { |
|
"f1": 0.6893633899649634, |
|
"number": 6901, |
|
"precision": 0.6338439095550693, |
|
"recall": 0.7555426749746413 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.805656475322788, |
|
"number": 8857, |
|
"precision": 0.7977640026566305, |
|
"recall": 0.8137066726882691 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9841977027497391, |
|
"number": 7189, |
|
"precision": 0.9850891861761427, |
|
"recall": 0.9833078314090973 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7777777777777777, |
|
"number": 92, |
|
"precision": 0.6774193548387096, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9518021440027011, |
|
"number": 5732, |
|
"precision": 0.9219950940310712, |
|
"recall": 0.9836008374040475 |
|
}, |
|
"eval_loss": 0.4845636188983917, |
|
"eval_overall_accuracy": 0.8307097067860258, |
|
"eval_overall_f1": 0.8482320088820106, |
|
"eval_overall_precision": 0.8219070904645477, |
|
"eval_overall_recall": 0.8762990511278718, |
|
"eval_runtime": 6.7092, |
|
"eval_samples_per_second": 1267.814, |
|
"eval_steps_per_second": 39.647, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 2.67, |
|
"learning_rate": 3.663630964165512e-05, |
|
"loss": 0.4715, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 3.6141358146901606e-05, |
|
"loss": 0.4747, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_COMMENT": { |
|
"f1": 0.6842317515795134, |
|
"number": 6901, |
|
"precision": 0.6380844929171368, |
|
"recall": 0.7375742645993334 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8026484170700496, |
|
"number": 8857, |
|
"precision": 0.791246160596753, |
|
"recall": 0.8143841029694028 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9847090569431951, |
|
"number": 7189, |
|
"precision": 0.9796255506607929, |
|
"recall": 0.9898455974405341 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7878787878787878, |
|
"number": 92, |
|
"precision": 0.6546762589928058, |
|
"recall": 0.9891304347826086 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9519481612387444, |
|
"number": 5732, |
|
"precision": 0.9195252804422045, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.4844052493572235, |
|
"eval_overall_accuracy": 0.8314304138375754, |
|
"eval_overall_f1": 0.8470833754081255, |
|
"eval_overall_precision": 0.8211570463666917, |
|
"eval_overall_recall": 0.8747002189704911, |
|
"eval_runtime": 8.8562, |
|
"eval_samples_per_second": 960.458, |
|
"eval_steps_per_second": 30.035, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 2.87, |
|
"learning_rate": 3.564640665214809e-05, |
|
"loss": 0.4673, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"learning_rate": 3.515145515739457e-05, |
|
"loss": 0.4654, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"eval_COMMENT": { |
|
"f1": 0.6951928862739855, |
|
"number": 6901, |
|
"precision": 0.6453574975173784, |
|
"recall": 0.7533690769453703 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8027195720017833, |
|
"number": 8857, |
|
"precision": 0.7925608011444921, |
|
"recall": 0.8131421474539912 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852237252861602, |
|
"number": 7189, |
|
"precision": 0.9827013562136728, |
|
"recall": 0.9877590763666713 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7802690582959643, |
|
"number": 92, |
|
"precision": 0.6641221374045801, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9533801506049582, |
|
"number": 5732, |
|
"precision": 0.9255791030064071, |
|
"recall": 0.9829030006978368 |
|
}, |
|
"eval_loss": 0.48082008957862854, |
|
"eval_overall_accuracy": 0.8331752835413269, |
|
"eval_overall_f1": 0.8498601704909194, |
|
"eval_overall_precision": 0.8246313793441659, |
|
"eval_overall_recall": 0.8766813805568107, |
|
"eval_runtime": 7.2911, |
|
"eval_samples_per_second": 1166.621, |
|
"eval_steps_per_second": 36.483, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 3.07, |
|
"learning_rate": 3.465650366264107e-05, |
|
"loss": 0.4573, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 3.17, |
|
"learning_rate": 3.416155216788755e-05, |
|
"loss": 0.4586, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 3.17, |
|
"eval_COMMENT": { |
|
"f1": 0.6976900801400768, |
|
"number": 6901, |
|
"precision": 0.6517362858580775, |
|
"recall": 0.7506158527749601 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8010911317708622, |
|
"number": 8857, |
|
"precision": 0.7901383703052932, |
|
"recall": 0.812351812126002 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9851262538913871, |
|
"number": 7189, |
|
"precision": 0.979906413432425, |
|
"recall": 0.990402003060231 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7802690582959643, |
|
"number": 92, |
|
"precision": 0.6641221374045801, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9516034003871727, |
|
"number": 5732, |
|
"precision": 0.9193364774760123, |
|
"recall": 0.9862177250523377 |
|
}, |
|
"eval_loss": 0.48265689611434937, |
|
"eval_overall_accuracy": 0.8316959374881463, |
|
"eval_overall_f1": 0.8500783210658401, |
|
"eval_overall_precision": 0.824673202614379, |
|
"eval_overall_recall": 0.8770984672065621, |
|
"eval_runtime": 9.1659, |
|
"eval_samples_per_second": 928.008, |
|
"eval_steps_per_second": 29.021, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 3.27, |
|
"learning_rate": 3.3666600673134034e-05, |
|
"loss": 0.4591, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 3.37, |
|
"learning_rate": 3.317164917838052e-05, |
|
"loss": 0.4612, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 3.37, |
|
"eval_COMMENT": { |
|
"f1": 0.6966127636920211, |
|
"number": 6901, |
|
"precision": 0.6441053408811224, |
|
"recall": 0.7584408056803362 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7990913120567377, |
|
"number": 8857, |
|
"precision": 0.7845718637797846, |
|
"recall": 0.8141582928756915 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9846325012168833, |
|
"number": 7189, |
|
"precision": 0.9844271412680756, |
|
"recall": 0.9848379468632633 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7802690582959643, |
|
"number": 92, |
|
"precision": 0.6641221374045801, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9502140878179833, |
|
"number": 5732, |
|
"precision": 0.9158439877002751, |
|
"recall": 0.9872644801116539 |
|
}, |
|
"eval_loss": 0.4868798851966858, |
|
"eval_overall_accuracy": 0.8307666047111482, |
|
"eval_overall_f1": 0.8481624433629804, |
|
"eval_overall_precision": 0.8199811804406373, |
|
"eval_overall_recall": 0.8783497271558166, |
|
"eval_runtime": 7.3722, |
|
"eval_samples_per_second": 1153.794, |
|
"eval_steps_per_second": 36.081, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"learning_rate": 3.267669768362701e-05, |
|
"loss": 0.4592, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 3.56, |
|
"learning_rate": 3.218174618887349e-05, |
|
"loss": 0.4546, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 3.56, |
|
"eval_COMMENT": { |
|
"f1": 0.6903326332904275, |
|
"number": 6901, |
|
"precision": 0.6482188295165394, |
|
"recall": 0.7382987972757571 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8029488387561666, |
|
"number": 8857, |
|
"precision": 0.788654181184669, |
|
"recall": 0.8177712543750706 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9853083853083853, |
|
"number": 7189, |
|
"precision": 0.9817704736914791, |
|
"recall": 0.9888718876060648 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.787037037037037, |
|
"number": 92, |
|
"precision": 0.6854838709677419, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9534019922336655, |
|
"number": 5732, |
|
"precision": 0.9236179260713118, |
|
"recall": 0.9851709699930217 |
|
}, |
|
"eval_loss": 0.480613112449646, |
|
"eval_overall_accuracy": 0.8314683457876569, |
|
"eval_overall_f1": 0.8492933517725234, |
|
"eval_overall_precision": 0.8249189136061331, |
|
"eval_overall_recall": 0.8751520628410552, |
|
"eval_runtime": 8.0402, |
|
"eval_samples_per_second": 1057.931, |
|
"eval_steps_per_second": 33.084, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 3.66, |
|
"learning_rate": 3.168679469411997e-05, |
|
"loss": 0.4609, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"learning_rate": 3.119184319936647e-05, |
|
"loss": 0.4471, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"eval_COMMENT": { |
|
"f1": 0.6993611924407772, |
|
"number": 6901, |
|
"precision": 0.6466100652147164, |
|
"recall": 0.7614838429213158 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8037861915367484, |
|
"number": 8857, |
|
"precision": 0.7929254092057564, |
|
"recall": 0.8149486282036807 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852052510939778, |
|
"number": 7189, |
|
"precision": 0.983906770255272, |
|
"recall": 0.9865071637223536 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7927927927927929, |
|
"number": 92, |
|
"precision": 0.676923076923077, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9520276536548351, |
|
"number": 5732, |
|
"precision": 0.9211943220753793, |
|
"recall": 0.984996510816469 |
|
}, |
|
"eval_loss": 0.4822600483894348, |
|
"eval_overall_accuracy": 0.8327769980654706, |
|
"eval_overall_f1": 0.8508441514764242, |
|
"eval_overall_precision": 0.8241521972831222, |
|
"eval_overall_recall": 0.87932292933857, |
|
"eval_runtime": 8.7949, |
|
"eval_samples_per_second": 967.151, |
|
"eval_steps_per_second": 30.245, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 3.86, |
|
"learning_rate": 3.069689170461295e-05, |
|
"loss": 0.4581, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 3.96, |
|
"learning_rate": 3.0201940209859435e-05, |
|
"loss": 0.4542, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 3.96, |
|
"eval_COMMENT": { |
|
"f1": 0.6950766529344229, |
|
"number": 6901, |
|
"precision": 0.6508980521123198, |
|
"recall": 0.7456890305752789 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7992666259236624, |
|
"number": 8857, |
|
"precision": 0.7868081382629621, |
|
"recall": 0.8121260020322908 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9853604384930272, |
|
"number": 7189, |
|
"precision": 0.9829734219269103, |
|
"recall": 0.9877590763666713 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7873303167420815, |
|
"number": 92, |
|
"precision": 0.6744186046511628, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9524210526315788, |
|
"number": 5732, |
|
"precision": 0.920559986977047, |
|
"recall": 0.9865666434054431 |
|
}, |
|
"eval_loss": 0.47578319907188416, |
|
"eval_overall_accuracy": 0.832568372340022, |
|
"eval_overall_f1": 0.8490938211245047, |
|
"eval_overall_precision": 0.8244499738082766, |
|
"eval_overall_recall": 0.875256334503493, |
|
"eval_runtime": 6.7831, |
|
"eval_samples_per_second": 1253.998, |
|
"eval_steps_per_second": 39.215, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 4.06, |
|
"learning_rate": 2.970698871510592e-05, |
|
"loss": 0.4454, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 4.16, |
|
"learning_rate": 2.9212037220352405e-05, |
|
"loss": 0.4452, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 4.16, |
|
"eval_COMMENT": { |
|
"f1": 0.6982899022801302, |
|
"number": 6901, |
|
"precision": 0.6566687938736439, |
|
"recall": 0.7455441240399941 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7992468294844105, |
|
"number": 8857, |
|
"precision": 0.7843478260869565, |
|
"recall": 0.8147228181099695 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9847455276660656, |
|
"number": 7189, |
|
"precision": 0.981750311074243, |
|
"recall": 0.9877590763666713 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.787037037037037, |
|
"number": 92, |
|
"precision": 0.6854838709677419, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9537733457280487, |
|
"number": 5732, |
|
"precision": 0.9249303392886412, |
|
"recall": 0.9844731332868109 |
|
}, |
|
"eval_loss": 0.48325347900390625, |
|
"eval_overall_accuracy": 0.8338959905928763, |
|
"eval_overall_f1": 0.8500944924406048, |
|
"eval_overall_precision": 0.8260912340537172, |
|
"eval_overall_recall": 0.8755343922699941, |
|
"eval_runtime": 9.0461, |
|
"eval_samples_per_second": 940.291, |
|
"eval_steps_per_second": 29.405, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 4.26, |
|
"learning_rate": 2.871708572559889e-05, |
|
"loss": 0.4217, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"learning_rate": 2.8222134230845377e-05, |
|
"loss": 0.4412, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"eval_COMMENT": { |
|
"f1": 0.6974386700006758, |
|
"number": 6901, |
|
"precision": 0.6534954407294833, |
|
"recall": 0.7477177220692653 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8008429926238145, |
|
"number": 8857, |
|
"precision": 0.7870067582297798, |
|
"recall": 0.8151744382973919 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858392336526447, |
|
"number": 7189, |
|
"precision": 0.9839268394069558, |
|
"recall": 0.9877590763666713 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.789237668161435, |
|
"number": 92, |
|
"precision": 0.6717557251908397, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9540462916033113, |
|
"number": 5732, |
|
"precision": 0.9248280379954144, |
|
"recall": 0.9851709699930217 |
|
}, |
|
"eval_loss": 0.4888293445110321, |
|
"eval_overall_accuracy": 0.8325494063649812, |
|
"eval_overall_f1": 0.8505270258875117, |
|
"eval_overall_precision": 0.8261040492727034, |
|
"eval_overall_recall": 0.8764380800111223, |
|
"eval_runtime": 6.5585, |
|
"eval_samples_per_second": 1296.944, |
|
"eval_steps_per_second": 40.558, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 4.45, |
|
"learning_rate": 2.7727182736091867e-05, |
|
"loss": 0.4481, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"learning_rate": 2.7232231241338353e-05, |
|
"loss": 0.4423, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 4.55, |
|
"eval_COMMENT": { |
|
"f1": 0.6981985021253626, |
|
"number": 6901, |
|
"precision": 0.6532828282828282, |
|
"recall": 0.7497464135632517 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8019725177304966, |
|
"number": 8857, |
|
"precision": 0.7874007180937874, |
|
"recall": 0.817093824093937 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9857043719639139, |
|
"number": 7189, |
|
"precision": 0.9835202880487467, |
|
"recall": 0.9878981777715955 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7999999999999999, |
|
"number": 92, |
|
"precision": 0.6766917293233082, |
|
"recall": 0.9782608695652174 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9548452562151193, |
|
"number": 5732, |
|
"precision": 0.9264850672792911, |
|
"recall": 0.984996510816469 |
|
}, |
|
"eval_loss": 0.4827423095703125, |
|
"eval_overall_accuracy": 0.8337821947426317, |
|
"eval_overall_f1": 0.8511377043654138, |
|
"eval_overall_precision": 0.8262377695605223, |
|
"eval_overall_recall": 0.8775850682979389, |
|
"eval_runtime": 8.9572, |
|
"eval_samples_per_second": 949.629, |
|
"eval_steps_per_second": 29.697, |
|
"step": 23000 |
|
}, |
|
{ |
|
"epoch": 4.65, |
|
"learning_rate": 2.6737279746584836e-05, |
|
"loss": 0.4519, |
|
"step": 23500 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"learning_rate": 2.6242328251831323e-05, |
|
"loss": 0.4507, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"eval_COMMENT": { |
|
"f1": 0.69833923223523, |
|
"number": 6901, |
|
"precision": 0.6584520600693108, |
|
"recall": 0.7433705260107231 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8048291977300545, |
|
"number": 8857, |
|
"precision": 0.7933530766699572, |
|
"recall": 0.8166422039065147 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9856135011758197, |
|
"number": 7189, |
|
"precision": 0.9801898472967395, |
|
"recall": 0.9910975100848518 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7837837837837838, |
|
"number": 92, |
|
"precision": 0.6692307692307692, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9537942664418213, |
|
"number": 5732, |
|
"precision": 0.922976501305483, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.474032998085022, |
|
"eval_overall_accuracy": 0.8347115275196297, |
|
"eval_overall_f1": 0.8523122656487518, |
|
"eval_overall_precision": 0.8290126499096435, |
|
"eval_overall_recall": 0.8769594383233117, |
|
"eval_runtime": 7.5421, |
|
"eval_samples_per_second": 1127.8, |
|
"eval_steps_per_second": 35.269, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 4.85, |
|
"learning_rate": 2.5747376757077806e-05, |
|
"loss": 0.4377, |
|
"step": 24500 |
|
}, |
|
{ |
|
"epoch": 4.95, |
|
"learning_rate": 2.5252425262324292e-05, |
|
"loss": 0.4452, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 4.95, |
|
"eval_COMMENT": { |
|
"f1": 0.7040598290598291, |
|
"number": 6901, |
|
"precision": 0.6528792569659443, |
|
"recall": 0.7639472540211564 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8012646292084975, |
|
"number": 8857, |
|
"precision": 0.7875054513737462, |
|
"recall": 0.8155131534379587 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9855775897933713, |
|
"number": 7189, |
|
"precision": 0.9825798423890502, |
|
"recall": 0.9885936847962165 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7727272727272728, |
|
"number": 92, |
|
"precision": 0.6640625, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.953449148254343, |
|
"number": 5732, |
|
"precision": 0.9227881162259223, |
|
"recall": 0.9862177250523377 |
|
}, |
|
"eval_loss": 0.4791179597377777, |
|
"eval_overall_accuracy": 0.8352236088457308, |
|
"eval_overall_f1": 0.8516931350306697, |
|
"eval_overall_precision": 0.8244940456823062, |
|
"eval_overall_recall": 0.8807479753918876, |
|
"eval_runtime": 6.5842, |
|
"eval_samples_per_second": 1291.88, |
|
"eval_steps_per_second": 40.4, |
|
"step": 25000 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"learning_rate": 2.4757473767570778e-05, |
|
"loss": 0.4442, |
|
"step": 25500 |
|
}, |
|
{ |
|
"epoch": 5.15, |
|
"learning_rate": 2.4262522272817265e-05, |
|
"loss": 0.4274, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 5.15, |
|
"eval_COMMENT": { |
|
"f1": 0.7096947333109694, |
|
"number": 6901, |
|
"precision": 0.6607946026986506, |
|
"recall": 0.766410665120997 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8056639536180176, |
|
"number": 8857, |
|
"precision": 0.795727342803656, |
|
"recall": 0.8158518685785254 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9859017987360232, |
|
"number": 7189, |
|
"precision": 0.9844660194174757, |
|
"recall": 0.9873417721518988 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7962962962962964, |
|
"number": 92, |
|
"precision": 0.6935483870967742, |
|
"recall": 0.9347826086956522 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9532647207693606, |
|
"number": 5732, |
|
"precision": 0.9229010127409344, |
|
"recall": 0.9856943475226797 |
|
}, |
|
"eval_loss": 0.48070788383483887, |
|
"eval_overall_accuracy": 0.836058111747525, |
|
"eval_overall_f1": 0.854768006474238, |
|
"eval_overall_precision": 0.8299990177138928, |
|
"eval_overall_recall": 0.8810607903792013, |
|
"eval_runtime": 9.3326, |
|
"eval_samples_per_second": 911.433, |
|
"eval_steps_per_second": 28.502, |
|
"step": 26000 |
|
}, |
|
{ |
|
"epoch": 5.25, |
|
"learning_rate": 2.376757077806375e-05, |
|
"loss": 0.432, |
|
"step": 26500 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"learning_rate": 2.3272619283310237e-05, |
|
"loss": 0.4312, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"eval_COMMENT": { |
|
"f1": 0.7056545830829829, |
|
"number": 6901, |
|
"precision": 0.6542461005199307, |
|
"recall": 0.7658310389798579 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8019135562107137, |
|
"number": 8857, |
|
"precision": 0.7903508771929825, |
|
"recall": 0.8138195777351248 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9852421533984619, |
|
"number": 7189, |
|
"precision": 0.981501932633904, |
|
"recall": 0.989010989010989 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.789237668161435, |
|
"number": 92, |
|
"precision": 0.6717557251908397, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9502391541495343, |
|
"number": 5732, |
|
"precision": 0.9154405820533549, |
|
"recall": 0.9877878576413119 |
|
}, |
|
"eval_loss": 0.48605257272720337, |
|
"eval_overall_accuracy": 0.83349770511702, |
|
"eval_overall_f1": 0.8517865242150884, |
|
"eval_overall_precision": 0.8242733597763183, |
|
"eval_overall_recall": 0.8811998192624517, |
|
"eval_runtime": 7.0035, |
|
"eval_samples_per_second": 1214.536, |
|
"eval_steps_per_second": 37.981, |
|
"step": 27000 |
|
}, |
|
{ |
|
"epoch": 5.44, |
|
"learning_rate": 2.2777667788556724e-05, |
|
"loss": 0.4321, |
|
"step": 27500 |
|
}, |
|
{ |
|
"epoch": 5.54, |
|
"learning_rate": 2.2282716293803206e-05, |
|
"loss": 0.4315, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 5.54, |
|
"eval_COMMENT": { |
|
"f1": 0.7045745469244761, |
|
"number": 6901, |
|
"precision": 0.6583983883152859, |
|
"recall": 0.7577162730039124 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8038757099899767, |
|
"number": 8857, |
|
"precision": 0.7930996593780903, |
|
"recall": 0.8149486282036807 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861322978782415, |
|
"number": 7189, |
|
"precision": 0.9831328632655882, |
|
"recall": 0.9891500904159132 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7909090909090909, |
|
"number": 92, |
|
"precision": 0.6796875, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9528698872243729, |
|
"number": 5732, |
|
"precision": 0.9204878048780488, |
|
"recall": 0.9876133984647593 |
|
}, |
|
"eval_loss": 0.481955349445343, |
|
"eval_overall_accuracy": 0.8341235822933657, |
|
"eval_overall_f1": 0.8531310577328276, |
|
"eval_overall_precision": 0.8282385285069058, |
|
"eval_overall_recall": 0.8795662298842585, |
|
"eval_runtime": 8.4264, |
|
"eval_samples_per_second": 1009.444, |
|
"eval_steps_per_second": 31.567, |
|
"step": 28000 |
|
}, |
|
{ |
|
"epoch": 5.64, |
|
"learning_rate": 2.1787764799049696e-05, |
|
"loss": 0.4328, |
|
"step": 28500 |
|
}, |
|
{ |
|
"epoch": 5.74, |
|
"learning_rate": 2.129281330429618e-05, |
|
"loss": 0.4316, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 5.74, |
|
"eval_COMMENT": { |
|
"f1": 0.7066999527697188, |
|
"number": 6901, |
|
"precision": 0.6612373737373738, |
|
"recall": 0.7588755252861904 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8088874039425326, |
|
"number": 8857, |
|
"precision": 0.7980441709702231, |
|
"recall": 0.8200293553121825 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862747816442535, |
|
"number": 7189, |
|
"precision": 0.9830040071852978, |
|
"recall": 0.9895673946306858 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7741935483870968, |
|
"number": 92, |
|
"precision": 0.672, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.955117910573916, |
|
"number": 5732, |
|
"precision": 0.9263813739957371, |
|
"recall": 0.9856943475226797 |
|
}, |
|
"eval_loss": 0.4761992394924164, |
|
"eval_overall_accuracy": 0.836987444524523, |
|
"eval_overall_f1": 0.8555853712048336, |
|
"eval_overall_precision": 0.8315727314480678, |
|
"eval_overall_recall": 0.8810260331583887, |
|
"eval_runtime": 8.3244, |
|
"eval_samples_per_second": 1021.82, |
|
"eval_steps_per_second": 31.954, |
|
"step": 29000 |
|
}, |
|
{ |
|
"epoch": 5.84, |
|
"learning_rate": 2.0797861809542665e-05, |
|
"loss": 0.4429, |
|
"step": 29500 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"learning_rate": 2.0302910314789152e-05, |
|
"loss": 0.4278, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"eval_COMMENT": { |
|
"f1": 0.7081487447979596, |
|
"number": 6901, |
|
"precision": 0.6596223583843942, |
|
"recall": 0.7643819736270105 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8039357385068653, |
|
"number": 8857, |
|
"precision": 0.7918309242225142, |
|
"recall": 0.8164163938128034 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861265260821309, |
|
"number": 7189, |
|
"precision": 0.9835339698353397, |
|
"recall": 0.9887327862011406 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.783410138248848, |
|
"number": 92, |
|
"precision": 0.68, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9540695710908478, |
|
"number": 5732, |
|
"precision": 0.9244109947643979, |
|
"recall": 0.9856943475226797 |
|
}, |
|
"eval_loss": 0.4822809398174286, |
|
"eval_overall_accuracy": 0.8347684254447522, |
|
"eval_overall_f1": 0.8540192709386161, |
|
"eval_overall_precision": 0.8285882391396725, |
|
"eval_overall_recall": 0.8810607903792013, |
|
"eval_runtime": 6.5281, |
|
"eval_samples_per_second": 1302.987, |
|
"eval_steps_per_second": 40.747, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 6.04, |
|
"learning_rate": 1.9807958820035638e-05, |
|
"loss": 0.4251, |
|
"step": 30500 |
|
}, |
|
{ |
|
"epoch": 6.14, |
|
"learning_rate": 1.9313007325282124e-05, |
|
"loss": 0.4211, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 6.14, |
|
"eval_COMMENT": { |
|
"f1": 0.705458989679522, |
|
"number": 6901, |
|
"precision": 0.6637281206081512, |
|
"recall": 0.7527894508042313 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.7998453978245265, |
|
"number": 8857, |
|
"precision": 0.7826885671061162, |
|
"recall": 0.8177712543750706 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858901646147462, |
|
"number": 7189, |
|
"precision": 0.9804649883065071, |
|
"recall": 0.9913757128947003 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.787037037037037, |
|
"number": 92, |
|
"precision": 0.6854838709677419, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9548103724976772, |
|
"number": 5732, |
|
"precision": 0.925495333224169, |
|
"recall": 0.9860432658757851 |
|
}, |
|
"eval_loss": 0.47935572266578674, |
|
"eval_overall_accuracy": 0.8356218943215871, |
|
"eval_overall_f1": 0.8526081682167409, |
|
"eval_overall_precision": 0.8273764755894183, |
|
"eval_overall_recall": 0.8794272010010079, |
|
"eval_runtime": 9.2091, |
|
"eval_samples_per_second": 923.653, |
|
"eval_steps_per_second": 28.885, |
|
"step": 31000 |
|
}, |
|
{ |
|
"epoch": 6.24, |
|
"learning_rate": 1.8818055830528607e-05, |
|
"loss": 0.4113, |
|
"step": 31500 |
|
}, |
|
{ |
|
"epoch": 6.34, |
|
"learning_rate": 1.8323104335775097e-05, |
|
"loss": 0.4231, |
|
"step": 32000 |
|
}, |
|
{ |
|
"epoch": 6.34, |
|
"eval_COMMENT": { |
|
"f1": 0.7081927385612093, |
|
"number": 6901, |
|
"precision": 0.6627510420613869, |
|
"recall": 0.7603245906390378 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8008871638480732, |
|
"number": 8857, |
|
"precision": 0.7868816735672259, |
|
"recall": 0.815400248391103 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866055937261433, |
|
"number": 7189, |
|
"precision": 0.9844875346260388, |
|
"recall": 0.9887327862011406 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.8018433179723502, |
|
"number": 92, |
|
"precision": 0.696, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9542042675212956, |
|
"number": 5732, |
|
"precision": 0.9235918367346939, |
|
"recall": 0.9869155617585486 |
|
}, |
|
"eval_loss": 0.4756552577018738, |
|
"eval_overall_accuracy": 0.8364374312483405, |
|
"eval_overall_f1": 0.8534784953485236, |
|
"eval_overall_precision": 0.8284312121707835, |
|
"eval_overall_recall": 0.8800875881964478, |
|
"eval_runtime": 6.7948, |
|
"eval_samples_per_second": 1251.831, |
|
"eval_steps_per_second": 39.147, |
|
"step": 32000 |
|
}, |
|
{ |
|
"epoch": 6.43, |
|
"learning_rate": 1.782815284102158e-05, |
|
"loss": 0.4209, |
|
"step": 32500 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"learning_rate": 1.7333201346268066e-05, |
|
"loss": 0.4302, |
|
"step": 33000 |
|
}, |
|
{ |
|
"epoch": 6.53, |
|
"eval_COMMENT": { |
|
"f1": 0.706057529610829, |
|
"number": 6901, |
|
"precision": 0.6624333248666497, |
|
"recall": 0.7558324880452109 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8062360801781736, |
|
"number": 8857, |
|
"precision": 0.7953421948808085, |
|
"recall": 0.8174325392345038 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.986130374479889, |
|
"number": 7189, |
|
"precision": 0.9832664914949523, |
|
"recall": 0.989010989010989 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7766990291262136, |
|
"number": 92, |
|
"precision": 0.7017543859649122, |
|
"recall": 0.8695652173913043 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544303797468354, |
|
"number": 5732, |
|
"precision": 0.9243216737495914, |
|
"recall": 0.9865666434054431 |
|
}, |
|
"eval_loss": 0.4785662591457367, |
|
"eval_overall_accuracy": 0.8354891324963016, |
|
"eval_overall_f1": 0.8546047187178056, |
|
"eval_overall_precision": 0.8311760840998685, |
|
"eval_overall_recall": 0.8793924437801953, |
|
"eval_runtime": 8.3624, |
|
"eval_samples_per_second": 1017.166, |
|
"eval_steps_per_second": 31.809, |
|
"step": 33000 |
|
}, |
|
{ |
|
"epoch": 6.63, |
|
"learning_rate": 1.6838249851514553e-05, |
|
"loss": 0.4309, |
|
"step": 33500 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"learning_rate": 1.634329835676104e-05, |
|
"loss": 0.4223, |
|
"step": 34000 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"eval_COMMENT": { |
|
"f1": 0.703981612925032, |
|
"number": 6901, |
|
"precision": 0.6597820577800304, |
|
"recall": 0.7545283292276481 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8044022011005503, |
|
"number": 8857, |
|
"precision": 0.7922049485439019, |
|
"recall": 0.8169809190470814 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.986130374479889, |
|
"number": 7189, |
|
"precision": 0.9832664914949523, |
|
"recall": 0.989010989010989 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7981651376146789, |
|
"number": 92, |
|
"precision": 0.6904761904761905, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9541965415436525, |
|
"number": 5732, |
|
"precision": 0.923730197615548, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.4795403480529785, |
|
"eval_overall_accuracy": 0.836304669423055, |
|
"eval_overall_f1": 0.8534844880813807, |
|
"eval_overall_precision": 0.8292139251294828, |
|
"eval_overall_recall": 0.8792186576761322, |
|
"eval_runtime": 8.6534, |
|
"eval_samples_per_second": 982.967, |
|
"eval_steps_per_second": 30.739, |
|
"step": 34000 |
|
}, |
|
{ |
|
"epoch": 6.83, |
|
"learning_rate": 1.5848346862007525e-05, |
|
"loss": 0.4119, |
|
"step": 34500 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"learning_rate": 1.535339536725401e-05, |
|
"loss": 0.4184, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"eval_COMMENT": { |
|
"f1": 0.7059539095762654, |
|
"number": 6901, |
|
"precision": 0.6614741641337386, |
|
"recall": 0.7568468337922041 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8020405899966729, |
|
"number": 8857, |
|
"precision": 0.788057099269914, |
|
"recall": 0.8165292988596591 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865650969529086, |
|
"number": 7189, |
|
"precision": 0.9823472624465591, |
|
"recall": 0.9908193072750034 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7963800904977375, |
|
"number": 92, |
|
"precision": 0.6821705426356589, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9530710253601821, |
|
"number": 5732, |
|
"precision": 0.9216229428059313, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.4803193211555481, |
|
"eval_overall_accuracy": 0.8355839623715056, |
|
"eval_overall_f1": 0.8531527433837031, |
|
"eval_overall_precision": 0.8277868584504741, |
|
"eval_overall_recall": 0.8801223454172604, |
|
"eval_runtime": 7.0311, |
|
"eval_samples_per_second": 1209.766, |
|
"eval_steps_per_second": 37.832, |
|
"step": 35000 |
|
}, |
|
{ |
|
"epoch": 7.03, |
|
"learning_rate": 1.4858443872500496e-05, |
|
"loss": 0.4189, |
|
"step": 35500 |
|
}, |
|
{ |
|
"epoch": 7.13, |
|
"learning_rate": 1.4363492377746981e-05, |
|
"loss": 0.4071, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 7.13, |
|
"eval_COMMENT": { |
|
"f1": 0.7068977142471848, |
|
"number": 6901, |
|
"precision": 0.6610340479192938, |
|
"recall": 0.7596000579626141 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8058371393561323, |
|
"number": 8857, |
|
"precision": 0.7952072111685171, |
|
"recall": 0.8167551089533702 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864247125640672, |
|
"number": 7189, |
|
"precision": 0.9823423920540765, |
|
"recall": 0.9905411044651551 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7981651376146789, |
|
"number": 92, |
|
"precision": 0.6904761904761905, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9542881284326151, |
|
"number": 5732, |
|
"precision": 0.9252826478780928, |
|
"recall": 0.9851709699930217 |
|
}, |
|
"eval_loss": 0.48823681473731995, |
|
"eval_overall_accuracy": 0.8358115540719948, |
|
"eval_overall_f1": 0.8546798029556651, |
|
"eval_overall_precision": 0.8303884609080479, |
|
"eval_overall_recall": 0.880435160404574, |
|
"eval_runtime": 9.3911, |
|
"eval_samples_per_second": 905.75, |
|
"eval_steps_per_second": 28.325, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 7.23, |
|
"learning_rate": 1.3868540882993467e-05, |
|
"loss": 0.4066, |
|
"step": 36500 |
|
}, |
|
{ |
|
"epoch": 7.33, |
|
"learning_rate": 1.3373589388239954e-05, |
|
"loss": 0.4093, |
|
"step": 37000 |
|
}, |
|
{ |
|
"epoch": 7.33, |
|
"eval_COMMENT": { |
|
"f1": 0.7065691471515801, |
|
"number": 6901, |
|
"precision": 0.6579605098725319, |
|
"recall": 0.7629329082741632 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8055648302726766, |
|
"number": 8857, |
|
"precision": 0.794249972566663, |
|
"recall": 0.8172067291407926 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9863412604867227, |
|
"number": 7189, |
|
"precision": 0.9832734310201825, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7924528301886793, |
|
"number": 92, |
|
"precision": 0.7, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9535530641490347, |
|
"number": 5732, |
|
"precision": 0.9225248735932148, |
|
"recall": 0.9867411025819958 |
|
}, |
|
"eval_loss": 0.48563364148139954, |
|
"eval_overall_accuracy": 0.8367219208739521, |
|
"eval_overall_f1": 0.8541543851375251, |
|
"eval_overall_precision": 0.8286274509803921, |
|
"eval_overall_recall": 0.8813040909248896, |
|
"eval_runtime": 6.6204, |
|
"eval_samples_per_second": 1284.823, |
|
"eval_steps_per_second": 40.179, |
|
"step": 37000 |
|
}, |
|
{ |
|
"epoch": 7.42, |
|
"learning_rate": 1.287863789348644e-05, |
|
"loss": 0.4197, |
|
"step": 37500 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"learning_rate": 1.2383686398732925e-05, |
|
"loss": 0.4124, |
|
"step": 38000 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"eval_COMMENT": { |
|
"f1": 0.7066407036862955, |
|
"number": 6901, |
|
"precision": 0.6584084084084084, |
|
"recall": 0.762498188668309 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8056977520587582, |
|
"number": 8857, |
|
"precision": 0.7942951179374658, |
|
"recall": 0.8174325392345038 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862728785357736, |
|
"number": 7189, |
|
"precision": 0.9831375259156876, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7963800904977375, |
|
"number": 92, |
|
"precision": 0.6821705426356589, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9536647009267059, |
|
"number": 5732, |
|
"precision": 0.9221244705115673, |
|
"recall": 0.9874389392882066 |
|
}, |
|
"eval_loss": 0.4802015423774719, |
|
"eval_overall_accuracy": 0.8361908735728104, |
|
"eval_overall_f1": 0.8542606938363086, |
|
"eval_overall_precision": 0.8286124995916234, |
|
"eval_overall_recall": 0.881547391470578, |
|
"eval_runtime": 9.142, |
|
"eval_samples_per_second": 930.428, |
|
"eval_steps_per_second": 29.096, |
|
"step": 38000 |
|
}, |
|
{ |
|
"epoch": 7.62, |
|
"learning_rate": 1.1888734903979411e-05, |
|
"loss": 0.4071, |
|
"step": 38500 |
|
}, |
|
{ |
|
"epoch": 7.72, |
|
"learning_rate": 1.1393783409225896e-05, |
|
"loss": 0.414, |
|
"step": 39000 |
|
}, |
|
{ |
|
"epoch": 7.72, |
|
"eval_COMMENT": { |
|
"f1": 0.7048144163528779, |
|
"number": 6901, |
|
"precision": 0.6575084681972149, |
|
"recall": 0.7594551514273293 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8015089315433264, |
|
"number": 8857, |
|
"precision": 0.7878721779910568, |
|
"recall": 0.8156260584848143 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858686616791354, |
|
"number": 7189, |
|
"precision": 0.9819235545743066, |
|
"recall": 0.9898455974405341 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7945205479452054, |
|
"number": 92, |
|
"precision": 0.6850393700787402, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9549138804457953, |
|
"number": 5732, |
|
"precision": 0.925229057591623, |
|
"recall": 0.9865666434054431 |
|
}, |
|
"eval_loss": 0.483047753572464, |
|
"eval_overall_accuracy": 0.8365701930736259, |
|
"eval_overall_f1": 0.8526693267336735, |
|
"eval_overall_precision": 0.8268464703193366, |
|
"eval_overall_recall": 0.880157102638073, |
|
"eval_runtime": 7.5994, |
|
"eval_samples_per_second": 1119.299, |
|
"eval_steps_per_second": 35.003, |
|
"step": 39000 |
|
}, |
|
{ |
|
"epoch": 7.82, |
|
"learning_rate": 1.0898831914472382e-05, |
|
"loss": 0.4196, |
|
"step": 39500 |
|
}, |
|
{ |
|
"epoch": 7.92, |
|
"learning_rate": 1.0403880419718868e-05, |
|
"loss": 0.4212, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 7.92, |
|
"eval_COMMENT": { |
|
"f1": 0.7108280254777071, |
|
"number": 6901, |
|
"precision": 0.6614674319940105, |
|
"recall": 0.7681495435444139 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8036936084997496, |
|
"number": 8857, |
|
"precision": 0.7921052631578948, |
|
"recall": 0.8156260584848143 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861815151725575, |
|
"number": 7189, |
|
"precision": 0.9846089850249584, |
|
"recall": 0.9877590763666713 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.787037037037037, |
|
"number": 92, |
|
"precision": 0.6854838709677419, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544457567065969, |
|
"number": 5732, |
|
"precision": 0.9240444299248611, |
|
"recall": 0.9869155617585486 |
|
}, |
|
"eval_loss": 0.4802730679512024, |
|
"eval_overall_accuracy": 0.8373477980502978, |
|
"eval_overall_f1": 0.8546737867021544, |
|
"eval_overall_precision": 0.8292364016736402, |
|
"eval_overall_recall": 0.8817211775746411, |
|
"eval_runtime": 8.1983, |
|
"eval_samples_per_second": 1037.537, |
|
"eval_steps_per_second": 32.446, |
|
"step": 40000 |
|
}, |
|
{ |
|
"epoch": 8.02, |
|
"learning_rate": 9.908928924965353e-06, |
|
"loss": 0.4135, |
|
"step": 40500 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"learning_rate": 9.41397743021184e-06, |
|
"loss": 0.3994, |
|
"step": 41000 |
|
}, |
|
{ |
|
"epoch": 8.12, |
|
"eval_COMMENT": { |
|
"f1": 0.7058981774161006, |
|
"number": 6901, |
|
"precision": 0.6586345381526104, |
|
"recall": 0.7604694971743226 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8033988670443185, |
|
"number": 8857, |
|
"precision": 0.7905782052683353, |
|
"recall": 0.8166422039065147 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9862045060658579, |
|
"number": 7189, |
|
"precision": 0.9830016583747927, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7963800904977375, |
|
"number": 92, |
|
"precision": 0.6821705426356589, |
|
"recall": 0.9565217391304348 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9540433426089888, |
|
"number": 5732, |
|
"precision": 0.9232903541700669, |
|
"recall": 0.9869155617585486 |
|
}, |
|
"eval_loss": 0.4922930598258972, |
|
"eval_overall_accuracy": 0.8354701665212608, |
|
"eval_overall_f1": 0.8534523408555069, |
|
"eval_overall_precision": 0.8278284164788134, |
|
"eval_overall_recall": 0.8807132181710751, |
|
"eval_runtime": 7.4213, |
|
"eval_samples_per_second": 1146.156, |
|
"eval_steps_per_second": 35.843, |
|
"step": 41000 |
|
}, |
|
{ |
|
"epoch": 8.22, |
|
"learning_rate": 8.919025935458326e-06, |
|
"loss": 0.4167, |
|
"step": 41500 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 8.424074440704812e-06, |
|
"loss": 0.4052, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"eval_COMMENT": { |
|
"f1": 0.7033915447373744, |
|
"number": 6901, |
|
"precision": 0.6577553593947036, |
|
"recall": 0.7558324880452109 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8042463317029791, |
|
"number": 8857, |
|
"precision": 0.7920087575259989, |
|
"recall": 0.8168680140002258 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9861438270749618, |
|
"number": 7189, |
|
"precision": 0.9823326432022084, |
|
"recall": 0.9899846988454584 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.8018018018018018, |
|
"number": 92, |
|
"precision": 0.6846153846153846, |
|
"recall": 0.967391304347826 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9546567592670776, |
|
"number": 5732, |
|
"precision": 0.9250531827851416, |
|
"recall": 0.9862177250523377 |
|
}, |
|
"eval_loss": 0.4865518808364868, |
|
"eval_overall_accuracy": 0.8359822478473619, |
|
"eval_overall_f1": 0.8533090590337481, |
|
"eval_overall_precision": 0.8284507872082747, |
|
"eval_overall_recall": 0.8797052587675089, |
|
"eval_runtime": 7.4797, |
|
"eval_samples_per_second": 1137.217, |
|
"eval_steps_per_second": 35.563, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 8.41, |
|
"learning_rate": 7.929122945951298e-06, |
|
"loss": 0.4042, |
|
"step": 42500 |
|
}, |
|
{ |
|
"epoch": 8.51, |
|
"learning_rate": 7.434171451197783e-06, |
|
"loss": 0.4042, |
|
"step": 43000 |
|
}, |
|
{ |
|
"epoch": 8.51, |
|
"eval_COMMENT": { |
|
"f1": 0.7073401950162513, |
|
"number": 6901, |
|
"precision": 0.663912546078556, |
|
"recall": 0.7568468337922041 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8030025020850708, |
|
"number": 8857, |
|
"precision": 0.7910823838737949, |
|
"recall": 0.8152873433442475 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9858200179843675, |
|
"number": 7189, |
|
"precision": 0.980462300495322, |
|
"recall": 0.991236611489776 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7909090909090909, |
|
"number": 92, |
|
"precision": 0.6796875, |
|
"recall": 0.9456521739130435 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9534962089300758, |
|
"number": 5732, |
|
"precision": 0.921961550993809, |
|
"recall": 0.9872644801116539 |
|
}, |
|
"eval_loss": 0.48657840490341187, |
|
"eval_overall_accuracy": 0.8364563972233813, |
|
"eval_overall_f1": 0.8538279932546375, |
|
"eval_overall_precision": 0.8292443250679682, |
|
"eval_overall_recall": 0.8799138020923847, |
|
"eval_runtime": 9.0804, |
|
"eval_samples_per_second": 936.741, |
|
"eval_steps_per_second": 29.294, |
|
"step": 43000 |
|
}, |
|
{ |
|
"epoch": 8.61, |
|
"learning_rate": 6.939219956444269e-06, |
|
"loss": 0.4036, |
|
"step": 43500 |
|
}, |
|
{ |
|
"epoch": 8.71, |
|
"learning_rate": 6.444268461690754e-06, |
|
"loss": 0.4135, |
|
"step": 44000 |
|
}, |
|
{ |
|
"epoch": 8.71, |
|
"eval_COMMENT": { |
|
"f1": 0.7091805715057758, |
|
"number": 6901, |
|
"precision": 0.664262212098203, |
|
"recall": 0.7606144037096073 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.802937576499388, |
|
"number": 8857, |
|
"precision": 0.7914884282110344, |
|
"recall": 0.8147228181099695 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.985878443859892, |
|
"number": 7189, |
|
"precision": 0.9812594736116853, |
|
"recall": 0.9905411044651551 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7813953488372093, |
|
"number": 92, |
|
"precision": 0.6829268292682927, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9540588384051252, |
|
"number": 5732, |
|
"precision": 0.9230141901810471, |
|
"recall": 0.9872644801116539 |
|
}, |
|
"eval_loss": 0.48304322361946106, |
|
"eval_overall_accuracy": 0.8367977847741153, |
|
"eval_overall_f1": 0.8542520362219861, |
|
"eval_overall_precision": 0.8296429741238126, |
|
"eval_overall_recall": 0.8803656459629488, |
|
"eval_runtime": 6.5688, |
|
"eval_samples_per_second": 1294.905, |
|
"eval_steps_per_second": 40.494, |
|
"step": 44000 |
|
}, |
|
{ |
|
"epoch": 8.81, |
|
"learning_rate": 5.949316966937241e-06, |
|
"loss": 0.4078, |
|
"step": 44500 |
|
}, |
|
{ |
|
"epoch": 8.91, |
|
"learning_rate": 5.4543654721837265e-06, |
|
"loss": 0.3958, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 8.91, |
|
"eval_COMMENT": { |
|
"f1": 0.7085999057175567, |
|
"number": 6901, |
|
"precision": 0.6619275289380976, |
|
"recall": 0.7623532821330242 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8035773802910788, |
|
"number": 8857, |
|
"precision": 0.7909240021869874, |
|
"recall": 0.8166422039065147 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864836764400082, |
|
"number": 7189, |
|
"precision": 0.9831445150594087, |
|
"recall": 0.9898455974405341 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7906976744186046, |
|
"number": 92, |
|
"precision": 0.6910569105691057, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9539395984477813, |
|
"number": 5732, |
|
"precision": 0.9235543939888925, |
|
"recall": 0.9863921842288904 |
|
}, |
|
"eval_loss": 0.4859357178211212, |
|
"eval_overall_accuracy": 0.8370822743997269, |
|
"eval_overall_f1": 0.8542639055049118, |
|
"eval_overall_precision": 0.829048927263213, |
|
"eval_overall_recall": 0.8810607903792013, |
|
"eval_runtime": 9.1351, |
|
"eval_samples_per_second": 931.131, |
|
"eval_steps_per_second": 29.118, |
|
"step": 45000 |
|
}, |
|
{ |
|
"epoch": 9.01, |
|
"learning_rate": 4.959413977430212e-06, |
|
"loss": 0.4071, |
|
"step": 45500 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"learning_rate": 4.4644624826766974e-06, |
|
"loss": 0.3985, |
|
"step": 46000 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"eval_COMMENT": { |
|
"f1": 0.7050125483280201, |
|
"number": 6901, |
|
"precision": 0.6627135934710533, |
|
"recall": 0.7530792638748007 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8021064301552105, |
|
"number": 8857, |
|
"precision": 0.7878688881629097, |
|
"recall": 0.8168680140002258 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866093110386457, |
|
"number": 7189, |
|
"precision": 0.9842192691029901, |
|
"recall": 0.989010989010989 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7853881278538813, |
|
"number": 92, |
|
"precision": 0.6771653543307087, |
|
"recall": 0.9347826086956522 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9550875412331895, |
|
"number": 5732, |
|
"precision": 0.9269413889344935, |
|
"recall": 0.984996510816469 |
|
}, |
|
"eval_loss": 0.4896639585494995, |
|
"eval_overall_accuracy": 0.8351856768956492, |
|
"eval_overall_f1": 0.8533036226746344, |
|
"eval_overall_precision": 0.8295532871631601, |
|
"eval_overall_recall": 0.8784539988182545, |
|
"eval_runtime": 6.8177, |
|
"eval_samples_per_second": 1247.642, |
|
"eval_steps_per_second": 39.016, |
|
"step": 46000 |
|
}, |
|
{ |
|
"epoch": 9.21, |
|
"learning_rate": 3.969510987923184e-06, |
|
"loss": 0.3989, |
|
"step": 46500 |
|
}, |
|
{ |
|
"epoch": 9.31, |
|
"learning_rate": 3.4745594931696697e-06, |
|
"loss": 0.3944, |
|
"step": 47000 |
|
}, |
|
{ |
|
"epoch": 9.31, |
|
"eval_COMMENT": { |
|
"f1": 0.709349593495935, |
|
"number": 6901, |
|
"precision": 0.6661152818424736, |
|
"recall": 0.7585857122156209 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8033533200088829, |
|
"number": 8857, |
|
"precision": 0.7902785363189514, |
|
"recall": 0.8168680140002258 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9866833125260092, |
|
"number": 7189, |
|
"precision": 0.9839535205422604, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.787037037037037, |
|
"number": 92, |
|
"precision": 0.6854838709677419, |
|
"recall": 0.9239130434782609 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.954649100582721, |
|
"number": 5732, |
|
"precision": 0.9251923391717138, |
|
"recall": 0.9860432658757851 |
|
}, |
|
"eval_loss": 0.48901429772377014, |
|
"eval_overall_accuracy": 0.8369495125744415, |
|
"eval_overall_f1": 0.8547268216112208, |
|
"eval_overall_precision": 0.8308176926105788, |
|
"eval_overall_recall": 0.8800528309756351, |
|
"eval_runtime": 9.5285, |
|
"eval_samples_per_second": 892.692, |
|
"eval_steps_per_second": 27.916, |
|
"step": 47000 |
|
}, |
|
{ |
|
"epoch": 9.4, |
|
"learning_rate": 2.979607998416155e-06, |
|
"loss": 0.397, |
|
"step": 47500 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"learning_rate": 2.484656503662641e-06, |
|
"loss": 0.3959, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 9.5, |
|
"eval_COMMENT": { |
|
"f1": 0.7106236964273699, |
|
"number": 6901, |
|
"precision": 0.6632755589047978, |
|
"recall": 0.765251412838719 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8044214853080043, |
|
"number": 8857, |
|
"precision": 0.7917122239230264, |
|
"recall": 0.8175454442813593 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9865483289418943, |
|
"number": 7189, |
|
"precision": 0.9835476289229919, |
|
"recall": 0.9895673946306858 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7926267281105991, |
|
"number": 92, |
|
"precision": 0.688, |
|
"recall": 0.9347826086956522 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9542693216334796, |
|
"number": 5732, |
|
"precision": 0.9240196078431373, |
|
"recall": 0.9865666434054431 |
|
}, |
|
"eval_loss": 0.4869215190410614, |
|
"eval_overall_accuracy": 0.8368736486742784, |
|
"eval_overall_f1": 0.8550634297555469, |
|
"eval_overall_precision": 0.829693323742889, |
|
"eval_overall_recall": 0.8820339925619547, |
|
"eval_runtime": 6.6612, |
|
"eval_samples_per_second": 1276.945, |
|
"eval_steps_per_second": 39.933, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 9.6, |
|
"learning_rate": 1.989705008909127e-06, |
|
"loss": 0.3916, |
|
"step": 48500 |
|
}, |
|
{ |
|
"epoch": 9.7, |
|
"learning_rate": 1.4947535141556129e-06, |
|
"loss": 0.3979, |
|
"step": 49000 |
|
}, |
|
{ |
|
"epoch": 9.7, |
|
"eval_COMMENT": { |
|
"f1": 0.7113812901046943, |
|
"number": 6901, |
|
"precision": 0.666244939271255, |
|
"recall": 0.7630778148094479 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.8035317636605953, |
|
"number": 8857, |
|
"precision": 0.7906239755218009, |
|
"recall": 0.8168680140002258 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9864780528396089, |
|
"number": 7189, |
|
"precision": 0.9835453539823009, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7813953488372093, |
|
"number": 92, |
|
"precision": 0.6829268292682927, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9541810817652518, |
|
"number": 5732, |
|
"precision": 0.9240071907174375, |
|
"recall": 0.9863921842288904 |
|
}, |
|
"eval_loss": 0.48777857422828674, |
|
"eval_overall_accuracy": 0.8369115806243599, |
|
"eval_overall_f1": 0.8550421585160202, |
|
"eval_overall_precision": 0.8304235317239346, |
|
"eval_overall_recall": 0.8811650620416391, |
|
"eval_runtime": 8.6569, |
|
"eval_samples_per_second": 982.572, |
|
"eval_steps_per_second": 30.727, |
|
"step": 49000 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"learning_rate": 9.998020194020988e-07, |
|
"loss": 0.4088, |
|
"step": 49500 |
|
}, |
|
{ |
|
"epoch": 9.9, |
|
"learning_rate": 5.048505246485845e-07, |
|
"loss": 0.4095, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 9.9, |
|
"eval_COMMENT": { |
|
"f1": 0.7118095366561004, |
|
"number": 6901, |
|
"precision": 0.665783497350492, |
|
"recall": 0.7646717866975801 |
|
}, |
|
"eval_NAME": { |
|
"f1": 0.80368950380619, |
|
"number": 8857, |
|
"precision": 0.7912472647702407, |
|
"recall": 0.8165292988596591 |
|
}, |
|
"eval_QTY": { |
|
"f1": 0.9863412604867227, |
|
"number": 7189, |
|
"precision": 0.9832734310201825, |
|
"recall": 0.9894282932257615 |
|
}, |
|
"eval_RANGE_END": { |
|
"f1": 0.7813953488372093, |
|
"number": 92, |
|
"precision": 0.6829268292682927, |
|
"recall": 0.9130434782608695 |
|
}, |
|
"eval_UNIT": { |
|
"f1": 0.9544226873733964, |
|
"number": 5732, |
|
"precision": 0.9244604316546763, |
|
"recall": 0.9863921842288904 |
|
}, |
|
"eval_loss": 0.48620378971099854, |
|
"eval_overall_accuracy": 0.8372719341501347, |
|
"eval_overall_f1": 0.855167762603271, |
|
"eval_overall_precision": 0.8304135695340384, |
|
"eval_overall_recall": 0.8814431198081402, |
|
"eval_runtime": 8.2871, |
|
"eval_samples_per_second": 1026.42, |
|
"eval_steps_per_second": 32.098, |
|
"step": 50000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.899029895070283e-09, |
|
"loss": 0.3994, |
|
"step": 50500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 50510, |
|
"total_flos": 1555191327435270.0, |
|
"train_loss": 0.45639907907811844, |
|
"train_runtime": 1954.9419, |
|
"train_samples_per_second": 826.638, |
|
"train_steps_per_second": 25.837 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 50510, |
|
"num_train_epochs": 10, |
|
"save_steps": 1000, |
|
"total_flos": 1555191327435270.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|