napsternxg's picture
End of training
84c1492
raw
history blame
74.6 kB
{
"best_metric": 0.47966957092285156,
"best_model_checkpoint": "nyt_ingredients-tagger-paraphrase-MiniLM-L3-v2/checkpoint-24000",
"epoch": 10.0,
"eval_steps": 1000,
"global_step": 50510,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.1,
"learning_rate": 4.9505048505246485e-05,
"loss": 1.1204,
"step": 500
},
{
"epoch": 0.2,
"learning_rate": 4.9010097010492975e-05,
"loss": 0.7174,
"step": 1000
},
{
"epoch": 0.2,
"eval_COMMENT": {
"f1": 0.5647948868453662,
"number": 6824,
"precision": 0.5088729580444236,
"recall": 0.6345252051582649
},
"eval_NAME": {
"f1": 0.7765338110165697,
"number": 8803,
"precision": 0.7654784240150094,
"recall": 0.7879132114052028
},
"eval_QTY": {
"f1": 0.9714048901782015,
"number": 7168,
"precision": 0.9619699042407661,
"recall": 0.9810267857142857
},
"eval_RANGE_END": {
"f1": 0.0,
"number": 82,
"precision": 0.0,
"recall": 0.0
},
"eval_UNIT": {
"f1": 0.945750755794424,
"number": 5755,
"precision": 0.9151633349585568,
"recall": 0.9784535186794092
},
"eval_loss": 0.656587541103363,
"eval_overall_accuracy": 0.7841206721853672,
"eval_overall_f1": 0.8021117908321461,
"eval_overall_precision": 0.7710823961589276,
"eval_overall_recall": 0.8357432243643476,
"eval_runtime": 7.1565,
"eval_samples_per_second": 1188.573,
"eval_steps_per_second": 37.169,
"step": 1000
},
{
"epoch": 0.3,
"learning_rate": 4.851514551573946e-05,
"loss": 0.6502,
"step": 1500
},
{
"epoch": 0.4,
"learning_rate": 4.802019402098595e-05,
"loss": 0.6076,
"step": 2000
},
{
"epoch": 0.4,
"eval_COMMENT": {
"f1": 0.5854632587859425,
"number": 6824,
"precision": 0.5363414634146342,
"recall": 0.6444900351699883
},
"eval_NAME": {
"f1": 0.7806724071738058,
"number": 8803,
"precision": 0.7547189819724284,
"recall": 0.8084743837328183
},
"eval_QTY": {
"f1": 0.9778333680772705,
"number": 7168,
"precision": 0.974110480409802,
"recall": 0.9815848214285714
},
"eval_RANGE_END": {
"f1": 0.23529411764705882,
"number": 82,
"precision": 0.6,
"recall": 0.14634146341463414
},
"eval_UNIT": {
"f1": 0.9454667112746737,
"number": 5755,
"precision": 0.9114658925979681,
"recall": 0.9821025195482189
},
"eval_loss": 0.584534227848053,
"eval_overall_accuracy": 0.7988032194543752,
"eval_overall_f1": 0.811141258834958,
"eval_overall_precision": 0.7792688421188132,
"eval_overall_recall": 0.8457320480581167,
"eval_runtime": 6.3972,
"eval_samples_per_second": 1329.645,
"eval_steps_per_second": 41.581,
"step": 2000
},
{
"epoch": 0.49,
"learning_rate": 4.752524252623243e-05,
"loss": 0.5843,
"step": 2500
},
{
"epoch": 0.59,
"learning_rate": 4.703029103147892e-05,
"loss": 0.5777,
"step": 3000
},
{
"epoch": 0.59,
"eval_COMMENT": {
"f1": 0.6086500655307995,
"number": 6824,
"precision": 0.55049786628734,
"recall": 0.6805392731535757
},
"eval_NAME": {
"f1": 0.7919685823330935,
"number": 8803,
"precision": 0.7717766278568349,
"recall": 0.8132454844939225
},
"eval_QTY": {
"f1": 0.9790267875683533,
"number": 7168,
"precision": 0.9715620277510647,
"recall": 0.9866071428571429
},
"eval_RANGE_END": {
"f1": 0.5133689839572192,
"number": 82,
"precision": 0.45714285714285713,
"recall": 0.5853658536585366
},
"eval_UNIT": {
"f1": 0.9490924440692275,
"number": 5755,
"precision": 0.9229885057471264,
"recall": 0.9767158992180712
},
"eval_loss": 0.5503401756286621,
"eval_overall_accuracy": 0.805647427686543,
"eval_overall_f1": 0.820622555083754,
"eval_overall_precision": 0.7870198165843648,
"eval_overall_recall": 0.8572226879016485,
"eval_runtime": 8.9283,
"eval_samples_per_second": 952.704,
"eval_steps_per_second": 29.793,
"step": 3000
},
{
"epoch": 0.69,
"learning_rate": 4.65353395367254e-05,
"loss": 0.5581,
"step": 3500
},
{
"epoch": 0.79,
"learning_rate": 4.6040388041971886e-05,
"loss": 0.553,
"step": 4000
},
{
"epoch": 0.79,
"eval_COMMENT": {
"f1": 0.6282245827010623,
"number": 6824,
"precision": 0.5713428537141486,
"recall": 0.6976846424384525
},
"eval_NAME": {
"f1": 0.7973033207042568,
"number": 8803,
"precision": 0.7823947512301804,
"recall": 0.812791093945246
},
"eval_QTY": {
"f1": 0.9824755835699939,
"number": 7168,
"precision": 0.9756500206355757,
"recall": 0.9893973214285714
},
"eval_RANGE_END": {
"f1": 0.5595238095238095,
"number": 82,
"precision": 0.5465116279069767,
"recall": 0.573170731707317
},
"eval_UNIT": {
"f1": 0.9491468718634996,
"number": 5755,
"precision": 0.9150137074665377,
"recall": 0.9859252823631625
},
"eval_loss": 0.5342816710472107,
"eval_overall_accuracy": 0.8121666316171832,
"eval_overall_f1": 0.8289142895451346,
"eval_overall_precision": 0.7968357285557776,
"eval_overall_recall": 0.8636839899413243,
"eval_runtime": 7.0508,
"eval_samples_per_second": 1206.385,
"eval_steps_per_second": 37.726,
"step": 4000
},
{
"epoch": 0.89,
"learning_rate": 4.5545436547218376e-05,
"loss": 0.5436,
"step": 4500
},
{
"epoch": 0.99,
"learning_rate": 4.505048505246486e-05,
"loss": 0.5407,
"step": 5000
},
{
"epoch": 0.99,
"eval_COMMENT": {
"f1": 0.6475744396119103,
"number": 6824,
"precision": 0.5958625785001848,
"recall": 0.7091148886283705
},
"eval_NAME": {
"f1": 0.8001564333202973,
"number": 8803,
"precision": 0.787269129287599,
"recall": 0.8134726797682609
},
"eval_QTY": {
"f1": 0.9841955023323818,
"number": 7168,
"precision": 0.9823488533703961,
"recall": 0.9860491071428571
},
"eval_RANGE_END": {
"f1": 0.626865671641791,
"number": 82,
"precision": 0.5294117647058824,
"recall": 0.7682926829268293
},
"eval_UNIT": {
"f1": 0.9520282780676653,
"number": 5755,
"precision": 0.9231271421576628,
"recall": 0.9827975673327541
},
"eval_loss": 0.518293023109436,
"eval_overall_accuracy": 0.8185520102471945,
"eval_overall_f1": 0.8361275088547816,
"eval_overall_precision": 0.8085002283253963,
"eval_overall_recall": 0.8657096954456552,
"eval_runtime": 7.4009,
"eval_samples_per_second": 1149.315,
"eval_steps_per_second": 35.941,
"step": 5000
},
{
"epoch": 1.09,
"learning_rate": 4.455553355771135e-05,
"loss": 0.5231,
"step": 5500
},
{
"epoch": 1.19,
"learning_rate": 4.406058206295783e-05,
"loss": 0.5109,
"step": 6000
},
{
"epoch": 1.19,
"eval_COMMENT": {
"f1": 0.6651526284149355,
"number": 6824,
"precision": 0.611145206824598,
"recall": 0.729630715123095
},
"eval_NAME": {
"f1": 0.803545545768759,
"number": 8803,
"precision": 0.788943623426382,
"recall": 0.8186981710780415
},
"eval_QTY": {
"f1": 0.9848337275636566,
"number": 7168,
"precision": 0.9822370247016375,
"recall": 0.9874441964285714
},
"eval_RANGE_END": {
"f1": 0.653061224489796,
"number": 82,
"precision": 0.5614035087719298,
"recall": 0.7804878048780488
},
"eval_UNIT": {
"f1": 0.9527340129749768,
"number": 5755,
"precision": 0.924762839385018,
"recall": 0.9824500434404866
},
"eval_loss": 0.5209813714027405,
"eval_overall_accuracy": 0.8200623243542929,
"eval_overall_f1": 0.841881782031408,
"eval_overall_precision": 0.8133220471415549,
"eval_overall_recall": 0.8725202570550433,
"eval_runtime": 8.4151,
"eval_samples_per_second": 1010.797,
"eval_steps_per_second": 31.61,
"step": 6000
},
{
"epoch": 1.29,
"learning_rate": 4.356563056820432e-05,
"loss": 0.5232,
"step": 6500
},
{
"epoch": 1.39,
"learning_rate": 4.3070679073450804e-05,
"loss": 0.5125,
"step": 7000
},
{
"epoch": 1.39,
"eval_COMMENT": {
"f1": 0.6596956900596554,
"number": 6824,
"precision": 0.607906114885732,
"recall": 0.7211313012895663
},
"eval_NAME": {
"f1": 0.8034675615212529,
"number": 8803,
"precision": 0.7913407513495648,
"recall": 0.8159718277859821
},
"eval_QTY": {
"f1": 0.9845339278249966,
"number": 7168,
"precision": 0.983300862788756,
"recall": 0.9857700892857143
},
"eval_RANGE_END": {
"f1": 0.641711229946524,
"number": 82,
"precision": 0.5714285714285714,
"recall": 0.7317073170731707
},
"eval_UNIT": {
"f1": 0.952638700947226,
"number": 5755,
"precision": 0.9279947273026857,
"recall": 0.978627280625543
},
"eval_loss": 0.5072416663169861,
"eval_overall_accuracy": 0.8215152847611218,
"eval_overall_f1": 0.8404435129470623,
"eval_overall_precision": 0.8142932005764444,
"eval_overall_recall": 0.8683291422184968,
"eval_runtime": 6.3336,
"eval_samples_per_second": 1342.988,
"eval_steps_per_second": 41.998,
"step": 7000
},
{
"epoch": 1.48,
"learning_rate": 4.257572757869729e-05,
"loss": 0.5084,
"step": 7500
},
{
"epoch": 1.58,
"learning_rate": 4.208077608394378e-05,
"loss": 0.4967,
"step": 8000
},
{
"epoch": 1.58,
"eval_COMMENT": {
"f1": 0.6653271716562856,
"number": 6824,
"precision": 0.6126803996546195,
"recall": 0.7278722157092614
},
"eval_NAME": {
"f1": 0.8041098197742967,
"number": 8803,
"precision": 0.7949600355239786,
"recall": 0.8134726797682609
},
"eval_QTY": {
"f1": 0.9852011394427846,
"number": 7168,
"precision": 0.9813148788927336,
"recall": 0.9891183035714286
},
"eval_RANGE_END": {
"f1": 0.6431718061674009,
"number": 82,
"precision": 0.503448275862069,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.9540510918135063,
"number": 5755,
"precision": 0.9266295447101212,
"recall": 0.9831450912250217
},
"eval_loss": 0.5088181495666504,
"eval_overall_accuracy": 0.8218402890626494,
"eval_overall_f1": 0.8425442817824156,
"eval_overall_precision": 0.815566669935602,
"eval_overall_recall": 0.871367700474993,
"eval_runtime": 8.617,
"eval_samples_per_second": 987.123,
"eval_steps_per_second": 30.869,
"step": 8000
},
{
"epoch": 1.68,
"learning_rate": 4.158582458919026e-05,
"loss": 0.5024,
"step": 8500
},
{
"epoch": 1.78,
"learning_rate": 4.109087309443675e-05,
"loss": 0.5121,
"step": 9000
},
{
"epoch": 1.78,
"eval_COMMENT": {
"f1": 0.6751009421265142,
"number": 6824,
"precision": 0.6241911398705824,
"recall": 0.735052754982415
},
"eval_NAME": {
"f1": 0.803609223571349,
"number": 8803,
"precision": 0.7883291443558081,
"recall": 0.8194933545382256
},
"eval_QTY": {
"f1": 0.9847892827239743,
"number": 7168,
"precision": 0.9850642099385818,
"recall": 0.9845145089285714
},
"eval_RANGE_END": {
"f1": 0.6346153846153846,
"number": 82,
"precision": 0.5238095238095238,
"recall": 0.8048780487804879
},
"eval_UNIT": {
"f1": 0.9542967763656258,
"number": 5755,
"precision": 0.9253999347045381,
"recall": 0.9850564726324935
},
"eval_loss": 0.502194344997406,
"eval_overall_accuracy": 0.824765327776397,
"eval_overall_f1": 0.8448383557018655,
"eval_overall_precision": 0.8176322582753325,
"eval_overall_recall": 0.8739172953338922,
"eval_runtime": 8.4909,
"eval_samples_per_second": 1001.783,
"eval_steps_per_second": 31.328,
"step": 9000
},
{
"epoch": 1.88,
"learning_rate": 4.059592159968323e-05,
"loss": 0.4946,
"step": 9500
},
{
"epoch": 1.98,
"learning_rate": 4.010097010492972e-05,
"loss": 0.5008,
"step": 10000
},
{
"epoch": 1.98,
"eval_COMMENT": {
"f1": 0.6771771771771772,
"number": 6824,
"precision": 0.6337506387327542,
"recall": 0.7269929660023446
},
"eval_NAME": {
"f1": 0.8049774008146867,
"number": 8803,
"precision": 0.7910726036411494,
"recall": 0.8193797569010565
},
"eval_QTY": {
"f1": 0.9824440619621343,
"number": 7168,
"precision": 0.9698246567894522,
"recall": 0.9953962053571429
},
"eval_RANGE_END": {
"f1": 0.625,
"number": 82,
"precision": 0.47468354430379744,
"recall": 0.9146341463414634
},
"eval_UNIT": {
"f1": 0.9544190749010025,
"number": 5755,
"precision": 0.9263984298331698,
"recall": 0.9841876629018245
},
"eval_loss": 0.4997539520263672,
"eval_overall_accuracy": 0.8250138604775652,
"eval_overall_f1": 0.8461161686962692,
"eval_overall_precision": 0.8192313982011448,
"eval_overall_recall": 0.874825370215144,
"eval_runtime": 6.4794,
"eval_samples_per_second": 1312.774,
"eval_steps_per_second": 41.053,
"step": 10000
},
{
"epoch": 2.08,
"learning_rate": 3.9606018610176205e-05,
"loss": 0.4788,
"step": 10500
},
{
"epoch": 2.18,
"learning_rate": 3.911106711542269e-05,
"loss": 0.4863,
"step": 11000
},
{
"epoch": 2.18,
"eval_COMMENT": {
"f1": 0.6816733337853415,
"number": 6824,
"precision": 0.6343217665615142,
"recall": 0.736664712778429
},
"eval_NAME": {
"f1": 0.8056887897378694,
"number": 8803,
"precision": 0.7913881888901063,
"recall": 0.820515733272748
},
"eval_QTY": {
"f1": 0.9852848873701096,
"number": 7168,
"precision": 0.9850787895690978,
"recall": 0.9854910714285714
},
"eval_RANGE_END": {
"f1": 0.6666666666666666,
"number": 82,
"precision": 0.6122448979591837,
"recall": 0.7317073170731707
},
"eval_UNIT": {
"f1": 0.9536959084020878,
"number": 5755,
"precision": 0.9250367466927977,
"recall": 0.9841876629018245
},
"eval_loss": 0.49540793895721436,
"eval_overall_accuracy": 0.8272888905882578,
"eval_overall_f1": 0.8476538695917124,
"eval_overall_precision": 0.8224280646432794,
"eval_overall_recall": 0.8744761106454317,
"eval_runtime": 9.0889,
"eval_samples_per_second": 935.867,
"eval_steps_per_second": 29.266,
"step": 11000
},
{
"epoch": 2.28,
"learning_rate": 3.861611562066917e-05,
"loss": 0.4922,
"step": 11500
},
{
"epoch": 2.38,
"learning_rate": 3.812116412591566e-05,
"loss": 0.4893,
"step": 12000
},
{
"epoch": 2.38,
"eval_COMMENT": {
"f1": 0.6847270771712826,
"number": 6824,
"precision": 0.6325136612021858,
"recall": 0.7463364595545134
},
"eval_NAME": {
"f1": 0.8033142412278262,
"number": 8803,
"precision": 0.7868191721132898,
"recall": 0.820515733272748
},
"eval_QTY": {
"f1": 0.9853482397055761,
"number": 7168,
"precision": 0.9809207797594359,
"recall": 0.9898158482142857
},
"eval_RANGE_END": {
"f1": 0.6491228070175438,
"number": 82,
"precision": 0.5068493150684932,
"recall": 0.9024390243902439
},
"eval_UNIT": {
"f1": 0.9545187053383775,
"number": 5755,
"precision": 0.9245928338762215,
"recall": 0.9864465682015638
},
"eval_loss": 0.49466800689697266,
"eval_overall_accuracy": 0.8257212227808898,
"eval_overall_f1": 0.8474479228061903,
"eval_overall_precision": 0.818249813014211,
"eval_overall_recall": 0.878806929309863,
"eval_runtime": 7.6267,
"eval_samples_per_second": 1115.288,
"eval_steps_per_second": 34.877,
"step": 12000
},
{
"epoch": 2.47,
"learning_rate": 3.762621263116215e-05,
"loss": 0.4767,
"step": 12500
},
{
"epoch": 2.57,
"learning_rate": 3.7131261136408633e-05,
"loss": 0.489,
"step": 13000
},
{
"epoch": 2.57,
"eval_COMMENT": {
"f1": 0.6822220714915552,
"number": 6824,
"precision": 0.635054931178179,
"recall": 0.736957796014068
},
"eval_NAME": {
"f1": 0.8048549635320973,
"number": 8803,
"precision": 0.7892552959161389,
"recall": 0.8210837214585937
},
"eval_QTY": {
"f1": 0.9860937282714505,
"number": 7168,
"precision": 0.9829498197948433,
"recall": 0.9892578125
},
"eval_RANGE_END": {
"f1": 0.6574074074074074,
"number": 82,
"precision": 0.5298507462686567,
"recall": 0.8658536585365854
},
"eval_UNIT": {
"f1": 0.9543087518898035,
"number": 5755,
"precision": 0.9235896602178507,
"recall": 0.9871416159860991
},
"eval_loss": 0.48692840337753296,
"eval_overall_accuracy": 0.8271550652876288,
"eval_overall_f1": 0.8478583975138494,
"eval_overall_precision": 0.8209052851909995,
"eval_overall_recall": 0.8766415199776474,
"eval_runtime": 6.7601,
"eval_samples_per_second": 1258.259,
"eval_steps_per_second": 39.348,
"step": 13000
},
{
"epoch": 2.67,
"learning_rate": 3.663630964165512e-05,
"loss": 0.4794,
"step": 13500
},
{
"epoch": 2.77,
"learning_rate": 3.6141358146901606e-05,
"loss": 0.4691,
"step": 14000
},
{
"epoch": 2.77,
"eval_COMMENT": {
"f1": 0.6935899173329719,
"number": 6824,
"precision": 0.6450718427022939,
"recall": 0.75
},
"eval_NAME": {
"f1": 0.8057417336907953,
"number": 8803,
"precision": 0.7925502692011867,
"recall": 0.8193797569010565
},
"eval_QTY": {
"f1": 0.9854750156369451,
"number": 7168,
"precision": 0.9818584683561834,
"recall": 0.9891183035714286
},
"eval_RANGE_END": {
"f1": 0.6820276497695853,
"number": 82,
"precision": 0.5481481481481482,
"recall": 0.9024390243902439
},
"eval_UNIT": {
"f1": 0.9554861052453754,
"number": 5755,
"precision": 0.9296515450361604,
"recall": 0.9827975673327541
},
"eval_loss": 0.4904623329639435,
"eval_overall_accuracy": 0.8282639034928403,
"eval_overall_f1": 0.8510328725870033,
"eval_overall_precision": 0.8252994257588186,
"eval_overall_recall": 0.8784227437831796,
"eval_runtime": 9.0651,
"eval_samples_per_second": 938.328,
"eval_steps_per_second": 29.343,
"step": 14000
},
{
"epoch": 2.87,
"learning_rate": 3.564640665214809e-05,
"loss": 0.484,
"step": 14500
},
{
"epoch": 2.97,
"learning_rate": 3.515145515739457e-05,
"loss": 0.4781,
"step": 15000
},
{
"epoch": 2.97,
"eval_COMMENT": {
"f1": 0.6936924742826204,
"number": 6824,
"precision": 0.6444919517102615,
"recall": 0.7510257913247362
},
"eval_NAME": {
"f1": 0.8070410729253981,
"number": 8803,
"precision": 0.7942146942366916,
"recall": 0.8202885379984096
},
"eval_QTY": {
"f1": 0.9859409799554566,
"number": 7168,
"precision": 0.98375,
"recall": 0.9881417410714286
},
"eval_RANGE_END": {
"f1": 0.6602870813397129,
"number": 82,
"precision": 0.5433070866141733,
"recall": 0.8414634146341463
},
"eval_UNIT": {
"f1": 0.9547484621218505,
"number": 5755,
"precision": 0.9268651832460733,
"recall": 0.9843614248479583
},
"eval_loss": 0.48784932494163513,
"eval_overall_accuracy": 0.8293345058978722,
"eval_overall_f1": 0.8513236911105472,
"eval_overall_precision": 0.825476495095627,
"eval_overall_recall": 0.8788418552668343,
"eval_runtime": 7.0221,
"eval_samples_per_second": 1211.315,
"eval_steps_per_second": 37.88,
"step": 15000
},
{
"epoch": 3.07,
"learning_rate": 3.465650366264107e-05,
"loss": 0.462,
"step": 15500
},
{
"epoch": 3.17,
"learning_rate": 3.416155216788755e-05,
"loss": 0.4599,
"step": 16000
},
{
"epoch": 3.17,
"eval_COMMENT": {
"f1": 0.6904161841836387,
"number": 6824,
"precision": 0.6450299096347206,
"recall": 0.742672919109027
},
"eval_NAME": {
"f1": 0.8082375265096551,
"number": 8803,
"precision": 0.7944048272078991,
"recall": 0.8225604907417926
},
"eval_QTY": {
"f1": 0.9857391304347826,
"number": 7168,
"precision": 0.983072013320383,
"recall": 0.9884207589285714
},
"eval_RANGE_END": {
"f1": 0.6636363636363637,
"number": 82,
"precision": 0.5289855072463768,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.9555706291334577,
"number": 5755,
"precision": 0.9331015068719987,
"recall": 0.9791485664639444
},
"eval_loss": 0.48515409231185913,
"eval_overall_accuracy": 0.8305962873038025,
"eval_overall_f1": 0.8510883569539567,
"eval_overall_precision": 0.8269205428910265,
"eval_overall_recall": 0.8767113718915899,
"eval_runtime": 8.5334,
"eval_samples_per_second": 996.787,
"eval_steps_per_second": 31.172,
"step": 16000
},
{
"epoch": 3.27,
"learning_rate": 3.3666600673134034e-05,
"loss": 0.4548,
"step": 16500
},
{
"epoch": 3.37,
"learning_rate": 3.317164917838052e-05,
"loss": 0.4636,
"step": 17000
},
{
"epoch": 3.37,
"eval_COMMENT": {
"f1": 0.6982570806100218,
"number": 6824,
"precision": 0.6520854526958291,
"recall": 0.7514654161781946
},
"eval_NAME": {
"f1": 0.8060380709251347,
"number": 8803,
"precision": 0.7879774305555556,
"recall": 0.8249460411223447
},
"eval_QTY": {
"f1": 0.9860387580745988,
"number": 7168,
"precision": 0.9818785447503112,
"recall": 0.990234375
},
"eval_RANGE_END": {
"f1": 0.6198347107438017,
"number": 82,
"precision": 0.46875,
"recall": 0.9146341463414634
},
"eval_UNIT": {
"f1": 0.9546639751030365,
"number": 5755,
"precision": 0.9251711770459733,
"recall": 0.9860990443092963
},
"eval_loss": 0.4889169931411743,
"eval_overall_accuracy": 0.8302904009023648,
"eval_overall_f1": 0.8521313412678315,
"eval_overall_precision": 0.8246903898310624,
"eval_overall_recall": 0.8814613020396759,
"eval_runtime": 8.1836,
"eval_samples_per_second": 1039.392,
"eval_steps_per_second": 32.504,
"step": 17000
},
{
"epoch": 3.46,
"learning_rate": 3.267669768362701e-05,
"loss": 0.4638,
"step": 17500
},
{
"epoch": 3.56,
"learning_rate": 3.218174618887349e-05,
"loss": 0.4688,
"step": 18000
},
{
"epoch": 3.56,
"eval_COMMENT": {
"f1": 0.7010448264239973,
"number": 6824,
"precision": 0.6491074772188241,
"recall": 0.7620164126611958
},
"eval_NAME": {
"f1": 0.8081609837898266,
"number": 8803,
"precision": 0.7955320787938813,
"recall": 0.8211973190957628
},
"eval_QTY": {
"f1": 0.9860232250886588,
"number": 7168,
"precision": 0.9829474559822543,
"recall": 0.9891183035714286
},
"eval_RANGE_END": {
"f1": 0.6428571428571429,
"number": 82,
"precision": 0.5526315789473685,
"recall": 0.7682926829268293
},
"eval_UNIT": {
"f1": 0.9546716003700276,
"number": 5755,
"precision": 0.9250325945241199,
"recall": 0.98627280625543
},
"eval_loss": 0.49013254046440125,
"eval_overall_accuracy": 0.8319345403100923,
"eval_overall_f1": 0.8534117209805214,
"eval_overall_precision": 0.8264781911586663,
"eval_overall_recall": 0.8821598211791003,
"eval_runtime": 7.2351,
"eval_samples_per_second": 1175.656,
"eval_steps_per_second": 36.765,
"step": 18000
},
{
"epoch": 3.66,
"learning_rate": 3.168679469411997e-05,
"loss": 0.4648,
"step": 18500
},
{
"epoch": 3.76,
"learning_rate": 3.119184319936647e-05,
"loss": 0.4584,
"step": 19000
},
{
"epoch": 3.76,
"eval_COMMENT": {
"f1": 0.6999050332383666,
"number": 6824,
"precision": 0.65155342258146,
"recall": 0.7560082063305978
},
"eval_NAME": {
"f1": 0.8059467918622849,
"number": 8803,
"precision": 0.7932665859830564,
"recall": 0.819038963989549
},
"eval_QTY": {
"f1": 0.9858998402444954,
"number": 7168,
"precision": 0.981740213030848,
"recall": 0.9900948660714286
},
"eval_RANGE_END": {
"f1": 0.6636363636363637,
"number": 82,
"precision": 0.5289855072463768,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.956632006086736,
"number": 5755,
"precision": 0.9315113598946329,
"recall": 0.9831450912250217
},
"eval_loss": 0.48241040110588074,
"eval_overall_accuracy": 0.8306727589041619,
"eval_overall_f1": 0.8529790115098173,
"eval_overall_precision": 0.8275420388859696,
"eval_overall_recall": 0.8800293378038558,
"eval_runtime": 9.4362,
"eval_samples_per_second": 901.421,
"eval_steps_per_second": 28.189,
"step": 19000
},
{
"epoch": 3.86,
"learning_rate": 3.069689170461295e-05,
"loss": 0.4584,
"step": 19500
},
{
"epoch": 3.96,
"learning_rate": 3.0201940209859435e-05,
"loss": 0.4701,
"step": 20000
},
{
"epoch": 3.96,
"eval_COMMENT": {
"f1": 0.7003649886371462,
"number": 6824,
"precision": 0.6606470053267507,
"recall": 0.7451641266119577
},
"eval_NAME": {
"f1": 0.8087504883084994,
"number": 8803,
"precision": 0.7948661693725319,
"recall": 0.8231284789276383
},
"eval_QTY": {
"f1": 0.98635477582846,
"number": 7168,
"precision": 0.9844357976653697,
"recall": 0.98828125
},
"eval_RANGE_END": {
"f1": 0.660377358490566,
"number": 82,
"precision": 0.5384615384615384,
"recall": 0.8536585365853658
},
"eval_UNIT": {
"f1": 0.956190798376184,
"number": 5755,
"precision": 0.9314549349151425,
"recall": 0.9822762814943528
},
"eval_loss": 0.48059511184692383,
"eval_overall_accuracy": 0.8328713174144952,
"eval_overall_f1": 0.8544527532290959,
"eval_overall_precision": 0.8321636652542372,
"eval_overall_recall": 0.8779687063425538,
"eval_runtime": 6.465,
"eval_samples_per_second": 1315.706,
"eval_steps_per_second": 41.145,
"step": 20000
},
{
"epoch": 4.06,
"learning_rate": 2.970698871510592e-05,
"loss": 0.4594,
"step": 20500
},
{
"epoch": 4.16,
"learning_rate": 2.9212037220352405e-05,
"loss": 0.4441,
"step": 21000
},
{
"epoch": 4.16,
"eval_COMMENT": {
"f1": 0.6940426407074792,
"number": 6824,
"precision": 0.6520674996779595,
"recall": 0.7417936694021102
},
"eval_NAME": {
"f1": 0.8061428889383486,
"number": 8803,
"precision": 0.7900534409423056,
"recall": 0.8229012836533001
},
"eval_QTY": {
"f1": 0.9851016429963798,
"number": 7168,
"precision": 0.9831851028349082,
"recall": 0.9870256696428571
},
"eval_RANGE_END": {
"f1": 0.6521739130434783,
"number": 82,
"precision": 0.5882352941176471,
"recall": 0.7317073170731707
},
"eval_UNIT": {
"f1": 0.9563670253325427,
"number": 5755,
"precision": 0.9332010582010583,
"recall": 0.9807124239791486
},
"eval_loss": 0.4863247871398926,
"eval_overall_accuracy": 0.8309977632056895,
"eval_overall_f1": 0.851638092004753,
"eval_overall_precision": 0.8284893321883876,
"eval_overall_recall": 0.8761176306230791,
"eval_runtime": 8.7832,
"eval_samples_per_second": 968.441,
"eval_steps_per_second": 30.285,
"step": 21000
},
{
"epoch": 4.26,
"learning_rate": 2.871708572559889e-05,
"loss": 0.4493,
"step": 21500
},
{
"epoch": 4.36,
"learning_rate": 2.8222134230845377e-05,
"loss": 0.4375,
"step": 22000
},
{
"epoch": 4.36,
"eval_COMMENT": {
"f1": 0.699911438108863,
"number": 6824,
"precision": 0.6539783577339274,
"recall": 0.7527842907385698
},
"eval_NAME": {
"f1": 0.8084585420144685,
"number": 8803,
"precision": 0.7924075488164066,
"recall": 0.8251732363966829
},
"eval_QTY": {
"f1": 0.985897881208753,
"number": 7168,
"precision": 0.9818735298187353,
"recall": 0.9899553571428571
},
"eval_RANGE_END": {
"f1": 0.6519823788546256,
"number": 82,
"precision": 0.5103448275862069,
"recall": 0.9024390243902439
},
"eval_UNIT": {
"f1": 0.9565510841137266,
"number": 5755,
"precision": 0.9296490652673007,
"recall": 0.9850564726324935
},
"eval_loss": 0.4853152334690094,
"eval_overall_accuracy": 0.8326036668132373,
"eval_overall_f1": 0.8537987957513024,
"eval_overall_precision": 0.8277581004853732,
"eval_overall_recall": 0.8815311539536184,
"eval_runtime": 7.6535,
"eval_samples_per_second": 1111.391,
"eval_steps_per_second": 34.755,
"step": 22000
},
{
"epoch": 4.45,
"learning_rate": 2.7727182736091867e-05,
"loss": 0.4541,
"step": 22500
},
{
"epoch": 4.55,
"learning_rate": 2.7232231241338353e-05,
"loss": 0.4566,
"step": 23000
},
{
"epoch": 4.55,
"eval_COMMENT": {
"f1": 0.6999176728869374,
"number": 6824,
"precision": 0.6580237358101135,
"recall": 0.7475087924970691
},
"eval_NAME": {
"f1": 0.8100474462740721,
"number": 8803,
"precision": 0.7963125548726954,
"recall": 0.8242644552993298
},
"eval_QTY": {
"f1": 0.9862956521739129,
"number": 7168,
"precision": 0.9836270292770917,
"recall": 0.9889787946428571
},
"eval_RANGE_END": {
"f1": 0.6979166666666666,
"number": 82,
"precision": 0.6090909090909091,
"recall": 0.8170731707317073
},
"eval_UNIT": {
"f1": 0.9566618607412434,
"number": 5755,
"precision": 0.9343936381709742,
"recall": 0.9800173761946134
},
"eval_loss": 0.48071911931037903,
"eval_overall_accuracy": 0.8325271952128778,
"eval_overall_f1": 0.8548318578055702,
"eval_overall_precision": 0.8324122182877188,
"eval_overall_recall": 0.8784925956971221,
"eval_runtime": 7.014,
"eval_samples_per_second": 1212.724,
"eval_steps_per_second": 37.924,
"step": 23000
},
{
"epoch": 4.65,
"learning_rate": 2.6737279746584836e-05,
"loss": 0.4448,
"step": 23500
},
{
"epoch": 4.75,
"learning_rate": 2.6242328251831323e-05,
"loss": 0.4546,
"step": 24000
},
{
"epoch": 4.75,
"eval_COMMENT": {
"f1": 0.7049292873815736,
"number": 6824,
"precision": 0.6631361405321622,
"recall": 0.7523446658851114
},
"eval_NAME": {
"f1": 0.8063276332646355,
"number": 8803,
"precision": 0.7910382513661203,
"recall": 0.8222196978302851
},
"eval_QTY": {
"f1": 0.9859881491808993,
"number": 7168,
"precision": 0.985369931726348,
"recall": 0.9866071428571429
},
"eval_RANGE_END": {
"f1": 0.6783625730994152,
"number": 82,
"precision": 0.651685393258427,
"recall": 0.7073170731707317
},
"eval_UNIT": {
"f1": 0.9558001693480102,
"number": 5755,
"precision": 0.9321222130470685,
"recall": 0.9807124239791486
},
"eval_loss": 0.47966957092285156,
"eval_overall_accuracy": 0.832374252012159,
"eval_overall_f1": 0.8546520520010196,
"eval_overall_precision": 0.8322907357759904,
"eval_overall_recall": 0.8782481139983236,
"eval_runtime": 9.0205,
"eval_samples_per_second": 942.965,
"eval_steps_per_second": 29.488,
"step": 24000
},
{
"epoch": 4.85,
"learning_rate": 2.5747376757077806e-05,
"loss": 0.4498,
"step": 24500
},
{
"epoch": 4.95,
"learning_rate": 2.5252425262324292e-05,
"loss": 0.4462,
"step": 25000
},
{
"epoch": 4.95,
"eval_COMMENT": {
"f1": 0.6998077451249656,
"number": 6824,
"precision": 0.6583979328165375,
"recall": 0.7467760844079718
},
"eval_NAME": {
"f1": 0.8070350643586329,
"number": 8803,
"precision": 0.7887430864331417,
"recall": 0.8261956151312053
},
"eval_QTY": {
"f1": 0.9860329372524493,
"number": 7168,
"precision": 0.9822788315104527,
"recall": 0.9898158482142857
},
"eval_RANGE_END": {
"f1": 0.6571428571428573,
"number": 82,
"precision": 0.5390625,
"recall": 0.8414634146341463
},
"eval_UNIT": {
"f1": 0.9555161644298135,
"number": 5755,
"precision": 0.9290873276428102,
"recall": 0.9834926151172894
},
"eval_loss": 0.48545241355895996,
"eval_overall_accuracy": 0.8324889594126981,
"eval_overall_f1": 0.8534792330103665,
"eval_overall_precision": 0.8286080778844889,
"eval_overall_recall": 0.879889633975971,
"eval_runtime": 6.8304,
"eval_samples_per_second": 1245.307,
"eval_steps_per_second": 38.943,
"step": 25000
},
{
"epoch": 5.05,
"learning_rate": 2.4757473767570778e-05,
"loss": 0.4373,
"step": 25500
},
{
"epoch": 5.15,
"learning_rate": 2.4262522272817265e-05,
"loss": 0.433,
"step": 26000
},
{
"epoch": 5.15,
"eval_COMMENT": {
"f1": 0.7011549238023645,
"number": 6824,
"precision": 0.656934306569343,
"recall": 0.7517584994138335
},
"eval_NAME": {
"f1": 0.805529234713784,
"number": 8803,
"precision": 0.7907638432917488,
"recall": 0.8208565261842554
},
"eval_QTY": {
"f1": 0.9860607750209088,
"number": 7168,
"precision": 0.9852367688022284,
"recall": 0.9868861607142857
},
"eval_RANGE_END": {
"f1": 0.6607929515418502,
"number": 82,
"precision": 0.5172413793103449,
"recall": 0.9146341463414634
},
"eval_UNIT": {
"f1": 0.9570749915167968,
"number": 5755,
"precision": 0.935024034477043,
"recall": 0.9801911381407472
},
"eval_loss": 0.4933657944202423,
"eval_overall_accuracy": 0.8298315713002083,
"eval_overall_f1": 0.8533179496750768,
"eval_overall_precision": 0.8297640653357532,
"eval_overall_recall": 0.8782481139983236,
"eval_runtime": 8.2218,
"eval_samples_per_second": 1034.568,
"eval_steps_per_second": 32.353,
"step": 26000
},
{
"epoch": 5.25,
"learning_rate": 2.376757077806375e-05,
"loss": 0.4353,
"step": 26500
},
{
"epoch": 5.35,
"learning_rate": 2.3272619283310237e-05,
"loss": 0.442,
"step": 27000
},
{
"epoch": 5.35,
"eval_COMMENT": {
"f1": 0.7040608447643624,
"number": 6824,
"precision": 0.6560364464692483,
"recall": 0.7596717467760844
},
"eval_NAME": {
"f1": 0.8098804068402817,
"number": 8803,
"precision": 0.7970520294797052,
"recall": 0.8231284789276383
},
"eval_QTY": {
"f1": 0.9860037601838312,
"number": 7168,
"precision": 0.9842902822188239,
"recall": 0.9877232142857143
},
"eval_RANGE_END": {
"f1": 0.6728110599078342,
"number": 82,
"precision": 0.5407407407407407,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.956294296321296,
"number": 5755,
"precision": 0.9294735115630638,
"recall": 0.9847089487402259
},
"eval_loss": 0.48500868678092957,
"eval_overall_accuracy": 0.8332727933163822,
"eval_overall_f1": 0.855207451312447,
"eval_overall_precision": 0.8301005983299362,
"eval_overall_recall": 0.8818804135233306,
"eval_runtime": 8.8139,
"eval_samples_per_second": 965.065,
"eval_steps_per_second": 30.18,
"step": 27000
},
{
"epoch": 5.44,
"learning_rate": 2.2777667788556724e-05,
"loss": 0.4321,
"step": 27500
},
{
"epoch": 5.54,
"learning_rate": 2.2282716293803206e-05,
"loss": 0.4348,
"step": 28000
},
{
"epoch": 5.54,
"eval_COMMENT": {
"f1": 0.7028109676082602,
"number": 6824,
"precision": 0.6646636185499674,
"recall": 0.7456037514654161
},
"eval_NAME": {
"f1": 0.8111872527717422,
"number": 8803,
"precision": 0.7959763831183031,
"recall": 0.8269907985913894
},
"eval_QTY": {
"f1": 0.9861033907726514,
"number": 7168,
"precision": 0.982281284606866,
"recall": 0.9899553571428571
},
"eval_RANGE_END": {
"f1": 0.6995073891625616,
"number": 82,
"precision": 0.5867768595041323,
"recall": 0.8658536585365854
},
"eval_UNIT": {
"f1": 0.9556492411467116,
"number": 5755,
"precision": 0.9282555282555283,
"recall": 0.9847089487402259
},
"eval_loss": 0.4908902645111084,
"eval_overall_accuracy": 0.8319536582101822,
"eval_overall_f1": 0.8560025813902146,
"eval_overall_precision": 0.8330964265644111,
"eval_overall_recall": 0.8802039675887119,
"eval_runtime": 6.4986,
"eval_samples_per_second": 1308.901,
"eval_steps_per_second": 40.932,
"step": 28000
},
{
"epoch": 5.64,
"learning_rate": 2.1787764799049696e-05,
"loss": 0.4335,
"step": 28500
},
{
"epoch": 5.74,
"learning_rate": 2.129281330429618e-05,
"loss": 0.4324,
"step": 29000
},
{
"epoch": 5.74,
"eval_COMMENT": {
"f1": 0.7066996835878389,
"number": 6824,
"precision": 0.6659320715582059,
"recall": 0.7527842907385698
},
"eval_NAME": {
"f1": 0.8106571540047935,
"number": 8803,
"precision": 0.7957977675640184,
"recall": 0.8260820174940361
},
"eval_QTY": {
"f1": 0.9864479810966712,
"number": 7168,
"precision": 0.9828278631768453,
"recall": 0.9900948660714286
},
"eval_RANGE_END": {
"f1": 0.7035175879396985,
"number": 82,
"precision": 0.5982905982905983,
"recall": 0.8536585365853658
},
"eval_UNIT": {
"f1": 0.9554875976894326,
"number": 5755,
"precision": 0.9346850589995014,
"recall": 0.9772371850564726
},
"eval_loss": 0.4821859300136566,
"eval_overall_accuracy": 0.8341139809203357,
"eval_overall_f1": 0.8565747208484169,
"eval_overall_precision": 0.8342437183434304,
"eval_overall_recall": 0.8801341156747695,
"eval_runtime": 8.6529,
"eval_samples_per_second": 983.028,
"eval_steps_per_second": 30.741,
"step": 29000
},
{
"epoch": 5.84,
"learning_rate": 2.0797861809542665e-05,
"loss": 0.4433,
"step": 29500
},
{
"epoch": 5.94,
"learning_rate": 2.0302910314789152e-05,
"loss": 0.4375,
"step": 30000
},
{
"epoch": 5.94,
"eval_COMMENT": {
"f1": 0.70434363598816,
"number": 6824,
"precision": 0.6641568220173958,
"recall": 0.7497069167643611
},
"eval_NAME": {
"f1": 0.8090376569037656,
"number": 8803,
"precision": 0.7948914711686034,
"recall": 0.823696467113484
},
"eval_QTY": {
"f1": 0.9860154456272177,
"number": 7168,
"precision": 0.9834836918806384,
"recall": 0.9885602678571429
},
"eval_RANGE_END": {
"f1": 0.6785714285714285,
"number": 82,
"precision": 0.5352112676056338,
"recall": 0.926829268292683
},
"eval_UNIT": {
"f1": 0.9560281284419215,
"number": 5755,
"precision": 0.9328703703703703,
"recall": 0.9803649000868809
},
"eval_loss": 0.48426133394241333,
"eval_overall_accuracy": 0.8327948458141358,
"eval_overall_f1": 0.8553999864065792,
"eval_overall_precision": 0.8329252150893448,
"eval_overall_recall": 0.8791212629226041,
"eval_runtime": 7.6434,
"eval_samples_per_second": 1112.862,
"eval_steps_per_second": 34.801,
"step": 30000
},
{
"epoch": 6.04,
"learning_rate": 1.9807958820035638e-05,
"loss": 0.4331,
"step": 30500
},
{
"epoch": 6.14,
"learning_rate": 1.9313007325282124e-05,
"loss": 0.4226,
"step": 31000
},
{
"epoch": 6.14,
"eval_COMMENT": {
"f1": 0.7090600610790635,
"number": 6824,
"precision": 0.6603463531791177,
"recall": 0.7655334114888629
},
"eval_NAME": {
"f1": 0.806347438752784,
"number": 8803,
"precision": 0.7907611663208475,
"recall": 0.8225604907417926
},
"eval_QTY": {
"f1": 0.9856705620478576,
"number": 7168,
"precision": 0.9829356270810211,
"recall": 0.9884207589285714
},
"eval_RANGE_END": {
"f1": 0.669603524229075,
"number": 82,
"precision": 0.5241379310344828,
"recall": 0.926829268292683
},
"eval_UNIT": {
"f1": 0.9566317921025986,
"number": 5755,
"precision": 0.9298015417418403,
"recall": 0.9850564726324935
},
"eval_loss": 0.48777666687965393,
"eval_overall_accuracy": 0.8335786797178198,
"eval_overall_f1": 0.8552831783601016,
"eval_overall_precision": 0.8288551019070712,
"eval_overall_recall": 0.8834520815870355,
"eval_runtime": 8.452,
"eval_samples_per_second": 1006.385,
"eval_steps_per_second": 31.472,
"step": 31000
},
{
"epoch": 6.24,
"learning_rate": 1.8818055830528607e-05,
"loss": 0.4237,
"step": 31500
},
{
"epoch": 6.34,
"learning_rate": 1.8323104335775097e-05,
"loss": 0.4305,
"step": 32000
},
{
"epoch": 6.34,
"eval_COMMENT": {
"f1": 0.7089205043489988,
"number": 6824,
"precision": 0.6565505182964906,
"recall": 0.770369284876905
},
"eval_NAME": {
"f1": 0.8125769273805529,
"number": 8803,
"precision": 0.8005732554293904,
"recall": 0.8249460411223447
},
"eval_QTY": {
"f1": 0.9859881491808993,
"number": 7168,
"precision": 0.985369931726348,
"recall": 0.9866071428571429
},
"eval_RANGE_END": {
"f1": 0.6634146341463415,
"number": 82,
"precision": 0.5528455284552846,
"recall": 0.8292682926829268
},
"eval_UNIT": {
"f1": 0.956661316211878,
"number": 5755,
"precision": 0.9309437684972048,
"recall": 0.9838401390095569
},
"eval_loss": 0.4837185740470886,
"eval_overall_accuracy": 0.834209570420785,
"eval_overall_f1": 0.8570026399512625,
"eval_overall_precision": 0.8312869336835194,
"eval_overall_recall": 0.8843601564682873,
"eval_runtime": 9.3183,
"eval_samples_per_second": 912.826,
"eval_steps_per_second": 28.546,
"step": 32000
},
{
"epoch": 6.43,
"learning_rate": 1.782815284102158e-05,
"loss": 0.423,
"step": 32500
},
{
"epoch": 6.53,
"learning_rate": 1.7333201346268066e-05,
"loss": 0.4142,
"step": 33000
},
{
"epoch": 6.53,
"eval_COMMENT": {
"f1": 0.6982502247734974,
"number": 6824,
"precision": 0.6611656843483955,
"recall": 0.7397420867526378
},
"eval_NAME": {
"f1": 0.8101717599821548,
"number": 8803,
"precision": 0.7957059918939643,
"recall": 0.8251732363966829
},
"eval_QTY": {
"f1": 0.9850003456141564,
"number": 7168,
"precision": 0.9761611179613646,
"recall": 0.9940011160714286
},
"eval_RANGE_END": {
"f1": 0.669683257918552,
"number": 82,
"precision": 0.5323741007194245,
"recall": 0.9024390243902439
},
"eval_UNIT": {
"f1": 0.9568381855111713,
"number": 5755,
"precision": 0.9326843755155915,
"recall": 0.9822762814943528
},
"eval_loss": 0.48620671033859253,
"eval_overall_accuracy": 0.833158085915843,
"eval_overall_f1": 0.8545377366499703,
"eval_overall_precision": 0.831510425271784,
"eval_overall_recall": 0.8788767812238055,
"eval_runtime": 6.5738,
"eval_samples_per_second": 1293.917,
"eval_steps_per_second": 40.463,
"step": 33000
},
{
"epoch": 6.63,
"learning_rate": 1.6838249851514553e-05,
"loss": 0.4247,
"step": 33500
},
{
"epoch": 6.73,
"learning_rate": 1.634329835676104e-05,
"loss": 0.4327,
"step": 34000
},
{
"epoch": 6.73,
"eval_COMMENT": {
"f1": 0.7027439024390244,
"number": 6824,
"precision": 0.6665352260778128,
"recall": 0.7431125439624854
},
"eval_NAME": {
"f1": 0.8050692012673003,
"number": 8803,
"precision": 0.7882020026121027,
"recall": 0.8226740883789617
},
"eval_QTY": {
"f1": 0.9866000138859959,
"number": 7168,
"precision": 0.9820317899101589,
"recall": 0.9912109375
},
"eval_RANGE_END": {
"f1": 0.6930693069306931,
"number": 82,
"precision": 0.5833333333333334,
"recall": 0.8536585365853658
},
"eval_UNIT": {
"f1": 0.9562352145995269,
"number": 5755,
"precision": 0.9306035191580332,
"recall": 0.9833188531711555
},
"eval_loss": 0.4834836721420288,
"eval_overall_accuracy": 0.8330242606152141,
"eval_overall_f1": 0.8544101658059254,
"eval_overall_precision": 0.8318007409367557,
"eval_overall_recall": 0.8782830399552948,
"eval_runtime": 8.5374,
"eval_samples_per_second": 996.324,
"eval_steps_per_second": 31.157,
"step": 34000
},
{
"epoch": 6.83,
"learning_rate": 1.5848346862007525e-05,
"loss": 0.4289,
"step": 34500
},
{
"epoch": 6.93,
"learning_rate": 1.535339536725401e-05,
"loss": 0.4299,
"step": 35000
},
{
"epoch": 6.93,
"eval_COMMENT": {
"f1": 0.706956462492335,
"number": 6824,
"precision": 0.660639246147969,
"recall": 0.7602579132473622
},
"eval_NAME": {
"f1": 0.8096777790166128,
"number": 8803,
"precision": 0.7949644225506295,
"recall": 0.8249460411223447
},
"eval_QTY": {
"f1": 0.9858723641171967,
"number": 7168,
"precision": 0.9836133870295792,
"recall": 0.9881417410714286
},
"eval_RANGE_END": {
"f1": 0.6757990867579909,
"number": 82,
"precision": 0.5401459854014599,
"recall": 0.9024390243902439
},
"eval_UNIT": {
"f1": 0.9569053274516457,
"number": 5755,
"precision": 0.9348582794629537,
"recall": 0.9800173761946134
},
"eval_loss": 0.4832661747932434,
"eval_overall_accuracy": 0.8333301470166516,
"eval_overall_f1": 0.8559610788086318,
"eval_overall_precision": 0.8316150070819197,
"eval_overall_recall": 0.8817756356524169,
"eval_runtime": 7.9218,
"eval_samples_per_second": 1073.752,
"eval_steps_per_second": 33.578,
"step": 35000
},
{
"epoch": 7.03,
"learning_rate": 1.4858443872500496e-05,
"loss": 0.4181,
"step": 35500
},
{
"epoch": 7.13,
"learning_rate": 1.4363492377746981e-05,
"loss": 0.4165,
"step": 36000
},
{
"epoch": 7.13,
"eval_COMMENT": {
"f1": 0.7096729965037363,
"number": 6824,
"precision": 0.6667525441195414,
"recall": 0.7584994138335287
},
"eval_NAME": {
"f1": 0.8082838265504414,
"number": 8803,
"precision": 0.7905082536924414,
"recall": 0.8268772009542201
},
"eval_QTY": {
"f1": 0.9864479810966712,
"number": 7168,
"precision": 0.9828278631768453,
"recall": 0.9900948660714286
},
"eval_RANGE_END": {
"f1": 0.6542056074766355,
"number": 82,
"precision": 0.5303030303030303,
"recall": 0.8536585365853658
},
"eval_UNIT": {
"f1": 0.9563968227142133,
"number": 5755,
"precision": 0.930909689093601,
"recall": 0.9833188531711555
},
"eval_loss": 0.48711806535720825,
"eval_overall_accuracy": 0.8347831074234806,
"eval_overall_f1": 0.8564749724739562,
"eval_overall_precision": 0.8315297832450745,
"eval_overall_recall": 0.8829631181894384,
"eval_runtime": 8.4247,
"eval_samples_per_second": 1009.646,
"eval_steps_per_second": 31.574,
"step": 36000
},
{
"epoch": 7.23,
"learning_rate": 1.3868540882993467e-05,
"loss": 0.4199,
"step": 36500
},
{
"epoch": 7.33,
"learning_rate": 1.3373589388239954e-05,
"loss": 0.4213,
"step": 37000
},
{
"epoch": 7.33,
"eval_COMMENT": {
"f1": 0.7081497797356828,
"number": 6824,
"precision": 0.667705088265836,
"recall": 0.753810082063306
},
"eval_NAME": {
"f1": 0.8101195440644984,
"number": 8803,
"precision": 0.7934001306904814,
"recall": 0.827558786777235
},
"eval_QTY": {
"f1": 0.9860821155184412,
"number": 7168,
"precision": 0.983754512635379,
"recall": 0.9884207589285714
},
"eval_RANGE_END": {
"f1": 0.663594470046083,
"number": 82,
"precision": 0.5333333333333333,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9559865092748736,
"number": 5755,
"precision": 0.9285831285831286,
"recall": 0.9850564726324935
},
"eval_loss": 0.4881742596626282,
"eval_overall_accuracy": 0.8332727933163822,
"eval_overall_f1": 0.8566824966078698,
"eval_overall_precision": 0.832728831442891,
"eval_overall_recall": 0.8820550433081866,
"eval_runtime": 8.1883,
"eval_samples_per_second": 1038.805,
"eval_steps_per_second": 32.486,
"step": 37000
},
{
"epoch": 7.42,
"learning_rate": 1.287863789348644e-05,
"loss": 0.4196,
"step": 37500
},
{
"epoch": 7.52,
"learning_rate": 1.2383686398732925e-05,
"loss": 0.4122,
"step": 38000
},
{
"epoch": 7.52,
"eval_COMMENT": {
"f1": 0.7068037866920929,
"number": 6824,
"precision": 0.660262119862578,
"recall": 0.7604044548651817
},
"eval_NAME": {
"f1": 0.8086100450525612,
"number": 8803,
"precision": 0.7921752397558849,
"recall": 0.8257412245825286
},
"eval_QTY": {
"f1": 0.9867148918411351,
"number": 7168,
"precision": 0.9839090026355944,
"recall": 0.9895368303571429
},
"eval_RANGE_END": {
"f1": 0.6766169154228855,
"number": 82,
"precision": 0.5714285714285714,
"recall": 0.8292682926829268
},
"eval_UNIT": {
"f1": 0.9566393373341222,
"number": 5755,
"precision": 0.9313693219223174,
"recall": 0.9833188531711555
},
"eval_loss": 0.4913991689682007,
"eval_overall_accuracy": 0.8336933871183589,
"eval_overall_f1": 0.8558514330212795,
"eval_overall_precision": 0.8304477808075167,
"eval_overall_recall": 0.8828583403185247,
"eval_runtime": 6.6374,
"eval_samples_per_second": 1281.524,
"eval_steps_per_second": 40.076,
"step": 38000
},
{
"epoch": 7.62,
"learning_rate": 1.1888734903979411e-05,
"loss": 0.4196,
"step": 38500
},
{
"epoch": 7.72,
"learning_rate": 1.1393783409225896e-05,
"loss": 0.4034,
"step": 39000
},
{
"epoch": 7.72,
"eval_COMMENT": {
"f1": 0.7121398334016114,
"number": 6824,
"precision": 0.6667092815136794,
"recall": 0.7642145369284877
},
"eval_NAME": {
"f1": 0.8117607676857844,
"number": 8803,
"precision": 0.7976099111939481,
"recall": 0.8264228104055436
},
"eval_QTY": {
"f1": 0.9866388308977034,
"number": 7168,
"precision": 0.984309913912802,
"recall": 0.9889787946428571
},
"eval_RANGE_END": {
"f1": 0.6859903381642511,
"number": 82,
"precision": 0.568,
"recall": 0.8658536585365854
},
"eval_UNIT": {
"f1": 0.9563307711799983,
"number": 5755,
"precision": 0.9304733727810651,
"recall": 0.9836663770634231
},
"eval_loss": 0.4883587956428528,
"eval_overall_accuracy": 0.8344007494216835,
"eval_overall_f1": 0.8582036415420609,
"eval_overall_precision": 0.8338604467286025,
"eval_overall_recall": 0.884010896898575,
"eval_runtime": 9.4932,
"eval_samples_per_second": 896.008,
"eval_steps_per_second": 28.02,
"step": 39000
},
{
"epoch": 7.82,
"learning_rate": 1.0898831914472382e-05,
"loss": 0.4145,
"step": 39500
},
{
"epoch": 7.92,
"learning_rate": 1.0403880419718868e-05,
"loss": 0.4209,
"step": 40000
},
{
"epoch": 7.92,
"eval_COMMENT": {
"f1": 0.706067877956805,
"number": 6824,
"precision": 0.6634454322896534,
"recall": 0.7545427901524033
},
"eval_NAME": {
"f1": 0.81135449262405,
"number": 8803,
"precision": 0.7984163642362256,
"recall": 0.8247188458480064
},
"eval_QTY": {
"f1": 0.9865127919911012,
"number": 7168,
"precision": 0.9832317073170732,
"recall": 0.9898158482142857
},
"eval_RANGE_END": {
"f1": 0.6697674418604651,
"number": 82,
"precision": 0.5413533834586466,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9571609632446134,
"number": 5755,
"precision": 0.9315789473684211,
"recall": 0.9841876629018245
},
"eval_loss": 0.49103492498397827,
"eval_overall_accuracy": 0.8326992563136865,
"eval_overall_f1": 0.8568276330306375,
"eval_overall_precision": 0.8334709242809497,
"eval_overall_recall": 0.8815311539536184,
"eval_runtime": 6.7729,
"eval_samples_per_second": 1255.88,
"eval_steps_per_second": 39.274,
"step": 40000
},
{
"epoch": 8.02,
"learning_rate": 9.908928924965353e-06,
"loss": 0.4146,
"step": 40500
},
{
"epoch": 8.12,
"learning_rate": 9.41397743021184e-06,
"loss": 0.4078,
"step": 41000
},
{
"epoch": 8.12,
"eval_COMMENT": {
"f1": 0.7065016749846176,
"number": 6824,
"precision": 0.6621812123542228,
"recall": 0.7571805392731535
},
"eval_NAME": {
"f1": 0.8095132004010249,
"number": 8803,
"precision": 0.7941208611080757,
"recall": 0.8255140293081904
},
"eval_QTY": {
"f1": 0.9861565217391305,
"number": 7168,
"precision": 0.9834882752879145,
"recall": 0.9888392857142857
},
"eval_RANGE_END": {
"f1": 0.6824644549763034,
"number": 82,
"precision": 0.5581395348837209,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9566246723598546,
"number": 5755,
"precision": 0.9316534914361001,
"recall": 0.982971329278888
},
"eval_loss": 0.49227482080459595,
"eval_overall_accuracy": 0.8334830902173705,
"eval_overall_f1": 0.856053157948266,
"eval_overall_precision": 0.8316645807259074,
"eval_overall_recall": 0.8819153394803018,
"eval_runtime": 8.7342,
"eval_samples_per_second": 973.868,
"eval_steps_per_second": 30.455,
"step": 41000
},
{
"epoch": 8.22,
"learning_rate": 8.919025935458326e-06,
"loss": 0.4008,
"step": 41500
},
{
"epoch": 8.32,
"learning_rate": 8.424074440704812e-06,
"loss": 0.4098,
"step": 42000
},
{
"epoch": 8.32,
"eval_COMMENT": {
"f1": 0.7069577080491133,
"number": 6824,
"precision": 0.6613067891781521,
"recall": 0.7593786635404455
},
"eval_NAME": {
"f1": 0.8097364895042429,
"number": 8803,
"precision": 0.7961356899769458,
"recall": 0.8238100647506532
},
"eval_QTY": {
"f1": 0.9860801781737194,
"number": 7168,
"precision": 0.9838888888888889,
"recall": 0.98828125
},
"eval_RANGE_END": {
"f1": 0.6889952153110047,
"number": 82,
"precision": 0.5669291338582677,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9567859554355165,
"number": 5755,
"precision": 0.9302478253733792,
"recall": 0.9848827106863597
},
"eval_loss": 0.4903165102005005,
"eval_overall_accuracy": 0.8344198673217734,
"eval_overall_f1": 0.8562469278098886,
"eval_overall_precision": 0.831812942532521,
"eval_overall_recall": 0.8821598211791003,
"eval_runtime": 7.5483,
"eval_samples_per_second": 1126.874,
"eval_steps_per_second": 35.24,
"step": 42000
},
{
"epoch": 8.41,
"learning_rate": 7.929122945951298e-06,
"loss": 0.4092,
"step": 42500
},
{
"epoch": 8.51,
"learning_rate": 7.434171451197783e-06,
"loss": 0.4009,
"step": 43000
},
{
"epoch": 8.51,
"eval_COMMENT": {
"f1": 0.7111504907306434,
"number": 6824,
"precision": 0.6647553516819572,
"recall": 0.7645076201641267
},
"eval_NAME": {
"f1": 0.8115311698449873,
"number": 8803,
"precision": 0.7969554265688314,
"recall": 0.8266500056798819
},
"eval_QTY": {
"f1": 0.9865015307542444,
"number": 7168,
"precision": 0.9840366463076069,
"recall": 0.9889787946428571
},
"eval_RANGE_END": {
"f1": 0.6666666666666667,
"number": 82,
"precision": 0.5689655172413793,
"recall": 0.8048780487804879
},
"eval_UNIT": {
"f1": 0.9566759564225994,
"number": 5755,
"precision": 0.9306605323693723,
"recall": 0.9841876629018245
},
"eval_loss": 0.4936346113681793,
"eval_overall_accuracy": 0.8347639895233907,
"eval_overall_f1": 0.8578206279546571,
"eval_overall_precision": 0.8330755306894849,
"eval_overall_recall": 0.8840807488125174,
"eval_runtime": 7.8937,
"eval_samples_per_second": 1077.574,
"eval_steps_per_second": 33.698,
"step": 43000
},
{
"epoch": 8.61,
"learning_rate": 6.939219956444269e-06,
"loss": 0.4103,
"step": 43500
},
{
"epoch": 8.71,
"learning_rate": 6.444268461690754e-06,
"loss": 0.41,
"step": 44000
},
{
"epoch": 8.71,
"eval_COMMENT": {
"f1": 0.7139846352573254,
"number": 6824,
"precision": 0.6659480025364616,
"recall": 0.7694900351699883
},
"eval_NAME": {
"f1": 0.8144254962258876,
"number": 8803,
"precision": 0.8019158775600088,
"recall": 0.8273315915028967
},
"eval_QTY": {
"f1": 0.9864385562278323,
"number": 7168,
"precision": 0.9834974344751075,
"recall": 0.9893973214285714
},
"eval_RANGE_END": {
"f1": 0.6728110599078342,
"number": 82,
"precision": 0.5407407407407407,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.9569402228976698,
"number": 5755,
"precision": 0.9306946953522746,
"recall": 0.9847089487402259
},
"eval_loss": 0.4894082546234131,
"eval_overall_accuracy": 0.835911063528782,
"eval_overall_f1": 0.8593691770843921,
"eval_overall_precision": 0.8343530030919019,
"eval_overall_recall": 0.8859318245319922,
"eval_runtime": 9.03,
"eval_samples_per_second": 941.975,
"eval_steps_per_second": 29.457,
"step": 44000
},
{
"epoch": 8.81,
"learning_rate": 5.949316966937241e-06,
"loss": 0.4063,
"step": 44500
},
{
"epoch": 8.91,
"learning_rate": 5.4543654721837265e-06,
"loss": 0.4177,
"step": 45000
},
{
"epoch": 8.91,
"eval_COMMENT": {
"f1": 0.7089166264395559,
"number": 6824,
"precision": 0.6695323694151362,
"recall": 0.7532239155920282
},
"eval_NAME": {
"f1": 0.810614930032893,
"number": 8803,
"precision": 0.7959273045763083,
"recall": 0.8258548222196979
},
"eval_QTY": {
"f1": 0.9862956521739129,
"number": 7168,
"precision": 0.9836270292770917,
"recall": 0.9889787946428571
},
"eval_RANGE_END": {
"f1": 0.6926829268292684,
"number": 82,
"precision": 0.5772357723577236,
"recall": 0.8658536585365854
},
"eval_UNIT": {
"f1": 0.9571682014023823,
"number": 5755,
"precision": 0.9314370272936534,
"recall": 0.9843614248479583
},
"eval_loss": 0.4893593490123749,
"eval_overall_accuracy": 0.8339036840193473,
"eval_overall_f1": 0.8575312207968737,
"eval_overall_precision": 0.8349601297025444,
"eval_overall_recall": 0.8813565241687622,
"eval_runtime": 7.9862,
"eval_samples_per_second": 1065.084,
"eval_steps_per_second": 33.307,
"step": 45000
},
{
"epoch": 9.01,
"learning_rate": 4.959413977430212e-06,
"loss": 0.4109,
"step": 45500
},
{
"epoch": 9.11,
"learning_rate": 4.4644624826766974e-06,
"loss": 0.399,
"step": 46000
},
{
"epoch": 9.11,
"eval_COMMENT": {
"f1": 0.7139457401237506,
"number": 6824,
"precision": 0.6659901052898642,
"recall": 0.7693434935521688
},
"eval_NAME": {
"f1": 0.8108047897521581,
"number": 8803,
"precision": 0.7953452797202797,
"recall": 0.8268772009542201
},
"eval_QTY": {
"f1": 0.9858156028368794,
"number": 7168,
"precision": 0.9826725810923205,
"recall": 0.9889787946428571
},
"eval_RANGE_END": {
"f1": 0.6790697674418604,
"number": 82,
"precision": 0.5488721804511278,
"recall": 0.8902439024390244
},
"eval_UNIT": {
"f1": 0.9572476600050595,
"number": 5755,
"precision": 0.9298820445609436,
"recall": 0.98627280625543
},
"eval_loss": 0.49086296558380127,
"eval_overall_accuracy": 0.8356434129275241,
"eval_overall_f1": 0.8581819412023411,
"eval_overall_precision": 0.832086859542085,
"eval_overall_recall": 0.8859667504889635,
"eval_runtime": 9.6791,
"eval_samples_per_second": 878.799,
"eval_steps_per_second": 27.482,
"step": 46000
},
{
"epoch": 9.21,
"learning_rate": 3.969510987923184e-06,
"loss": 0.4028,
"step": 46500
},
{
"epoch": 9.31,
"learning_rate": 3.4745594931696697e-06,
"loss": 0.4066,
"step": 47000
},
{
"epoch": 9.31,
"eval_COMMENT": {
"f1": 0.7096332785987959,
"number": 6824,
"precision": 0.6655544147843943,
"recall": 0.7599648300117233
},
"eval_NAME": {
"f1": 0.8115457483561797,
"number": 8803,
"precision": 0.7964563053702286,
"recall": 0.8272179938657276
},
"eval_QTY": {
"f1": 0.9858900396191006,
"number": 7168,
"precision": 0.9824075356697604,
"recall": 0.9893973214285714
},
"eval_RANGE_END": {
"f1": 0.6792452830188679,
"number": 82,
"precision": 0.5538461538461539,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9569838056680162,
"number": 5755,
"precision": 0.9298475659727914,
"recall": 0.9857515204170286
},
"eval_loss": 0.4892035126686096,
"eval_overall_accuracy": 0.8339610377196168,
"eval_overall_f1": 0.8575495196299372,
"eval_overall_precision": 0.8328122428830015,
"eval_overall_recall": 0.8838013411567477,
"eval_runtime": 7.0853,
"eval_samples_per_second": 1200.507,
"eval_steps_per_second": 37.542,
"step": 47000
},
{
"epoch": 9.4,
"learning_rate": 2.979607998416155e-06,
"loss": 0.4045,
"step": 47500
},
{
"epoch": 9.5,
"learning_rate": 2.484656503662641e-06,
"loss": 0.397,
"step": 48000
},
{
"epoch": 9.5,
"eval_COMMENT": {
"f1": 0.7098901098901098,
"number": 6824,
"precision": 0.6680455015511892,
"recall": 0.757327080890973
},
"eval_NAME": {
"f1": 0.8101547711836098,
"number": 8803,
"precision": 0.7944098700731521,
"recall": 0.8265364080427127
},
"eval_QTY": {
"f1": 0.9862327909887358,
"number": 7168,
"precision": 0.9830884391461048,
"recall": 0.9893973214285714
},
"eval_RANGE_END": {
"f1": 0.6857142857142857,
"number": 82,
"precision": 0.5625,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9567713610266801,
"number": 5755,
"precision": 0.9305304647725406,
"recall": 0.9845351867940921
},
"eval_loss": 0.491767019033432,
"eval_overall_accuracy": 0.8346875179230313,
"eval_overall_f1": 0.8573560839919944,
"eval_overall_precision": 0.8334102750115413,
"eval_overall_recall": 0.8827186364906399,
"eval_runtime": 8.8099,
"eval_samples_per_second": 965.502,
"eval_steps_per_second": 30.193,
"step": 48000
},
{
"epoch": 9.6,
"learning_rate": 1.989705008909127e-06,
"loss": 0.4023,
"step": 48500
},
{
"epoch": 9.7,
"learning_rate": 1.4947535141556129e-06,
"loss": 0.3987,
"step": 49000
},
{
"epoch": 9.7,
"eval_COMMENT": {
"f1": 0.7078929306794783,
"number": 6824,
"precision": 0.6657629744384198,
"recall": 0.7557151230949589
},
"eval_NAME": {
"f1": 0.8108077994428969,
"number": 8803,
"precision": 0.7955613862468569,
"recall": 0.8266500056798819
},
"eval_QTY": {
"f1": 0.9860232250886588,
"number": 7168,
"precision": 0.9829474559822543,
"recall": 0.9891183035714286
},
"eval_RANGE_END": {
"f1": 0.6857142857142857,
"number": 82,
"precision": 0.5625,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.9566759564225994,
"number": 5755,
"precision": 0.9306605323693723,
"recall": 0.9841876629018245
},
"eval_loss": 0.4935953915119171,
"eval_overall_accuracy": 0.8338845661192574,
"eval_overall_f1": 0.8569683810557741,
"eval_overall_precision": 0.83311345646438,
"eval_overall_recall": 0.8822296730930428,
"eval_runtime": 7.6552,
"eval_samples_per_second": 1111.139,
"eval_steps_per_second": 34.748,
"step": 49000
},
{
"epoch": 9.8,
"learning_rate": 9.998020194020988e-07,
"loss": 0.3986,
"step": 49500
},
{
"epoch": 9.9,
"learning_rate": 5.048505246485845e-07,
"loss": 0.4109,
"step": 50000
},
{
"epoch": 9.9,
"eval_COMMENT": {
"f1": 0.7082043875937006,
"number": 6824,
"precision": 0.6672281974860698,
"recall": 0.7545427901524033
},
"eval_NAME": {
"f1": 0.8094707520891365,
"number": 8803,
"precision": 0.794249480704056,
"recall": 0.8252868340338521
},
"eval_QTY": {
"f1": 0.986230876216968,
"number": 7168,
"precision": 0.983222407099279,
"recall": 0.9892578125
},
"eval_RANGE_END": {
"f1": 0.6889952153110047,
"number": 82,
"precision": 0.5669291338582677,
"recall": 0.8780487804878049
},
"eval_UNIT": {
"f1": 0.956595169734842,
"number": 5755,
"precision": 0.9305076392311483,
"recall": 0.9841876629018245
},
"eval_loss": 0.49291422963142395,
"eval_overall_accuracy": 0.8339228019194371,
"eval_overall_f1": 0.8567597841213808,
"eval_overall_precision": 0.8333113238692638,
"eval_overall_recall": 0.8815660799105896,
"eval_runtime": 7.4834,
"eval_samples_per_second": 1136.652,
"eval_steps_per_second": 35.545,
"step": 50000
},
{
"epoch": 10.0,
"learning_rate": 9.899029895070283e-09,
"loss": 0.4034,
"step": 50500
},
{
"epoch": 10.0,
"step": 50510,
"total_flos": 1557854363345160.0,
"train_loss": 0.46329507851359913,
"train_runtime": 1951.481,
"train_samples_per_second": 828.104,
"train_steps_per_second": 25.883
}
],
"logging_steps": 500,
"max_steps": 50510,
"num_train_epochs": 10,
"save_steps": 1000,
"total_flos": 1557854363345160.0,
"trial_name": null,
"trial_params": null
}