metaextractor / trainer_state.json
tieandrews's picture
Update Roberta v6 Model as Outlined in Final Report (#3)
f4165ec
{
"best_metric": 0.646713977167541,
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/ffossils/roberta-finetuned-v6/models/checkpoint-400",
"epoch": 14.716981132075471,
"global_step": 585,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.25,
"learning_rate": 2.0000000000000003e-06,
"loss": 2.785,
"step": 10
},
{
"epoch": 0.5,
"learning_rate": 4.000000000000001e-06,
"loss": 2.592,
"step": 20
},
{
"epoch": 0.63,
"eval_AGE_f1": 0.0,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.0,
"eval_AGE_recall": 0.0,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.013565891472868219,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.006958250497017893,
"eval_EMAIL_recall": 0.2692307692307692,
"eval_GEOG_f1": 0.0,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.0,
"eval_GEOG_recall": 0.0,
"eval_REGION_f1": 0.0,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.0,
"eval_REGION_recall": 0.0,
"eval_SITE_f1": 0.0,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.0,
"eval_SITE_recall": 0.0,
"eval_TAXA_f1": 0.0,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.0,
"eval_TAXA_recall": 0.0,
"eval_accuracy_entity": 0.8152934266033001,
"eval_accuracy_token": 0.8152934266033001,
"eval_f1_entity": 0.022789506227365072,
"eval_f1_token": 0.022789506227365072,
"eval_loss": 2.0357258319854736,
"eval_overall_accuracy": 0.8141186522133818,
"eval_overall_f1": 0.004022988505747126,
"eval_overall_precision": 0.0025371511417180137,
"eval_overall_recall": 0.009708737864077669,
"eval_precision_entity": 0.02199113535629049,
"eval_precision_token": 0.02199113535629049,
"eval_recall_entity": 0.02364802933088909,
"eval_recall_token": 0.02364802933088909,
"eval_runtime": 10.2464,
"eval_samples_per_second": 18.446,
"eval_steps_per_second": 2.342,
"step": 25
},
{
"epoch": 0.75,
"learning_rate": 6e-06,
"loss": 1.9963,
"step": 30
},
{
"epoch": 1.01,
"learning_rate": 8.000000000000001e-06,
"loss": 0.8245,
"step": 40
},
{
"epoch": 1.26,
"learning_rate": 1e-05,
"loss": 0.5512,
"step": 50
},
{
"epoch": 1.26,
"eval_AGE_f1": 0.0,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.0,
"eval_AGE_recall": 0.0,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.0,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.0,
"eval_EMAIL_recall": 0.0,
"eval_GEOG_f1": 0.0,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.0,
"eval_GEOG_recall": 0.0,
"eval_REGION_f1": 0.0,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.0,
"eval_REGION_recall": 0.0,
"eval_SITE_f1": 0.0,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.0,
"eval_SITE_recall": 0.0,
"eval_TAXA_f1": 0.0,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.0,
"eval_TAXA_recall": 0.0,
"eval_accuracy_entity": 0.9028853171000872,
"eval_accuracy_token": 0.9028853171000872,
"eval_f1_entity": 0.0,
"eval_f1_token": 0.0,
"eval_loss": 0.4787032902240753,
"eval_overall_accuracy": 0.9028853171000872,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_precision_entity": 0.0,
"eval_precision_token": 0.0,
"eval_recall_entity": 0.0,
"eval_recall_token": 0.0,
"eval_runtime": 10.1567,
"eval_samples_per_second": 18.608,
"eval_steps_per_second": 2.363,
"step": 50
},
{
"epoch": 1.51,
"learning_rate": 1.2e-05,
"loss": 0.4716,
"step": 60
},
{
"epoch": 1.76,
"learning_rate": 1.4e-05,
"loss": 0.3759,
"step": 70
},
{
"epoch": 1.89,
"eval_AGE_f1": 0.0,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.0,
"eval_AGE_recall": 0.0,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.0,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.0,
"eval_EMAIL_recall": 0.0,
"eval_GEOG_f1": 0.0,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.0,
"eval_GEOG_recall": 0.0,
"eval_REGION_f1": 0.0,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.0,
"eval_REGION_recall": 0.0,
"eval_SITE_f1": 0.0,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.0,
"eval_SITE_recall": 0.0,
"eval_TAXA_f1": 0.4575645756457565,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.44364937388193204,
"eval_TAXA_recall": 0.4723809523809524,
"eval_accuracy_entity": 0.9267723963617593,
"eval_accuracy_token": 0.9267723963617593,
"eval_f1_entity": 0.45445053510832684,
"eval_f1_token": 0.45445053510832684,
"eval_loss": 0.28952518105506897,
"eval_overall_accuracy": 0.9190651643794165,
"eval_overall_f1": 0.23732057416267943,
"eval_overall_precision": 0.38271604938271603,
"eval_overall_recall": 0.17198335644937587,
"eval_precision_entity": 0.7888536474852741,
"eval_precision_token": 0.7888536474852741,
"eval_recall_entity": 0.3191567369385884,
"eval_recall_token": 0.3191567369385884,
"eval_runtime": 10.7946,
"eval_samples_per_second": 17.509,
"eval_steps_per_second": 2.223,
"step": 75
},
{
"epoch": 2.01,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.3221,
"step": 80
},
{
"epoch": 2.26,
"learning_rate": 1.8e-05,
"loss": 0.2555,
"step": 90
},
{
"epoch": 2.52,
"learning_rate": 2e-05,
"loss": 0.2161,
"step": 100
},
{
"epoch": 2.52,
"eval_AGE_f1": 0.36414565826330536,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.3282828282828283,
"eval_AGE_recall": 0.4088050314465409,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.0,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.0,
"eval_EMAIL_recall": 0.0,
"eval_GEOG_f1": 0.058823529411764705,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.04,
"eval_GEOG_recall": 0.1111111111111111,
"eval_REGION_f1": 0.25806451612903225,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.1907356948228883,
"eval_REGION_recall": 0.39886039886039887,
"eval_SITE_f1": 0.028925619834710745,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.045454545454545456,
"eval_SITE_recall": 0.021212121212121213,
"eval_TAXA_f1": 0.6412859560067682,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.5768645357686454,
"eval_TAXA_recall": 0.7219047619047619,
"eval_accuracy_entity": 0.943005642476994,
"eval_accuracy_token": 0.943005642476994,
"eval_f1_entity": 0.654824165915239,
"eval_f1_token": 0.654824165915239,
"eval_loss": 0.20675021409988403,
"eval_overall_accuracy": 0.9366867802281911,
"eval_overall_f1": 0.3688473520249221,
"eval_overall_precision": 0.334841628959276,
"eval_overall_recall": 0.4105409153952843,
"eval_precision_entity": 0.6443655723158829,
"eval_precision_token": 0.6443655723158829,
"eval_recall_entity": 0.6656278643446379,
"eval_recall_token": 0.6656278643446379,
"eval_runtime": 11.4868,
"eval_samples_per_second": 16.454,
"eval_steps_per_second": 2.089,
"step": 100
},
{
"epoch": 2.77,
"learning_rate": 1.9587628865979382e-05,
"loss": 0.1805,
"step": 110
},
{
"epoch": 3.02,
"learning_rate": 1.9175257731958766e-05,
"loss": 0.1729,
"step": 120
},
{
"epoch": 3.14,
"eval_AGE_f1": 0.47398843930635837,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.4385026737967914,
"eval_AGE_recall": 0.5157232704402516,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.0,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.0,
"eval_EMAIL_recall": 0.0,
"eval_GEOG_f1": 0.2758620689655173,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2,
"eval_GEOG_recall": 0.4444444444444444,
"eval_REGION_f1": 0.3544813695871098,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.27414330218068533,
"eval_REGION_recall": 0.5014245014245015,
"eval_SITE_f1": 0.14779874213836475,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.15359477124183007,
"eval_SITE_recall": 0.14242424242424243,
"eval_TAXA_f1": 0.7314578005115089,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.6620370370370371,
"eval_TAXA_recall": 0.8171428571428572,
"eval_accuracy_entity": 0.9479539346042256,
"eval_accuracy_token": 0.9479539346042256,
"eval_f1_entity": 0.7052475850665739,
"eval_f1_token": 0.7052475850665739,
"eval_loss": 0.16586871445178986,
"eval_overall_accuracy": 0.9440380199711647,
"eval_overall_f1": 0.4548536209553159,
"eval_overall_precision": 0.40931780366056575,
"eval_overall_recall": 0.5117891816920943,
"eval_precision_entity": 0.6713055003313453,
"eval_precision_token": 0.6713055003313453,
"eval_recall_entity": 0.7428047662694776,
"eval_recall_token": 0.7428047662694776,
"eval_runtime": 12.6888,
"eval_samples_per_second": 14.895,
"eval_steps_per_second": 1.891,
"step": 125
},
{
"epoch": 3.27,
"learning_rate": 1.8762886597938147e-05,
"loss": 0.1471,
"step": 130
},
{
"epoch": 3.52,
"learning_rate": 1.8350515463917527e-05,
"loss": 0.1384,
"step": 140
},
{
"epoch": 3.77,
"learning_rate": 1.793814432989691e-05,
"loss": 0.1233,
"step": 150
},
{
"epoch": 3.77,
"eval_AGE_f1": 0.42245989304812837,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.3674418604651163,
"eval_AGE_recall": 0.4968553459119497,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.17543859649122806,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 1.0,
"eval_EMAIL_recall": 0.09615384615384616,
"eval_GEOG_f1": 0.3703703703703704,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2777777777777778,
"eval_GEOG_recall": 0.5555555555555556,
"eval_REGION_f1": 0.43149946062567424,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.3472222222222222,
"eval_REGION_recall": 0.5698005698005698,
"eval_SITE_f1": 0.2934472934472935,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.2768817204301075,
"eval_SITE_recall": 0.31212121212121213,
"eval_TAXA_f1": 0.7345890410958905,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.6671850699844479,
"eval_TAXA_recall": 0.8171428571428572,
"eval_accuracy_entity": 0.9522080418646873,
"eval_accuracy_token": 0.9522080418646873,
"eval_f1_entity": 0.7402282947077135,
"eval_f1_token": 0.7402282947077135,
"eval_loss": 0.14876657724380493,
"eval_overall_accuracy": 0.9501076876524092,
"eval_overall_f1": 0.5018337408312958,
"eval_overall_precision": 0.4486338797814208,
"eval_overall_recall": 0.5693481276005548,
"eval_precision_entity": 0.7006056637747585,
"eval_precision_token": 0.7006056637747585,
"eval_recall_entity": 0.7846012832263978,
"eval_recall_token": 0.7846012832263978,
"eval_runtime": 11.4316,
"eval_samples_per_second": 16.533,
"eval_steps_per_second": 2.099,
"step": 150
},
{
"epoch": 4.03,
"learning_rate": 1.752577319587629e-05,
"loss": 0.1231,
"step": 160
},
{
"epoch": 4.28,
"learning_rate": 1.7113402061855672e-05,
"loss": 0.1084,
"step": 170
},
{
"epoch": 4.4,
"eval_AGE_f1": 0.6049046321525886,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.5336538461538461,
"eval_AGE_recall": 0.6981132075471698,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.5555555555555556,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 1.0,
"eval_EMAIL_recall": 0.38461538461538464,
"eval_GEOG_f1": 0.33333333333333326,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.23809523809523808,
"eval_GEOG_recall": 0.5555555555555556,
"eval_REGION_f1": 0.4647887323943662,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.39520958083832336,
"eval_REGION_recall": 0.5641025641025641,
"eval_SITE_f1": 0.3371104815864023,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.31648936170212766,
"eval_SITE_recall": 0.3606060606060606,
"eval_TAXA_f1": 0.776173285198556,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7375643224699828,
"eval_TAXA_recall": 0.819047619047619,
"eval_accuracy_entity": 0.955144977839483,
"eval_accuracy_token": 0.955144977839483,
"eval_f1_entity": 0.7561658212349135,
"eval_f1_token": 0.7561658212349135,
"eval_loss": 0.137845978140831,
"eval_overall_accuracy": 0.9533828162546056,
"eval_overall_f1": 0.5576255131038838,
"eval_overall_precision": 0.5118840579710144,
"eval_overall_recall": 0.6123439667128987,
"eval_precision_entity": 0.7230306071249373,
"eval_precision_token": 0.7230306071249373,
"eval_recall_entity": 0.7924839596700275,
"eval_recall_token": 0.7924839596700275,
"eval_runtime": 12.8578,
"eval_samples_per_second": 14.699,
"eval_steps_per_second": 1.867,
"step": 175
},
{
"epoch": 4.53,
"learning_rate": 1.6701030927835052e-05,
"loss": 0.1,
"step": 180
},
{
"epoch": 4.78,
"learning_rate": 1.6288659793814433e-05,
"loss": 0.1068,
"step": 190
},
{
"epoch": 5.03,
"learning_rate": 1.5876288659793813e-05,
"loss": 0.0984,
"step": 200
},
{
"epoch": 5.03,
"eval_AGE_f1": 0.672316384180791,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6102564102564103,
"eval_AGE_recall": 0.7484276729559748,
"eval_ALTI_f1": 0.06060606060606061,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.058823529411764705,
"eval_ALTI_recall": 0.0625,
"eval_EMAIL_f1": 0.7826086956521738,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.9,
"eval_EMAIL_recall": 0.6923076923076923,
"eval_GEOG_f1": 0.42857142857142855,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.3157894736842105,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.44173140954495005,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.3618181818181818,
"eval_REGION_recall": 0.5669515669515669,
"eval_SITE_f1": 0.4200792602377807,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.37236533957845436,
"eval_SITE_recall": 0.4818181818181818,
"eval_TAXA_f1": 0.7944954128440367,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7663716814159292,
"eval_TAXA_recall": 0.8247619047619048,
"eval_accuracy_entity": 0.9572097328278244,
"eval_accuracy_token": 0.9572097328278244,
"eval_f1_entity": 0.7708746230073245,
"eval_f1_token": 0.7708746230073245,
"eval_loss": 0.13383713364601135,
"eval_overall_accuracy": 0.9555721685267261,
"eval_overall_f1": 0.5855606758832566,
"eval_overall_precision": 0.5256480970766685,
"eval_overall_recall": 0.6608876560332871,
"eval_precision_entity": 0.7273170731707317,
"eval_precision_token": 0.7273170731707317,
"eval_recall_entity": 0.8199816681943172,
"eval_recall_token": 0.8199816681943172,
"eval_runtime": 9.949,
"eval_samples_per_second": 18.997,
"eval_steps_per_second": 2.412,
"step": 200
},
{
"epoch": 5.28,
"learning_rate": 1.5463917525773197e-05,
"loss": 0.0887,
"step": 210
},
{
"epoch": 5.53,
"learning_rate": 1.5051546391752578e-05,
"loss": 0.0872,
"step": 220
},
{
"epoch": 5.66,
"eval_AGE_f1": 0.6319018404907976,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6167664670658682,
"eval_AGE_recall": 0.6477987421383647,
"eval_ALTI_f1": 0.07407407407407407,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.09090909090909091,
"eval_ALTI_recall": 0.0625,
"eval_EMAIL_f1": 0.9622641509433962,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.9444444444444444,
"eval_EMAIL_recall": 0.9807692307692307,
"eval_GEOG_f1": 0.3870967741935484,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2727272727272727,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.4956709956709957,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.39965095986038396,
"eval_REGION_recall": 0.6524216524216524,
"eval_SITE_f1": 0.4276048714479026,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3863080684596577,
"eval_SITE_recall": 0.47878787878787876,
"eval_TAXA_f1": 0.7708703374777975,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7221297836938436,
"eval_TAXA_recall": 0.8266666666666667,
"eval_accuracy_entity": 0.9552339758993253,
"eval_accuracy_token": 0.9552339758993253,
"eval_f1_entity": 0.7587956698240865,
"eval_f1_token": 0.7587956698240865,
"eval_loss": 0.14531326293945312,
"eval_overall_accuracy": 0.9539702034495648,
"eval_overall_f1": 0.598963098505642,
"eval_overall_precision": 0.5345672291780076,
"eval_overall_recall": 0.680998613037448,
"eval_precision_entity": 0.7043491913958235,
"eval_precision_token": 0.7043491913958235,
"eval_recall_entity": 0.8223648029330889,
"eval_recall_token": 0.8223648029330889,
"eval_runtime": 10.0713,
"eval_samples_per_second": 18.766,
"eval_steps_per_second": 2.383,
"step": 225
},
{
"epoch": 5.79,
"learning_rate": 1.4639175257731958e-05,
"loss": 0.086,
"step": 230
},
{
"epoch": 6.04,
"learning_rate": 1.4226804123711342e-05,
"loss": 0.0789,
"step": 240
},
{
"epoch": 6.29,
"learning_rate": 1.3814432989690723e-05,
"loss": 0.0713,
"step": 250
},
{
"epoch": 6.29,
"eval_AGE_f1": 0.6857142857142857,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6282722513089005,
"eval_AGE_recall": 0.7547169811320755,
"eval_ALTI_f1": 0.07142857142857144,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.08333333333333333,
"eval_ALTI_recall": 0.0625,
"eval_EMAIL_f1": 0.859504132231405,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.7536231884057971,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.4,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2857142857142857,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.49940262843488653,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.43004115226337447,
"eval_REGION_recall": 0.5954415954415955,
"eval_SITE_f1": 0.4341736694677871,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.4036458333333333,
"eval_SITE_recall": 0.4696969696969697,
"eval_TAXA_f1": 0.7922437673130194,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7688172043010753,
"eval_TAXA_recall": 0.8171428571428572,
"eval_accuracy_entity": 0.9578683184706573,
"eval_accuracy_token": 0.9578683184706573,
"eval_f1_entity": 0.768325871301905,
"eval_f1_token": 0.768325871301905,
"eval_loss": 0.1395871937274933,
"eval_overall_accuracy": 0.9568181413645183,
"eval_overall_f1": 0.6146063863420803,
"eval_overall_precision": 0.5647879140034864,
"eval_overall_recall": 0.6740638002773925,
"eval_precision_entity": 0.7371967654986523,
"eval_precision_token": 0.7371967654986523,
"eval_recall_entity": 0.8021998166819432,
"eval_recall_token": 0.8021998166819432,
"eval_runtime": 12.126,
"eval_samples_per_second": 15.586,
"eval_steps_per_second": 1.979,
"step": 250
},
{
"epoch": 6.54,
"learning_rate": 1.3402061855670103e-05,
"loss": 0.0761,
"step": 260
},
{
"epoch": 6.79,
"learning_rate": 1.2989690721649485e-05,
"loss": 0.0715,
"step": 270
},
{
"epoch": 6.92,
"eval_AGE_f1": 0.7211267605633802,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6530612244897959,
"eval_AGE_recall": 0.8050314465408805,
"eval_ALTI_f1": 0.13333333333333333,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.14285714285714285,
"eval_ALTI_recall": 0.125,
"eval_EMAIL_f1": 0.8455284552845529,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.7323943661971831,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.3870967741935484,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2727272727272727,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5431818181818181,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.45179584120982985,
"eval_REGION_recall": 0.6809116809116809,
"eval_SITE_f1": 0.45517241379310347,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.4177215189873418,
"eval_SITE_recall": 0.5,
"eval_TAXA_f1": 0.7958412098298677,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7898686679174484,
"eval_TAXA_recall": 0.8019047619047619,
"eval_accuracy_entity": 0.9568893398123921,
"eval_accuracy_token": 0.9568893398123921,
"eval_f1_entity": 0.7651905252317198,
"eval_f1_token": 0.7651905252317198,
"eval_loss": 0.14375238120555878,
"eval_overall_accuracy": 0.9557857638703476,
"eval_overall_f1": 0.6327295440349782,
"eval_overall_precision": 0.5755681818181818,
"eval_overall_recall": 0.70249653259362,
"eval_precision_entity": 0.7193803453283847,
"eval_precision_token": 0.7193803453283847,
"eval_recall_entity": 0.8172318973418882,
"eval_recall_token": 0.8172318973418882,
"eval_runtime": 12.8036,
"eval_samples_per_second": 14.761,
"eval_steps_per_second": 1.874,
"step": 275
},
{
"epoch": 7.04,
"learning_rate": 1.2577319587628866e-05,
"loss": 0.0779,
"step": 280
},
{
"epoch": 7.3,
"learning_rate": 1.2164948453608248e-05,
"loss": 0.0652,
"step": 290
},
{
"epoch": 7.55,
"learning_rate": 1.175257731958763e-05,
"loss": 0.0651,
"step": 300
},
{
"epoch": 7.55,
"eval_AGE_f1": 0.7202380952380952,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6836158192090396,
"eval_AGE_recall": 0.7610062893081762,
"eval_ALTI_f1": 0.06896551724137931,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.07692307692307693,
"eval_ALTI_recall": 0.0625,
"eval_EMAIL_f1": 0.7428571428571429,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5909090909090909,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.42857142857142855,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.3157894736842105,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5471478463329453,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4625984251968504,
"eval_REGION_recall": 0.6695156695156695,
"eval_SITE_f1": 0.4159544159544159,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3924731182795699,
"eval_SITE_recall": 0.44242424242424244,
"eval_TAXA_f1": 0.8036697247706422,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7752212389380531,
"eval_TAXA_recall": 0.8342857142857143,
"eval_accuracy_entity": 0.9569427386482975,
"eval_accuracy_token": 0.9569427386482975,
"eval_f1_entity": 0.7655160390516038,
"eval_f1_token": 0.7655160390516038,
"eval_loss": 0.13883507251739502,
"eval_overall_accuracy": 0.9559281607660953,
"eval_overall_f1": 0.6275125628140703,
"eval_overall_precision": 0.5734787600459242,
"eval_overall_recall": 0.6927877947295423,
"eval_precision_entity": 0.7297656639521356,
"eval_precision_token": 0.7297656639521356,
"eval_recall_entity": 0.8049495875343722,
"eval_recall_token": 0.8049495875343722,
"eval_runtime": 10.0268,
"eval_samples_per_second": 18.85,
"eval_steps_per_second": 2.394,
"step": 300
},
{
"epoch": 7.8,
"learning_rate": 1.134020618556701e-05,
"loss": 0.0616,
"step": 310
},
{
"epoch": 8.05,
"learning_rate": 1.0927835051546391e-05,
"loss": 0.0629,
"step": 320
},
{
"epoch": 8.18,
"eval_AGE_f1": 0.702857142857143,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.643979057591623,
"eval_AGE_recall": 0.7735849056603774,
"eval_ALTI_f1": 0.07692307692307693,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.1,
"eval_ALTI_recall": 0.0625,
"eval_EMAIL_f1": 0.787878787878788,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.65,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.41379310344827586,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.3,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5244040862656072,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4358490566037736,
"eval_REGION_recall": 0.6581196581196581,
"eval_SITE_f1": 0.39538239538239534,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3774104683195592,
"eval_SITE_recall": 0.41515151515151516,
"eval_TAXA_f1": 0.7945701357466064,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.756896551724138,
"eval_TAXA_recall": 0.8361904761904762,
"eval_accuracy_entity": 0.9557857638703476,
"eval_accuracy_token": 0.9557857638703476,
"eval_f1_entity": 0.7590018133149123,
"eval_f1_token": 0.7590018133149123,
"eval_loss": 0.14412528276443481,
"eval_overall_accuracy": 0.9548245848240509,
"eval_overall_f1": 0.6150497512437811,
"eval_overall_precision": 0.5574971815107103,
"eval_overall_recall": 0.6858529819694869,
"eval_precision_entity": 0.7174338883447601,
"eval_precision_token": 0.7174338883447601,
"eval_recall_entity": 0.8056828597616865,
"eval_recall_token": 0.8056828597616865,
"eval_runtime": 10.4306,
"eval_samples_per_second": 18.12,
"eval_steps_per_second": 2.301,
"step": 325
},
{
"epoch": 8.3,
"learning_rate": 1.0515463917525775e-05,
"loss": 0.0556,
"step": 330
},
{
"epoch": 8.55,
"learning_rate": 1.0103092783505156e-05,
"loss": 0.0609,
"step": 340
},
{
"epoch": 8.81,
"learning_rate": 9.690721649484536e-06,
"loss": 0.0558,
"step": 350
},
{
"epoch": 8.81,
"eval_AGE_f1": 0.6822157434402333,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6358695652173914,
"eval_AGE_recall": 0.7358490566037735,
"eval_ALTI_f1": 0.12121212121212122,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.11764705882352941,
"eval_ALTI_recall": 0.125,
"eval_EMAIL_f1": 0.7482014388489209,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5977011494252874,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.37500000000000006,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2608695652173913,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5439429928741093,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4663951120162933,
"eval_REGION_recall": 0.6524216524216524,
"eval_SITE_f1": 0.4425531914893617,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.416,
"eval_SITE_recall": 0.4727272727272727,
"eval_TAXA_f1": 0.7924865831842576,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7470489038785835,
"eval_TAXA_recall": 0.8438095238095238,
"eval_accuracy_entity": 0.9551983766753884,
"eval_accuracy_token": 0.9551983766753884,
"eval_f1_entity": 0.7571195044308698,
"eval_f1_token": 0.7571195044308698,
"eval_loss": 0.14811000227928162,
"eval_overall_accuracy": 0.9542371976290916,
"eval_overall_f1": 0.6257783312577834,
"eval_overall_precision": 0.5677966101694916,
"eval_overall_recall": 0.6969486823855756,
"eval_precision_entity": 0.7133592736705577,
"eval_precision_token": 0.7133592736705577,
"eval_recall_entity": 0.8065994500458296,
"eval_recall_token": 0.8065994500458296,
"eval_runtime": 11.3308,
"eval_samples_per_second": 16.68,
"eval_steps_per_second": 2.118,
"step": 350
},
{
"epoch": 9.06,
"learning_rate": 9.278350515463918e-06,
"loss": 0.0597,
"step": 360
},
{
"epoch": 9.31,
"learning_rate": 8.865979381443299e-06,
"loss": 0.056,
"step": 370
},
{
"epoch": 9.43,
"eval_AGE_f1": 0.7079646017699115,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6666666666666666,
"eval_AGE_recall": 0.7547169811320755,
"eval_ALTI_f1": 0.15384615384615385,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.2,
"eval_ALTI_recall": 0.125,
"eval_EMAIL_f1": 0.6666666666666666,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.4,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2857142857142857,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5555555555555556,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4613935969868173,
"eval_REGION_recall": 0.698005698005698,
"eval_SITE_f1": 0.47632311977715874,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.44072164948453607,
"eval_SITE_recall": 0.5181818181818182,
"eval_TAXA_f1": 0.8040109389243391,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7709790209790209,
"eval_TAXA_recall": 0.84,
"eval_accuracy_entity": 0.9559993592139692,
"eval_accuracy_token": 0.9559993592139692,
"eval_f1_entity": 0.7634735597229263,
"eval_f1_token": 0.7634735597229263,
"eval_loss": 0.15191707015037537,
"eval_overall_accuracy": 0.9548779836599562,
"eval_overall_f1": 0.6385467980295567,
"eval_overall_precision": 0.5741971207087486,
"eval_overall_recall": 0.7191400832177531,
"eval_precision_entity": 0.7079743067523109,
"eval_precision_token": 0.7079743067523109,
"eval_recall_entity": 0.8284142988084326,
"eval_recall_token": 0.8284142988084326,
"eval_runtime": 9.9604,
"eval_samples_per_second": 18.975,
"eval_steps_per_second": 2.41,
"step": 375
},
{
"epoch": 9.56,
"learning_rate": 8.453608247422681e-06,
"loss": 0.0579,
"step": 380
},
{
"epoch": 9.81,
"learning_rate": 8.041237113402063e-06,
"loss": 0.0499,
"step": 390
},
{
"epoch": 10.06,
"learning_rate": 7.628865979381444e-06,
"loss": 0.0529,
"step": 400
},
{
"epoch": 10.06,
"eval_AGE_f1": 0.7025495750708216,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6391752577319587,
"eval_AGE_recall": 0.779874213836478,
"eval_ALTI_f1": 0.3225806451612903,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.3333333333333333,
"eval_ALTI_recall": 0.3125,
"eval_EMAIL_f1": 0.7819548872180451,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.6419753086419753,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.4,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2857142857142857,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5511811023622047,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.45539033457249073,
"eval_REGION_recall": 0.698005698005698,
"eval_SITE_f1": 0.4936530324400564,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.46174142480211083,
"eval_SITE_recall": 0.5303030303030303,
"eval_TAXA_f1": 0.8047445255474452,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7723292469352014,
"eval_TAXA_recall": 0.84,
"eval_accuracy_entity": 0.9571207347679821,
"eval_accuracy_token": 0.9571207347679821,
"eval_f1_entity": 0.7682700421940929,
"eval_f1_token": 0.7682700421940929,
"eval_loss": 0.154266357421875,
"eval_overall_accuracy": 0.9559993592139692,
"eval_overall_f1": 0.646713977167541,
"eval_overall_precision": 0.5825458588104503,
"eval_overall_recall": 0.7267683772538142,
"eval_precision_entity": 0.7118060985144644,
"eval_precision_token": 0.7118060985144644,
"eval_recall_entity": 0.8344637946837764,
"eval_recall_token": 0.8344637946837764,
"eval_runtime": 10.1935,
"eval_samples_per_second": 18.541,
"eval_steps_per_second": 2.354,
"step": 400
},
{
"epoch": 10.31,
"learning_rate": 7.216494845360825e-06,
"loss": 0.0504,
"step": 410
},
{
"epoch": 10.57,
"learning_rate": 6.804123711340207e-06,
"loss": 0.0527,
"step": 420
},
{
"epoch": 10.69,
"eval_AGE_f1": 0.6966292134831462,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6294416243654822,
"eval_AGE_recall": 0.779874213836478,
"eval_ALTI_f1": 0.2962962962962963,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.36363636363636365,
"eval_ALTI_recall": 0.25,
"eval_EMAIL_f1": 0.7938931297709924,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.6582278481012658,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.37500000000000006,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2608695652173913,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5187878787878788,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.45147679324894513,
"eval_REGION_recall": 0.6096866096866097,
"eval_SITE_f1": 0.36940836940836935,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3526170798898072,
"eval_SITE_recall": 0.3878787878787879,
"eval_TAXA_f1": 0.7914735866543096,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7707581227436823,
"eval_TAXA_recall": 0.8133333333333334,
"eval_accuracy_entity": 0.9547355867642086,
"eval_accuracy_token": 0.9547355867642086,
"eval_f1_entity": 0.7530343007915568,
"eval_f1_token": 0.7530343007915568,
"eval_loss": 0.15111711621284485,
"eval_overall_accuracy": 0.9537744077179118,
"eval_overall_f1": 0.6076996500159084,
"eval_overall_precision": 0.5614344503233392,
"eval_overall_recall": 0.6622746185852982,
"eval_precision_entity": 0.7237531699070161,
"eval_precision_token": 0.7237531699070161,
"eval_recall_entity": 0.7847846012832264,
"eval_recall_token": 0.7847846012832264,
"eval_runtime": 10.0406,
"eval_samples_per_second": 18.824,
"eval_steps_per_second": 2.39,
"step": 425
},
{
"epoch": 10.82,
"learning_rate": 6.391752577319588e-06,
"loss": 0.0483,
"step": 430
},
{
"epoch": 11.07,
"learning_rate": 5.979381443298969e-06,
"loss": 0.0487,
"step": 440
},
{
"epoch": 11.32,
"learning_rate": 5.567010309278351e-06,
"loss": 0.0508,
"step": 450
},
{
"epoch": 11.32,
"eval_AGE_f1": 0.7130434782608696,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6612903225806451,
"eval_AGE_recall": 0.7735849056603774,
"eval_ALTI_f1": 0.21428571428571427,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.25,
"eval_ALTI_recall": 0.1875,
"eval_EMAIL_f1": 0.7428571428571429,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5909090909090909,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.4,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2857142857142857,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.525030525030525,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4594017094017094,
"eval_REGION_recall": 0.6125356125356125,
"eval_SITE_f1": 0.38904899135446686,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3708791208791209,
"eval_SITE_recall": 0.4090909090909091,
"eval_TAXA_f1": 0.7802197802197802,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7513227513227513,
"eval_TAXA_recall": 0.8114285714285714,
"eval_accuracy_entity": 0.9558925615421584,
"eval_accuracy_token": 0.9558925615421584,
"eval_f1_entity": 0.7576967438559136,
"eval_f1_token": 0.7576967438559136,
"eval_loss": 0.15142428874969482,
"eval_overall_accuracy": 0.9549135828838932,
"eval_overall_f1": 0.6099110546378654,
"eval_overall_precision": 0.5627198124267292,
"eval_overall_recall": 0.665742024965326,
"eval_precision_entity": 0.734181568088033,
"eval_precision_token": 0.734181568088033,
"eval_recall_entity": 0.7827681026581118,
"eval_recall_token": 0.7827681026581118,
"eval_runtime": 9.85,
"eval_samples_per_second": 19.188,
"eval_steps_per_second": 2.437,
"step": 450
},
{
"epoch": 11.57,
"learning_rate": 5.154639175257732e-06,
"loss": 0.0464,
"step": 460
},
{
"epoch": 11.82,
"learning_rate": 4.742268041237113e-06,
"loss": 0.0459,
"step": 470
},
{
"epoch": 11.95,
"eval_AGE_f1": 0.6956521739130435,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6451612903225806,
"eval_AGE_recall": 0.7547169811320755,
"eval_ALTI_f1": 0.13793103448275862,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.15384615384615385,
"eval_ALTI_recall": 0.125,
"eval_EMAIL_f1": 0.732394366197183,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5777777777777777,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.3870967741935484,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2727272727272727,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5467980295566502,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.48156182212581344,
"eval_REGION_recall": 0.6324786324786325,
"eval_SITE_f1": 0.41466854724964736,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.38786279683377306,
"eval_SITE_recall": 0.44545454545454544,
"eval_TAXA_f1": 0.7944700460829494,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7696428571428572,
"eval_TAXA_recall": 0.820952380952381,
"eval_accuracy_entity": 0.9552161762873569,
"eval_accuracy_token": 0.9552161762873569,
"eval_f1_entity": 0.7573407684935088,
"eval_f1_token": 0.7573407684935088,
"eval_loss": 0.15560036897659302,
"eval_overall_accuracy": 0.9541481995692493,
"eval_overall_f1": 0.6216301934665398,
"eval_overall_precision": 0.5727644652250146,
"eval_overall_recall": 0.6796116504854369,
"eval_precision_entity": 0.7216871471272003,
"eval_precision_token": 0.7216871471272003,
"eval_recall_entity": 0.7967002749770853,
"eval_recall_token": 0.7967002749770853,
"eval_runtime": 10.1795,
"eval_samples_per_second": 18.567,
"eval_steps_per_second": 2.358,
"step": 475
},
{
"epoch": 12.08,
"learning_rate": 4.329896907216495e-06,
"loss": 0.0418,
"step": 480
},
{
"epoch": 12.33,
"learning_rate": 3.917525773195877e-06,
"loss": 0.045,
"step": 490
},
{
"epoch": 12.58,
"learning_rate": 3.5051546391752577e-06,
"loss": 0.0484,
"step": 500
},
{
"epoch": 12.58,
"eval_AGE_f1": 0.7134502923976608,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6666666666666666,
"eval_AGE_recall": 0.7672955974842768,
"eval_ALTI_f1": 0.20689655172413793,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.23076923076923078,
"eval_ALTI_recall": 0.1875,
"eval_EMAIL_f1": 0.7172413793103448,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5591397849462365,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.3870967741935484,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.2727272727272727,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.560093348891482,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4743083003952569,
"eval_REGION_recall": 0.6837606837606838,
"eval_SITE_f1": 0.44044321329639885,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.40561224489795916,
"eval_SITE_recall": 0.4818181818181818,
"eval_TAXA_f1": 0.7956600361663652,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7573149741824441,
"eval_TAXA_recall": 0.8380952380952381,
"eval_accuracy_entity": 0.9561061568857799,
"eval_accuracy_token": 0.9561061568857799,
"eval_f1_entity": 0.7653287788215201,
"eval_f1_token": 0.7653287788215201,
"eval_loss": 0.15589508414268494,
"eval_overall_accuracy": 0.9551271782275147,
"eval_overall_f1": 0.6324257425742574,
"eval_overall_precision": 0.5709497206703911,
"eval_overall_recall": 0.7087378640776699,
"eval_precision_entity": 0.71638689048761,
"eval_precision_token": 0.71638689048761,
"eval_recall_entity": 0.821448212648946,
"eval_recall_token": 0.821448212648946,
"eval_runtime": 12.7467,
"eval_samples_per_second": 14.827,
"eval_steps_per_second": 1.883,
"step": 500
},
{
"epoch": 12.83,
"learning_rate": 3.0927835051546395e-06,
"loss": 0.0461,
"step": 510
},
{
"epoch": 13.08,
"learning_rate": 2.680412371134021e-06,
"loss": 0.0386,
"step": 520
},
{
"epoch": 13.21,
"eval_AGE_f1": 0.7055393586005833,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.657608695652174,
"eval_AGE_recall": 0.7610062893081762,
"eval_ALTI_f1": 0.0,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.0,
"eval_ALTI_recall": 0.0,
"eval_EMAIL_f1": 0.6933333333333334,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5306122448979592,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.41379310344827586,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.3,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.558858501783591,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.47959183673469385,
"eval_REGION_recall": 0.6695156695156695,
"eval_SITE_f1": 0.42758620689655175,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3924050632911392,
"eval_SITE_recall": 0.4696969696969697,
"eval_TAXA_f1": 0.7948951686417502,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7622377622377622,
"eval_TAXA_recall": 0.8304761904761905,
"eval_accuracy_entity": 0.9557679642583792,
"eval_accuracy_token": 0.9557679642583792,
"eval_f1_entity": 0.7621009268795055,
"eval_f1_token": 0.7621009268795055,
"eval_loss": 0.15739484131336212,
"eval_overall_accuracy": 0.9548245848240509,
"eval_overall_f1": 0.6255835667600373,
"eval_overall_precision": 0.567476002258611,
"eval_overall_recall": 0.6969486823855756,
"eval_precision_entity": 0.716475714055188,
"eval_precision_token": 0.716475714055188,
"eval_recall_entity": 0.8139321723189734,
"eval_recall_token": 0.8139321723189734,
"eval_runtime": 10.5618,
"eval_samples_per_second": 17.895,
"eval_steps_per_second": 2.272,
"step": 525
},
{
"epoch": 13.33,
"learning_rate": 2.268041237113402e-06,
"loss": 0.0405,
"step": 530
},
{
"epoch": 13.58,
"learning_rate": 1.8556701030927837e-06,
"loss": 0.0438,
"step": 540
},
{
"epoch": 13.84,
"learning_rate": 1.4432989690721649e-06,
"loss": 0.0464,
"step": 550
},
{
"epoch": 13.84,
"eval_AGE_f1": 0.7045454545454547,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6424870466321243,
"eval_AGE_recall": 0.779874213836478,
"eval_ALTI_f1": 0.20689655172413793,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.23076923076923078,
"eval_ALTI_recall": 0.1875,
"eval_EMAIL_f1": 0.7027027027027027,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5416666666666666,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.36363636363636365,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.25,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.5545023696682464,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.4746450304259635,
"eval_REGION_recall": 0.6666666666666666,
"eval_SITE_f1": 0.41408450704225347,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3868421052631579,
"eval_SITE_recall": 0.44545454545454544,
"eval_TAXA_f1": 0.7978241160471441,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7612456747404844,
"eval_TAXA_recall": 0.8380952380952381,
"eval_accuracy_entity": 0.955144977839483,
"eval_accuracy_token": 0.955144977839483,
"eval_f1_entity": 0.7586857682079438,
"eval_f1_token": 0.7586857682079438,
"eval_loss": 0.1583557277917862,
"eval_overall_accuracy": 0.9541481995692493,
"eval_overall_f1": 0.6250388319353837,
"eval_overall_precision": 0.566122678671919,
"eval_overall_recall": 0.6976421636615812,
"eval_precision_entity": 0.7129958078039342,
"eval_precision_token": 0.7129958078039342,
"eval_recall_entity": 0.8106324472960587,
"eval_recall_token": 0.8106324472960587,
"eval_runtime": 12.1366,
"eval_samples_per_second": 15.573,
"eval_steps_per_second": 1.977,
"step": 550
},
{
"epoch": 14.09,
"learning_rate": 1.0309278350515464e-06,
"loss": 0.0405,
"step": 560
},
{
"epoch": 14.34,
"learning_rate": 6.185567010309279e-07,
"loss": 0.0448,
"step": 570
},
{
"epoch": 14.47,
"eval_AGE_f1": 0.7163323782234957,
"eval_AGE_number": 159,
"eval_AGE_precision": 0.6578947368421053,
"eval_AGE_recall": 0.7861635220125787,
"eval_ALTI_f1": 0.20689655172413793,
"eval_ALTI_number": 16,
"eval_ALTI_precision": 0.23076923076923078,
"eval_ALTI_recall": 0.1875,
"eval_EMAIL_f1": 0.732394366197183,
"eval_EMAIL_number": 52,
"eval_EMAIL_precision": 0.5777777777777777,
"eval_EMAIL_recall": 1.0,
"eval_GEOG_f1": 0.36363636363636365,
"eval_GEOG_number": 9,
"eval_GEOG_precision": 0.25,
"eval_GEOG_recall": 0.6666666666666666,
"eval_REGION_f1": 0.56,
"eval_REGION_number": 351,
"eval_REGION_precision": 0.47695390781563124,
"eval_REGION_recall": 0.6780626780626781,
"eval_SITE_f1": 0.41310541310541316,
"eval_SITE_number": 330,
"eval_SITE_precision": 0.3897849462365591,
"eval_SITE_recall": 0.4393939393939394,
"eval_TAXA_f1": 0.7981735159817351,
"eval_TAXA_number": 525,
"eval_TAXA_precision": 0.7666666666666667,
"eval_TAXA_recall": 0.8323809523809523,
"eval_accuracy_entity": 0.9550203805557039,
"eval_accuracy_token": 0.9550203805557039,
"eval_f1_entity": 0.7577735784229513,
"eval_f1_token": 0.7577735784229513,
"eval_loss": 0.1591457575559616,
"eval_overall_accuracy": 0.9540236022854702,
"eval_overall_f1": 0.62875,
"eval_overall_precision": 0.5722411831626849,
"eval_overall_recall": 0.6976421636615812,
"eval_precision_entity": 0.7129465007273315,
"eval_precision_token": 0.7129465007273315,
"eval_recall_entity": 0.8086159486709441,
"eval_recall_token": 0.8086159486709441,
"eval_runtime": 10.2385,
"eval_samples_per_second": 18.46,
"eval_steps_per_second": 2.344,
"step": 575
},
{
"epoch": 14.59,
"learning_rate": 2.061855670103093e-07,
"loss": 0.0413,
"step": 580
},
{
"epoch": 14.72,
"step": 585,
"total_flos": 4125504727794096.0,
"train_loss": 0.23708797097206116,
"train_runtime": 1988.5186,
"train_samples_per_second": 9.572,
"train_steps_per_second": 0.294
}
],
"max_steps": 585,
"num_train_epochs": 15,
"total_flos": 4125504727794096.0,
"trial_name": null,
"trial_params": null
}