bert-base-uncased-coqa / trainer_state.json
WillHeld's picture
End of training
93e5915
{
"best_metric": 57.56979472888117,
"best_model_checkpoint": "./results_train_sae/bert-base-uncased/coqa/checkpoint-28000",
"epoch": 9.999931351685316,
"global_step": 72830,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 2.2883295194508013e-06,
"loss": 5.9079,
"step": 500
},
{
"epoch": 0.07,
"eval_HasAns_exact": 0.0,
"eval_HasAns_f1": 0.058699242323848086,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 98.46153846153847,
"eval_NoAns_f1": 98.46153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 0.8142302392584242,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 0.859924915535542,
"eval_best_f1_thresh": 0.0,
"eval_exact": 0.80170362019291,
"eval_f1": 0.859924915535542,
"eval_total": 7983,
"step": 500
},
{
"epoch": 0.14,
"learning_rate": 4.576659038901603e-06,
"loss": 4.7938,
"step": 1000
},
{
"epoch": 0.14,
"eval_HasAns_exact": 6.870421823692852,
"eval_HasAns_f1": 27.70107501407698,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 1.5384615384615385,
"eval_NoAns_f1": 1.5384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 6.827007390705249,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 27.48805110377818,
"eval_best_f1_thresh": 0.0,
"eval_exact": 6.827007390705249,
"eval_f1": 27.48805110377822,
"eval_total": 7983,
"step": 1000
},
{
"epoch": 0.21,
"learning_rate": 6.8649885583524035e-06,
"loss": 3.991,
"step": 1500
},
{
"epoch": 0.21,
"eval_HasAns_exact": 11.896943672644607,
"eval_HasAns_f1": 37.05032211892552,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 11.862708255041964,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 36.81128028781815,
"eval_best_f1_thresh": 0.0,
"eval_exact": 11.862708255041964,
"eval_f1": 36.81128028781814,
"eval_total": 7983,
"step": 1500
},
{
"epoch": 0.27,
"learning_rate": 9.153318077803205e-06,
"loss": 3.7176,
"step": 2000
},
{
"epoch": 0.27,
"eval_HasAns_exact": 14.52386966405658,
"eval_HasAns_f1": 42.09036402930084,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 14.418138544406865,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 41.76017817662584,
"eval_best_f1_thresh": 0.0,
"eval_exact": 14.430665163472378,
"eval_f1": 41.77270479569133,
"eval_total": 7983,
"step": 2000
},
{
"epoch": 0.34,
"learning_rate": 1.1441647597254006e-05,
"loss": 3.4929,
"step": 2500
},
{
"epoch": 0.34,
"eval_HasAns_exact": 15.635261429653953,
"eval_HasAns_f1": 42.60135406380397,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 15.658273831892773,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 42.40480038546909,
"eval_best_f1_thresh": 0.0,
"eval_exact": 15.658273831892773,
"eval_f1": 42.404800385469095,
"eval_total": 7983,
"step": 2500
},
{
"epoch": 0.41,
"learning_rate": 1.3729977116704807e-05,
"loss": 3.3632,
"step": 3000
},
{
"epoch": 0.41,
"eval_HasAns_exact": 17.70649153826724,
"eval_HasAns_f1": 46.86612402307515,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 1.5384615384615385,
"eval_NoAns_f1": 1.5384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 17.574846548916447,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 46.49705248837645,
"eval_best_f1_thresh": 0.0,
"eval_exact": 17.574846548916447,
"eval_f1": 46.49705248837643,
"eval_total": 7983,
"step": 3000
},
{
"epoch": 0.48,
"learning_rate": 1.6018306636155606e-05,
"loss": 3.2348,
"step": 3500
},
{
"epoch": 0.48,
"eval_HasAns_exact": 18.615812073756,
"eval_HasAns_f1": 48.88254968548444,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 18.464236502567957,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 48.484533184224716,
"eval_best_f1_thresh": 0.0,
"eval_exact": 18.464236502567957,
"eval_f1": 48.4845331842247,
"eval_total": 7983,
"step": 3500
},
{
"epoch": 0.55,
"learning_rate": 1.830663615560641e-05,
"loss": 3.0918,
"step": 4000
},
{
"epoch": 0.55,
"eval_HasAns_exact": 19.790351098762315,
"eval_HasAns_f1": 50.19536205413491,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 19.629212075660778,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 49.7866562375849,
"eval_best_f1_thresh": 0.0,
"eval_exact": 19.629212075660778,
"eval_f1": 49.7866562375849,
"eval_total": 7983,
"step": 4000
},
{
"epoch": 0.62,
"learning_rate": 1.996202161846334e-05,
"loss": 2.9685,
"step": 4500
},
{
"epoch": 0.62,
"eval_HasAns_exact": 20.661783278605707,
"eval_HasAns_f1": 51.24202719367006,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 20.49354879118126,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 50.8247991130502,
"eval_best_f1_thresh": 0.0,
"eval_exact": 20.49354879118126,
"eval_f1": 50.824799113050176,
"eval_total": 7983,
"step": 4500
},
{
"epoch": 0.69,
"learning_rate": 1.98159509202454e-05,
"loss": 2.8876,
"step": 5000
},
{
"epoch": 0.69,
"eval_HasAns_exact": 21.987875726193483,
"eval_HasAns_f1": 53.06234486539824,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.80884379306025,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 52.63029520784457,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.80884379306025,
"eval_f1": 52.630295207844576,
"eval_total": 7983,
"step": 5000
},
{
"epoch": 0.76,
"learning_rate": 1.9669880222027462e-05,
"loss": 2.8069,
"step": 5500
},
{
"epoch": 0.76,
"eval_HasAns_exact": 22.139429148774944,
"eval_HasAns_f1": 52.947930590885036,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.959163221846424,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 52.5168125289525,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.959163221846424,
"eval_f1": 52.51681252895249,
"eval_total": 7983,
"step": 5500
},
{
"epoch": 0.82,
"learning_rate": 1.9523809523809524e-05,
"loss": 2.753,
"step": 6000
},
{
"epoch": 0.82,
"eval_HasAns_exact": 22.467794897701438,
"eval_HasAns_f1": 52.74131115227161,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 22.284855317549795,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 52.31187544828844,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.284855317549795,
"eval_f1": 52.31187544828843,
"eval_total": 7983,
"step": 6000
},
{
"epoch": 0.89,
"learning_rate": 1.937773882559159e-05,
"loss": 2.7304,
"step": 6500
},
{
"epoch": 0.89,
"eval_HasAns_exact": 24.05910583480677,
"eval_HasAns_f1": 55.094001124088884,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 23.863209319804586,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.64540910691915,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.863209319804586,
"eval_f1": 54.645409106919175,
"eval_total": 7983,
"step": 6500
},
{
"epoch": 0.96,
"learning_rate": 1.923166812737365e-05,
"loss": 2.6887,
"step": 7000
},
{
"epoch": 0.96,
"eval_HasAns_exact": 23.503409952008084,
"eval_HasAns_f1": 54.51083938244222,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 1.5384615384615385,
"eval_NoAns_f1": 1.5384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 23.324564699987473,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.07952226358227,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.324564699987473,
"eval_f1": 54.07952226358229,
"eval_total": 7983,
"step": 7000
},
{
"epoch": 1.03,
"learning_rate": 1.9085597429155715e-05,
"loss": 2.5921,
"step": 7500
},
{
"epoch": 1.03,
"eval_HasAns_exact": 22.467794897701438,
"eval_HasAns_f1": 53.881350612333,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 22.284855317549795,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 53.44263236232651,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.284855317549795,
"eval_f1": 53.44263236232653,
"eval_total": 7983,
"step": 7500
},
{
"epoch": 1.1,
"learning_rate": 1.8939526730937776e-05,
"loss": 2.4825,
"step": 8000
},
{
"epoch": 1.1,
"eval_HasAns_exact": 23.137155847436222,
"eval_HasAns_f1": 53.99581621835903,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 22.948766128022047,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 53.55616595477474,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.948766128022047,
"eval_f1": 53.55616595477475,
"eval_total": 7983,
"step": 8000
},
{
"epoch": 1.17,
"learning_rate": 1.8793456032719838e-05,
"loss": 2.4281,
"step": 8500
},
{
"epoch": 1.17,
"eval_HasAns_exact": 23.553927759535235,
"eval_HasAns_f1": 54.02861374681815,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 23.387197795315043,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 53.61374967397043,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.387197795315043,
"eval_f1": 53.61374967397047,
"eval_total": 7983,
"step": 8500
},
{
"epoch": 1.24,
"learning_rate": 1.86473853345019e-05,
"loss": 2.4263,
"step": 9000
},
{
"epoch": 1.24,
"eval_HasAns_exact": 24.109623642333922,
"eval_HasAns_f1": 54.76436323474705,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 23.91331579606664,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.3184552289524,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.91331579606664,
"eval_f1": 54.318455228952416,
"eval_total": 7983,
"step": 9000
},
{
"epoch": 1.3,
"learning_rate": 1.8501314636283964e-05,
"loss": 2.4629,
"step": 9500
},
{
"epoch": 1.3,
"eval_HasAns_exact": 24.475877746905784,
"eval_HasAns_f1": 55.617867547126586,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 24.276587748966556,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.16501005112716,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.276587748966556,
"eval_f1": 55.16501005112718,
"eval_total": 7983,
"step": 9500
},
{
"epoch": 1.37,
"learning_rate": 1.8355243938066025e-05,
"loss": 2.4136,
"step": 10000
},
{
"epoch": 1.37,
"eval_HasAns_exact": 24.475877746905784,
"eval_HasAns_f1": 56.18918648654074,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 24.276587748966556,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.731677138974,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.276587748966556,
"eval_f1": 55.73167713897402,
"eval_total": 7983,
"step": 10000
},
{
"epoch": 1.44,
"learning_rate": 1.8209173239848087e-05,
"loss": 2.4286,
"step": 10500
},
{
"epoch": 1.44,
"eval_HasAns_exact": 24.299065420560748,
"eval_HasAns_f1": 56.63451506748617,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 24.101215082049354,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.17337971994934,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.101215082049354,
"eval_f1": 56.17337971994933,
"eval_total": 7983,
"step": 10500
},
{
"epoch": 1.51,
"learning_rate": 1.806310254163015e-05,
"loss": 2.421,
"step": 11000
},
{
"epoch": 1.51,
"eval_HasAns_exact": 24.791614043950492,
"eval_HasAns_f1": 56.09913988305096,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.627333082800952,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.67994357935579,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.627333082800952,
"eval_f1": 55.679943579355815,
"eval_total": 7983,
"step": 11000
},
{
"epoch": 1.58,
"learning_rate": 1.7917031843412213e-05,
"loss": 2.4138,
"step": 11500
},
{
"epoch": 1.58,
"eval_HasAns_exact": 23.869664056579943,
"eval_HasAns_f1": 55.71886205295582,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 10.76923076923077,
"eval_NoAns_f1": 10.76923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 23.762996367280472,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.35286856260852,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.762996367280472,
"eval_f1": 55.35286856260858,
"eval_total": 7983,
"step": 11500
},
{
"epoch": 1.65,
"learning_rate": 1.7770961145194278e-05,
"loss": 2.3941,
"step": 12000
},
{
"epoch": 1.65,
"eval_HasAns_exact": 24.917908562768375,
"eval_HasAns_f1": 55.98821830578535,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.752599273456095,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.569925159114156,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.752599273456095,
"eval_f1": 55.56992515911417,
"eval_total": 7983,
"step": 12000
},
{
"epoch": 1.72,
"learning_rate": 1.7624890446976336e-05,
"loss": 2.3891,
"step": 12500
},
{
"epoch": 1.72,
"eval_HasAns_exact": 24.65269007325082,
"eval_HasAns_f1": 56.420675481209294,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 24.489540273080294,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.998861137443946,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.50206689214581,
"eval_f1": 56.01138775650948,
"eval_total": 7983,
"step": 12500
},
{
"epoch": 1.78,
"learning_rate": 1.74788197487584e-05,
"loss": 2.3541,
"step": 13000
},
{
"epoch": 1.78,
"eval_HasAns_exact": 24.65269007325082,
"eval_HasAns_f1": 56.3286384049731,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.489540273080294,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.90757345491381,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.489540273080294,
"eval_f1": 55.907573454913816,
"eval_total": 7983,
"step": 13000
},
{
"epoch": 1.85,
"learning_rate": 1.7332749050540462e-05,
"loss": 2.3694,
"step": 13500
},
{
"epoch": 1.85,
"eval_HasAns_exact": 25.34730992674918,
"eval_HasAns_f1": 56.89667335733098,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 25.140924464487036,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.43340343772345,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.140924464487036,
"eval_f1": 56.433403437723506,
"eval_total": 7983,
"step": 13500
},
{
"epoch": 1.92,
"learning_rate": 1.7186678352322527e-05,
"loss": 2.3684,
"step": 14000
},
{
"epoch": 1.92,
"eval_HasAns_exact": 25.082091437231625,
"eval_HasAns_f1": 56.242751844782845,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 24.902918702242264,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.809859590002546,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.902918702242264,
"eval_f1": 55.809859590002574,
"eval_total": 7983,
"step": 14000
},
{
"epoch": 1.99,
"learning_rate": 1.7040607654104588e-05,
"loss": 2.3991,
"step": 14500
},
{
"epoch": 1.99,
"eval_HasAns_exact": 23.99595857539783,
"eval_HasAns_f1": 56.43417395738433,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 23.825629462608042,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.99972308587861,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.825629462608042,
"eval_f1": 55.999723085878635,
"eval_total": 7983,
"step": 14500
},
{
"epoch": 2.06,
"learning_rate": 1.689453695588665e-05,
"loss": 2.0923,
"step": 15000
},
{
"epoch": 2.06,
"eval_HasAns_exact": 24.981055822177318,
"eval_HasAns_f1": 56.740647572969316,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.815232368783665,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.316227919675676,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.815232368783665,
"eval_f1": 56.31622791967569,
"eval_total": 7983,
"step": 15000
},
{
"epoch": 2.13,
"learning_rate": 1.6748466257668714e-05,
"loss": 2.0467,
"step": 15500
},
{
"epoch": 2.13,
"eval_HasAns_exact": 25.284162667340237,
"eval_HasAns_f1": 56.17685433436681,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 25.115871226356006,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.75702525610878,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.115871226356006,
"eval_f1": 55.75702525610878,
"eval_total": 7983,
"step": 15500
},
{
"epoch": 2.2,
"learning_rate": 1.6602395559450776e-05,
"loss": 2.0438,
"step": 16000
},
{
"epoch": 2.2,
"eval_HasAns_exact": 24.324324324324323,
"eval_HasAns_f1": 56.49055815994823,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 0.0,
"eval_NoAns_f1": 0.0,
"eval_NoAns_total": 65,
"eval_best_exact": 24.126268320180383,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.03059495308402,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.126268320180383,
"eval_f1": 56.03059495308406,
"eval_total": 7983,
"step": 16000
},
{
"epoch": 2.27,
"learning_rate": 1.6456324861232837e-05,
"loss": 2.0502,
"step": 16500
},
{
"epoch": 2.27,
"eval_HasAns_exact": 23.89492296034352,
"eval_HasAns_f1": 55.95219524867858,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 1.5384615384615385,
"eval_NoAns_f1": 1.5384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 23.712889891018413,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.50914217450042,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.712889891018413,
"eval_f1": 55.50914217450044,
"eval_total": 7983,
"step": 16500
},
{
"epoch": 2.33,
"learning_rate": 1.63102541630149e-05,
"loss": 2.0676,
"step": 17000
},
{
"epoch": 2.33,
"eval_HasAns_exact": 24.463248295023995,
"eval_HasAns_f1": 55.285627746177674,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 24.314167606163096,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.8855819233665,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.314167606163096,
"eval_f1": 54.88558192336651,
"eval_total": 7983,
"step": 17000
},
{
"epoch": 2.4,
"learning_rate": 1.6164183464796963e-05,
"loss": 2.0655,
"step": 17500
},
{
"epoch": 2.4,
"eval_HasAns_exact": 25.372568830512755,
"eval_HasAns_f1": 57.0197153609346,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 25.228610797945635,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.61807669145432,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.228610797945635,
"eval_f1": 56.61807669145436,
"eval_total": 7983,
"step": 17500
},
{
"epoch": 2.47,
"learning_rate": 1.6018112766579025e-05,
"loss": 2.0479,
"step": 18000
},
{
"epoch": 2.47,
"eval_HasAns_exact": 25.71356403132104,
"eval_HasAns_f1": 57.821942508234095,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 25.529249655517976,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.37619200553649,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.529249655517976,
"eval_f1": 57.37619200553646,
"eval_total": 7983,
"step": 18000
},
{
"epoch": 2.54,
"learning_rate": 1.587204206836109e-05,
"loss": 2.0603,
"step": 18500
},
{
"epoch": 2.54,
"eval_HasAns_exact": 25.018944177822682,
"eval_HasAns_f1": 57.38397521872463,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.85281222598021,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.954317397201734,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.85281222598021,
"eval_f1": 56.95431739720177,
"eval_total": 7983,
"step": 18500
},
{
"epoch": 2.61,
"learning_rate": 1.572597137014315e-05,
"loss": 2.0788,
"step": 19000
},
{
"epoch": 2.61,
"eval_HasAns_exact": 24.715837332659763,
"eval_HasAns_f1": 57.37643493713972,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 3.076923076923077,
"eval_NoAns_f1": 3.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 24.539646749342353,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.93431189180411,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.539646749342353,
"eval_f1": 56.93431189180413,
"eval_total": 7983,
"step": 19000
},
{
"epoch": 2.68,
"learning_rate": 1.5579900671925213e-05,
"loss": 2.076,
"step": 19500
},
{
"epoch": 2.68,
"eval_HasAns_exact": 24.917908562768375,
"eval_HasAns_f1": 57.176560884370765,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.752599273456095,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.748591893078725,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.752599273456095,
"eval_f1": 56.74859189307877,
"eval_total": 7983,
"step": 19500
},
{
"epoch": 2.75,
"learning_rate": 1.5433829973707274e-05,
"loss": 2.0729,
"step": 20000
},
{
"epoch": 2.75,
"eval_HasAns_exact": 25.663046223793888,
"eval_HasAns_f1": 57.259618778706425,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 25.491669798321432,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.83097350492259,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.491669798321432,
"eval_f1": 56.830973504922646,
"eval_total": 7983,
"step": 20000
},
{
"epoch": 2.81,
"learning_rate": 1.528775927548934e-05,
"loss": 2.0671,
"step": 20500
},
{
"epoch": 2.81,
"eval_HasAns_exact": 24.66531952513261,
"eval_HasAns_f1": 57.27218980931721,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 1.5384615384615385,
"eval_NoAns_f1": 1.5384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 24.477013654014783,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.81838894026976,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.477013654014783,
"eval_f1": 56.818388940269784,
"eval_total": 7983,
"step": 20500
},
{
"epoch": 2.88,
"learning_rate": 1.51416885772714e-05,
"loss": 2.0876,
"step": 21000
},
{
"epoch": 2.88,
"eval_HasAns_exact": 24.842131851477646,
"eval_HasAns_f1": 57.122549033702775,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 24.702492797194036,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.72007306136267,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.702492797194036,
"eval_f1": 56.720073061362704,
"eval_total": 7983,
"step": 21000
},
{
"epoch": 2.95,
"learning_rate": 1.4995617879053463e-05,
"loss": 2.0692,
"step": 21500
},
{
"epoch": 2.95,
"eval_HasAns_exact": 25.63778732003031,
"eval_HasAns_f1": 57.346401166726885,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 25.504196417386947,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.95462914169401,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.504196417386947,
"eval_f1": 56.95462914169406,
"eval_total": 7983,
"step": 21500
},
{
"epoch": 3.02,
"learning_rate": 1.4849547180835526e-05,
"loss": 1.9856,
"step": 22000
},
{
"epoch": 3.02,
"eval_HasAns_exact": 24.51376610255115,
"eval_HasAns_f1": 56.65859501004218,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 24.37680070149067,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.259896691658966,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.37680070149067,
"eval_f1": 56.25989669165901,
"eval_total": 7983,
"step": 22000
},
{
"epoch": 3.09,
"learning_rate": 1.470347648261759e-05,
"loss": 1.7772,
"step": 22500
},
{
"epoch": 3.09,
"eval_HasAns_exact": 25.208385956049508,
"eval_HasAns_f1": 57.541934442000205,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 25.078291369159462,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.14857032591221,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.078291369159462,
"eval_f1": 57.14857032591224,
"eval_total": 7983,
"step": 22500
},
{
"epoch": 3.16,
"learning_rate": 1.455740578439965e-05,
"loss": 1.7533,
"step": 23000
},
{
"epoch": 3.16,
"eval_HasAns_exact": 25.852488002020714,
"eval_HasAns_f1": 57.54889352900813,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 25.679569084304145,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.117892892732826,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.679569084304145,
"eval_f1": 57.11789289273286,
"eval_total": 7983,
"step": 23000
},
{
"epoch": 3.23,
"learning_rate": 1.4411335086181712e-05,
"loss": 1.7728,
"step": 23500
},
{
"epoch": 3.23,
"eval_HasAns_exact": 25.599898964384945,
"eval_HasAns_f1": 57.81775981872567,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 25.441563322059377,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.397096610881825,
"eval_best_f1_thresh": 0.0,
"eval_exact": 25.441563322059377,
"eval_f1": 57.39709661088185,
"eval_total": 7983,
"step": 23500
},
{
"epoch": 3.3,
"learning_rate": 1.4265264387963775e-05,
"loss": 1.7535,
"step": 24000
},
{
"epoch": 3.3,
"eval_HasAns_exact": 24.86739075524122,
"eval_HasAns_f1": 57.557703123488565,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.702492797194036,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.126630756831055,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.702492797194036,
"eval_f1": 57.12663075683106,
"eval_total": 7983,
"step": 24000
},
{
"epoch": 3.36,
"learning_rate": 1.4119193689745838e-05,
"loss": 1.764,
"step": 24500
},
{
"epoch": 3.36,
"eval_HasAns_exact": 24.943167466531953,
"eval_HasAns_f1": 56.947380755274594,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 24.80270574971815,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.54633105602702,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.80270574971815,
"eval_f1": 56.546331056027086,
"eval_total": 7983,
"step": 24500
},
{
"epoch": 3.43,
"learning_rate": 1.3973122991527902e-05,
"loss": 1.799,
"step": 25000
},
{
"epoch": 3.43,
"eval_HasAns_exact": 24.564283910078302,
"eval_HasAns_f1": 55.87293948312867,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 29.23076923076923,
"eval_NoAns_f1": 29.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 24.602279844669923,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.65601087653921,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.602279844669923,
"eval_f1": 55.65601087653924,
"eval_total": 7983,
"step": 25000
},
{
"epoch": 3.5,
"learning_rate": 1.3827052293309963e-05,
"loss": 1.8033,
"step": 25500
},
{
"epoch": 3.5,
"eval_HasAns_exact": 24.943167466531953,
"eval_HasAns_f1": 56.693149175873096,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 10.76923076923077,
"eval_NoAns_f1": 10.76923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 24.82775898784918,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.319222745153795,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.82775898784918,
"eval_f1": 56.31922274515385,
"eval_total": 7983,
"step": 25500
},
{
"epoch": 3.57,
"learning_rate": 1.3680981595092026e-05,
"loss": 1.7901,
"step": 26000
},
{
"epoch": 3.57,
"eval_HasAns_exact": 24.488507198787573,
"eval_HasAns_f1": 56.74255621835055,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 7.6923076923076925,
"eval_NoAns_f1": 7.6923076923076925,
"eval_NoAns_total": 65,
"eval_best_exact": 24.35174746335964,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.34317426242004,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.35174746335964,
"eval_f1": 56.3431742624201,
"eval_total": 7983,
"step": 26000
},
{
"epoch": 3.64,
"learning_rate": 1.3534910896874088e-05,
"loss": 1.7752,
"step": 26500
},
{
"epoch": 3.64,
"eval_HasAns_exact": 25.09472088911341,
"eval_HasAns_f1": 57.45911652355072,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 24.965551797569837,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.066426735998284,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.965551797569837,
"eval_f1": 57.0664267359983,
"eval_total": 7983,
"step": 26500
},
{
"epoch": 3.71,
"learning_rate": 1.338884019865615e-05,
"loss": 1.8101,
"step": 27000
},
{
"epoch": 3.71,
"eval_HasAns_exact": 24.854761303359435,
"eval_HasAns_f1": 56.59464728748924,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 24.77765251158712,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.259102746127944,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.77765251158712,
"eval_f1": 56.25910274612799,
"eval_total": 7983,
"step": 27000
},
{
"epoch": 3.78,
"learning_rate": 1.3242769500438212e-05,
"loss": 1.779,
"step": 27500
},
{
"epoch": 3.78,
"eval_HasAns_exact": 25.157868148522354,
"eval_HasAns_f1": 57.443891564398484,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 24.990605035700863,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.013745885870875,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.990605035700863,
"eval_f1": 57.013745885870904,
"eval_total": 7983,
"step": 27500
},
{
"epoch": 3.84,
"learning_rate": 1.3096698802220275e-05,
"loss": 1.7697,
"step": 28000
},
{
"epoch": 3.84,
"eval_HasAns_exact": 24.981055822177318,
"eval_HasAns_f1": 57.991875640396366,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 24.82775898784918,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 57.56979472888116,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.82775898784918,
"eval_f1": 57.56979472888117,
"eval_total": 7983,
"step": 28000
},
{
"epoch": 3.91,
"learning_rate": 1.2950628104002338e-05,
"loss": 1.8014,
"step": 28500
},
{
"epoch": 3.91,
"eval_HasAns_exact": 23.958070219752464,
"eval_HasAns_f1": 56.83764415249211,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 4.615384615384615,
"eval_NoAns_f1": 4.615384615384615,
"eval_NoAns_total": 65,
"eval_best_exact": 23.800576224477012,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.41243472371692,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.800576224477012,
"eval_f1": 56.41243472371696,
"eval_total": 7983,
"step": 28500
},
{
"epoch": 3.98,
"learning_rate": 1.2804557405784401e-05,
"loss": 1.7952,
"step": 29000
},
{
"epoch": 3.98,
"eval_HasAns_exact": 24.501136650669363,
"eval_HasAns_f1": 56.987466541223796,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 24.35174746335964,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.5735638323199,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.35174746335964,
"eval_f1": 56.57356383231995,
"eval_total": 7983,
"step": 29000
},
{
"epoch": 4.05,
"learning_rate": 1.2658486707566464e-05,
"loss": 1.5768,
"step": 29500
},
{
"epoch": 4.05,
"eval_HasAns_exact": 24.172770901742865,
"eval_HasAns_f1": 56.488669720521,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 24.101215082049354,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.15398808055679,
"eval_best_f1_thresh": 0.0,
"eval_exact": 24.101215082049354,
"eval_f1": 56.15398808055684,
"eval_total": 7983,
"step": 29500
},
{
"epoch": 4.12,
"learning_rate": 1.2512416009348524e-05,
"loss": 1.5075,
"step": 30000
},
{
"epoch": 4.12,
"eval_HasAns_exact": 23.869664056579943,
"eval_HasAns_f1": 55.37001243988256,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 23.775522986345987,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.01938600763996,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.775522986345987,
"eval_f1": 55.01938600763998,
"eval_total": 7983,
"step": 30000
},
{
"epoch": 4.19,
"learning_rate": 1.2366345311130587e-05,
"loss": 1.5191,
"step": 30500
},
{
"epoch": 4.19,
"eval_HasAns_exact": 23.30133872189947,
"eval_HasAns_f1": 55.78659265350773,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 23.22435174746336,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.4451009182606,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.22435174746336,
"eval_f1": 55.4451009182606,
"eval_total": 7983,
"step": 30500
},
{
"epoch": 4.26,
"learning_rate": 1.222027461291265e-05,
"loss": 1.5108,
"step": 31000
},
{
"epoch": 4.26,
"eval_HasAns_exact": 23.250820914372316,
"eval_HasAns_f1": 56.43743176160512,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 10.76923076923077,
"eval_NoAns_f1": 10.76923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 23.149192033070275,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.065587459399865,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.149192033070275,
"eval_f1": 56.065587459399865,
"eval_total": 7983,
"step": 31000
},
{
"epoch": 4.33,
"learning_rate": 1.2074203914694714e-05,
"loss": 1.5025,
"step": 31500
},
{
"epoch": 4.33,
"eval_HasAns_exact": 23.45289214448093,
"eval_HasAns_f1": 56.04845888253506,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.399724414380557,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.729888191395766,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.399724414380557,
"eval_f1": 55.72988819139578,
"eval_total": 7983,
"step": 31500
},
{
"epoch": 4.39,
"learning_rate": 1.1928133216476777e-05,
"loss": 1.5335,
"step": 32000
},
{
"epoch": 4.39,
"eval_HasAns_exact": 22.85930790603688,
"eval_HasAns_f1": 56.68438606813033,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 22.77339346110485,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.32305760834969,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.77339346110485,
"eval_f1": 56.323057608349735,
"eval_total": 7983,
"step": 32000
},
{
"epoch": 4.46,
"learning_rate": 1.1782062518258838e-05,
"loss": 1.5225,
"step": 32500
},
{
"epoch": 4.46,
"eval_HasAns_exact": 23.60444556706239,
"eval_HasAns_f1": 56.20113671315002,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 6.153846153846154,
"eval_NoAns_f1": 6.153846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 23.46235750970813,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.793636539486585,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.46235750970813,
"eval_f1": 55.793636539486634,
"eval_total": 7983,
"step": 32500
},
{
"epoch": 4.53,
"learning_rate": 1.1635991820040901e-05,
"loss": 1.5258,
"step": 33000
},
{
"epoch": 4.53,
"eval_HasAns_exact": 23.68022227835312,
"eval_HasAns_f1": 56.10398795615236,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.562570462232244,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.722332035176514,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.562570462232244,
"eval_f1": 55.72233203517653,
"eval_total": 7983,
"step": 33000
},
{
"epoch": 4.6,
"learning_rate": 1.1489921121822963e-05,
"loss": 1.5243,
"step": 33500
},
{
"epoch": 4.6,
"eval_HasAns_exact": 23.124526395554433,
"eval_HasAns_f1": 55.16381098253084,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 23.04897908054616,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.827390123973345,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.04897908054616,
"eval_f1": 54.82739012397335,
"eval_total": 7983,
"step": 33500
},
{
"epoch": 4.67,
"learning_rate": 1.1343850423605026e-05,
"loss": 1.5106,
"step": 34000
},
{
"epoch": 4.67,
"eval_HasAns_exact": 23.857034604698157,
"eval_HasAns_f1": 55.75167317754203,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 23.775522986345987,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.41046576722756,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.775522986345987,
"eval_f1": 55.41046576722758,
"eval_total": 7983,
"step": 34000
},
{
"epoch": 4.74,
"learning_rate": 1.1197779725387087e-05,
"loss": 1.5087,
"step": 34500
},
{
"epoch": 4.74,
"eval_HasAns_exact": 23.617075018944178,
"eval_HasAns_f1": 56.55795709995034,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 23.5249906050357,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.19765806305982,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.5249906050357,
"eval_f1": 56.197658063059876,
"eval_total": 7983,
"step": 34500
},
{
"epoch": 4.81,
"learning_rate": 1.105170902716915e-05,
"loss": 1.5146,
"step": 35000
},
{
"epoch": 4.81,
"eval_HasAns_exact": 23.654963374589542,
"eval_HasAns_f1": 56.11957102159652,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.600150319428785,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.80042131391719,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.600150319428785,
"eval_f1": 55.80042131391721,
"eval_total": 7983,
"step": 35000
},
{
"epoch": 4.87,
"learning_rate": 1.0905638328951213e-05,
"loss": 1.5457,
"step": 35500
},
{
"epoch": 4.87,
"eval_HasAns_exact": 23.187673654963376,
"eval_HasAns_f1": 55.30196544515009,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 23.174245271201304,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.02705278650863,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.174245271201304,
"eval_f1": 55.027052786508634,
"eval_total": 7983,
"step": 35500
},
{
"epoch": 4.94,
"learning_rate": 1.0759567630733276e-05,
"loss": 1.5391,
"step": 36000
},
{
"epoch": 4.94,
"eval_HasAns_exact": 22.909825713564032,
"eval_HasAns_f1": 54.75304453221414,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 22.83602655643242,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.419968258307854,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.83602655643242,
"eval_f1": 54.41996825830788,
"eval_total": 7983,
"step": 36000
},
{
"epoch": 5.01,
"learning_rate": 1.061349693251534e-05,
"loss": 1.4678,
"step": 36500
},
{
"epoch": 5.01,
"eval_HasAns_exact": 23.263450366254105,
"eval_HasAns_f1": 55.457692051771524,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 23.19929850933233,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.13140494374632,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.19929850933233,
"eval_f1": 55.13140494374634,
"eval_total": 7983,
"step": 36500
},
{
"epoch": 5.08,
"learning_rate": 1.04674262342974e-05,
"loss": 1.231,
"step": 37000
},
{
"epoch": 5.08,
"eval_HasAns_exact": 23.07400858802728,
"eval_HasAns_f1": 55.804051165907055,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 23.04897908054616,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.51252375443468,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.04897908054616,
"eval_f1": 55.512523754434696,
"eval_total": 7983,
"step": 37000
},
{
"epoch": 5.15,
"learning_rate": 1.0321355536079462e-05,
"loss": 1.2651,
"step": 37500
},
{
"epoch": 5.15,
"eval_HasAns_exact": 24.033846931043193,
"eval_HasAns_f1": 56.78984223580061,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.975948891394214,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.46523497721016,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.975948891394214,
"eval_f1": 56.46523497721018,
"eval_total": 7983,
"step": 37500
},
{
"epoch": 5.22,
"learning_rate": 1.0175284837861525e-05,
"loss": 1.2697,
"step": 38000
},
{
"epoch": 5.22,
"eval_HasAns_exact": 23.54129830765345,
"eval_HasAns_f1": 56.15134431131498,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.487410747839156,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.83193589590276,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.487410747839156,
"eval_f1": 55.831935895902795,
"eval_total": 7983,
"step": 38000
},
{
"epoch": 5.29,
"learning_rate": 1.0029214139643589e-05,
"loss": 1.2678,
"step": 38500
},
{
"epoch": 5.29,
"eval_HasAns_exact": 22.972972972972972,
"eval_HasAns_f1": 56.30865181101293,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 22.861079794563448,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.925329455041975,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.861079794563448,
"eval_f1": 55.925329455042025,
"eval_total": 7983,
"step": 38500
},
{
"epoch": 5.35,
"learning_rate": 9.883143441425652e-06,
"loss": 1.2719,
"step": 39000
},
{
"epoch": 5.35,
"eval_HasAns_exact": 22.98560242485476,
"eval_HasAns_f1": 56.43712830994619,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 22.936239508956533,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.115392954798146,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.936239508956533,
"eval_f1": 56.11539295479819,
"eval_total": 7983,
"step": 39000
},
{
"epoch": 5.42,
"learning_rate": 9.737072743207713e-06,
"loss": 1.2461,
"step": 39500
},
{
"epoch": 5.42,
"eval_HasAns_exact": 21.94998737054812,
"eval_HasAns_f1": 54.461077183587264,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.934109983715395,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.180484672384274,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.934109983715395,
"eval_f1": 54.18048467238429,
"eval_total": 7983,
"step": 39500
},
{
"epoch": 5.49,
"learning_rate": 9.591002044989776e-06,
"loss": 1.2682,
"step": 40000
},
{
"epoch": 5.49,
"eval_HasAns_exact": 22.480424349583227,
"eval_HasAns_f1": 56.09513335441032,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 9.23076923076923,
"eval_NoAns_f1": 9.23076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 22.36001503194288,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.701022911213904,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.372541651008394,
"eval_f1": 55.713549530279444,
"eval_total": 7983,
"step": 40000
},
{
"epoch": 5.56,
"learning_rate": 9.44493134677184e-06,
"loss": 1.2697,
"step": 40500
},
{
"epoch": 5.56,
"eval_HasAns_exact": 21.735286688557718,
"eval_HasAns_f1": 53.78512964065436,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 26.153846153846153,
"eval_NoAns_f1": 26.153846153846153,
"eval_NoAns_total": 65,
"eval_best_exact": 21.77126393586371,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 53.56014737500954,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.77126393586371,
"eval_f1": 53.56014737500955,
"eval_total": 7983,
"step": 40500
},
{
"epoch": 5.63,
"learning_rate": 9.2988606485539e-06,
"loss": 1.2917,
"step": 41000
},
{
"epoch": 5.63,
"eval_HasAns_exact": 23.023490780500126,
"eval_HasAns_f1": 55.033207325250956,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 23.011399223349617,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.760482976492185,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.011399223349617,
"eval_f1": 54.76048297649218,
"eval_total": 7983,
"step": 41000
},
{
"epoch": 5.7,
"learning_rate": 9.152789950335964e-06,
"loss": 1.2778,
"step": 41500
},
{
"epoch": 5.7,
"eval_HasAns_exact": 22.480424349583227,
"eval_HasAns_f1": 55.70683691098,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 22.39759488913942,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.3534679520405,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.39759488913942,
"eval_f1": 55.35346795204054,
"eval_total": 7983,
"step": 41500
},
{
"epoch": 5.77,
"learning_rate": 9.006719252118025e-06,
"loss": 1.2687,
"step": 42000
},
{
"epoch": 5.77,
"eval_HasAns_exact": 22.796160646627936,
"eval_HasAns_f1": 56.24362857300818,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.760866842039334,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.9359953702967,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.760866842039334,
"eval_f1": 55.93599537029674,
"eval_total": 7983,
"step": 42000
},
{
"epoch": 5.84,
"learning_rate": 8.860648553900088e-06,
"loss": 1.2824,
"step": 42500
},
{
"epoch": 5.84,
"eval_HasAns_exact": 22.745642839100782,
"eval_HasAns_f1": 56.39484118651382,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 10.76923076923077,
"eval_NoAns_f1": 10.76923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 22.648127270449706,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.02334366964999,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.648127270449706,
"eval_f1": 56.023343669650046,
"eval_total": 7983,
"step": 42500
},
{
"epoch": 5.9,
"learning_rate": 8.714577855682151e-06,
"loss": 1.2765,
"step": 43000
},
{
"epoch": 5.9,
"eval_HasAns_exact": 23.08663803990907,
"eval_HasAns_f1": 56.275076616780346,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 23.02392584241513,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.94213411645579,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.02392584241513,
"eval_f1": 55.94213411645581,
"eval_total": 7983,
"step": 43000
},
{
"epoch": 5.97,
"learning_rate": 8.568507157464213e-06,
"loss": 1.2842,
"step": 43500
},
{
"epoch": 5.97,
"eval_HasAns_exact": 22.935084617327608,
"eval_HasAns_f1": 56.49077118373285,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 22.886133032694477,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.16859905208523,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.886133032694477,
"eval_f1": 56.16859905208528,
"eval_total": 7983,
"step": 43500
},
{
"epoch": 6.04,
"learning_rate": 8.422436459246276e-06,
"loss": 1.1443,
"step": 44000
},
{
"epoch": 6.04,
"eval_HasAns_exact": 22.417277090174288,
"eval_HasAns_f1": 55.25309346308609,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 23.076923076923077,
"eval_NoAns_f1": 23.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 22.42264812727045,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.9911053539666,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.42264812727045,
"eval_f1": 54.99110535396661,
"eval_total": 7983,
"step": 44000
},
{
"epoch": 6.11,
"learning_rate": 8.276365761028339e-06,
"loss": 1.0544,
"step": 44500
},
{
"epoch": 6.11,
"eval_HasAns_exact": 23.21293255872695,
"eval_HasAns_f1": 56.57201194681735,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 23.149192033070275,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.236651709244576,
"eval_best_f1_thresh": 0.0,
"eval_exact": 23.16171865213579,
"eval_f1": 56.24917832831013,
"eval_total": 7983,
"step": 44500
},
{
"epoch": 6.18,
"learning_rate": 8.1302950628104e-06,
"loss": 1.0672,
"step": 45000
},
{
"epoch": 6.18,
"eval_HasAns_exact": 22.354129830765345,
"eval_HasAns_f1": 55.7700117261907,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 22.297381936615306,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.441181616933214,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.297381936615306,
"eval_f1": 55.44118161693323,
"eval_total": 7983,
"step": 45000
},
{
"epoch": 6.25,
"learning_rate": 7.984224364592464e-06,
"loss": 1.0696,
"step": 45500
},
{
"epoch": 6.25,
"eval_HasAns_exact": 23.07400858802728,
"eval_HasAns_f1": 56.442304320306086,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 22.98634598521859,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.08294696331998,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.98634598521859,
"eval_f1": 56.082946963320026,
"eval_total": 7983,
"step": 45500
},
{
"epoch": 6.32,
"learning_rate": 7.838153666374527e-06,
"loss": 1.0671,
"step": 46000
},
{
"epoch": 6.32,
"eval_HasAns_exact": 22.202576408183884,
"eval_HasAns_f1": 55.34797695561554,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 22.197168984091192,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.072689657342316,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.197168984091192,
"eval_f1": 55.07268965734232,
"eval_total": 7983,
"step": 46000
},
{
"epoch": 6.38,
"learning_rate": 7.69208296815659e-06,
"loss": 1.0649,
"step": 46500
},
{
"epoch": 6.38,
"eval_HasAns_exact": 22.32887092700177,
"eval_HasAns_f1": 55.65813462809328,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 22.30990855568082,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.36779531319585,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.30990855568082,
"eval_f1": 55.36779531319583,
"eval_total": 7983,
"step": 46500
},
{
"epoch": 6.45,
"learning_rate": 7.54601226993865e-06,
"loss": 1.0704,
"step": 47000
},
{
"epoch": 6.45,
"eval_HasAns_exact": 22.682495579691842,
"eval_HasAns_f1": 56.39872408814156,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 22.598020794187647,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.03972157458405,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.598020794187647,
"eval_f1": 56.03972157458409,
"eval_total": 7983,
"step": 47000
},
{
"epoch": 6.52,
"learning_rate": 7.3999415717207134e-06,
"loss": 1.0793,
"step": 47500
},
{
"epoch": 6.52,
"eval_HasAns_exact": 22.063652437484212,
"eval_HasAns_f1": 55.758375206459505,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.03432293623951,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.45469308339549,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.03432293623951,
"eval_f1": 55.454693083395476,
"eval_total": 7983,
"step": 47500
},
{
"epoch": 6.59,
"learning_rate": 7.2538708735027766e-06,
"loss": 1.0882,
"step": 48000
},
{
"epoch": 6.59,
"eval_HasAns_exact": 22.85930790603688,
"eval_HasAns_f1": 56.577537520045155,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 22.785920080170364,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.229605672518765,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.785920080170364,
"eval_f1": 56.229605672518794,
"eval_total": 7983,
"step": 48000
},
{
"epoch": 6.66,
"learning_rate": 7.107800175284838e-06,
"loss": 1.0902,
"step": 48500
},
{
"epoch": 6.66,
"eval_HasAns_exact": 22.139429148774944,
"eval_HasAns_f1": 56.283972169058366,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 22.084429412501567,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.95095723845719,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.084429412501567,
"eval_f1": 55.950957238457235,
"eval_total": 7983,
"step": 48500
},
{
"epoch": 6.73,
"learning_rate": 6.961729477066901e-06,
"loss": 1.0719,
"step": 49000
},
{
"epoch": 6.73,
"eval_HasAns_exact": 22.455165445819652,
"eval_HasAns_f1": 55.93362321999497,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.410121508204934,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.61598755554552,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.42264812727045,
"eval_f1": 55.6285141746111,
"eval_total": 7983,
"step": 49000
},
{
"epoch": 6.8,
"learning_rate": 6.815658778848963e-06,
"loss": 1.0736,
"step": 49500
},
{
"epoch": 6.8,
"eval_HasAns_exact": 21.71002778479414,
"eval_HasAns_f1": 55.39234728917103,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.671050983339597,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.079118857028206,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.671050983339597,
"eval_f1": 55.07911885702822,
"eval_total": 7983,
"step": 49500
},
{
"epoch": 6.87,
"learning_rate": 6.6695880806310264e-06,
"loss": 1.099,
"step": 50000
},
{
"epoch": 6.87,
"eval_HasAns_exact": 22.240464763829248,
"eval_HasAns_f1": 55.81572714282118,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 22.234748841287736,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.53663128107956,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.234748841287736,
"eval_f1": 55.53663128107958,
"eval_total": 7983,
"step": 50000
},
{
"epoch": 6.93,
"learning_rate": 6.523517382413088e-06,
"loss": 1.0901,
"step": 50500
},
{
"epoch": 6.93,
"eval_HasAns_exact": 21.987875726193483,
"eval_HasAns_f1": 54.90813130105857,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.934109983715395,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.5863188828488,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.934109983715395,
"eval_f1": 54.58631888284879,
"eval_total": 7983,
"step": 50500
},
{
"epoch": 7.0,
"learning_rate": 6.377446684195151e-06,
"loss": 1.0659,
"step": 51000
},
{
"epoch": 7.0,
"eval_HasAns_exact": 21.811063399848447,
"eval_HasAns_f1": 54.90414620994612,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 21.80884379306025,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.63247271581528,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.80884379306025,
"eval_f1": 54.63247271581526,
"eval_total": 7983,
"step": 51000
},
{
"epoch": 7.07,
"learning_rate": 6.231375985977214e-06,
"loss": 0.9032,
"step": 51500
},
{
"epoch": 7.07,
"eval_HasAns_exact": 22.15205860065673,
"eval_HasAns_f1": 55.72255495660219,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 22.09695603156708,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.39411125471326,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.09695603156708,
"eval_f1": 55.39411125471329,
"eval_total": 7983,
"step": 51500
},
{
"epoch": 7.14,
"learning_rate": 6.0853052877592755e-06,
"loss": 0.9125,
"step": 52000
},
{
"epoch": 7.14,
"eval_HasAns_exact": 22.278353119474616,
"eval_HasAns_f1": 55.7348659358302,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.24727546035325,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.43137523235669,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.24727546035325,
"eval_f1": 55.43137523235669,
"eval_total": 7983,
"step": 52000
},
{
"epoch": 7.21,
"learning_rate": 5.939234589541339e-06,
"loss": 0.8917,
"step": 52500
},
{
"epoch": 7.21,
"eval_HasAns_exact": 22.75827229098257,
"eval_HasAns_f1": 56.48355048657508,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 22.68570712764625,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.13638390989616,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.68570712764625,
"eval_f1": 56.13638390989625,
"eval_total": 7983,
"step": 52500
},
{
"epoch": 7.28,
"learning_rate": 5.793163891323401e-06,
"loss": 0.9111,
"step": 53000
},
{
"epoch": 7.28,
"eval_HasAns_exact": 21.71002778479414,
"eval_HasAns_f1": 55.32799628852263,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.671050983339597,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.015291821686354,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.671050983339597,
"eval_f1": 55.01529182168635,
"eval_total": 7983,
"step": 53000
},
{
"epoch": 7.35,
"learning_rate": 5.647093193105464e-06,
"loss": 0.929,
"step": 53500
},
{
"epoch": 7.35,
"eval_HasAns_exact": 21.92472846678454,
"eval_HasAns_f1": 55.97435992895805,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.871476888387825,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.643865954840265,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.871476888387825,
"eval_f1": 55.6438659548403,
"eval_total": 7983,
"step": 53500
},
{
"epoch": 7.41,
"learning_rate": 5.501022494887525e-06,
"loss": 0.9245,
"step": 54000
},
{
"epoch": 7.41,
"eval_HasAns_exact": 21.444809295276585,
"eval_HasAns_f1": 54.25388000235857,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 24.615384615384617,
"eval_NoAns_f1": 24.615384615384617,
"eval_NoAns_total": 65,
"eval_best_exact": 21.47062507829137,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 54.01255441045664,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.47062507829137,
"eval_f1": 54.01255441045667,
"eval_total": 7983,
"step": 54000
},
{
"epoch": 7.48,
"learning_rate": 5.3549517966695885e-06,
"loss": 0.9281,
"step": 54500
},
{
"epoch": 7.48,
"eval_HasAns_exact": 21.217479161404395,
"eval_HasAns_f1": 55.51878832249496,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.182512839784543,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.204530369223946,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.182512839784543,
"eval_f1": 55.204530369223974,
"eval_total": 7983,
"step": 54500
},
{
"epoch": 7.55,
"learning_rate": 5.2088810984516516e-06,
"loss": 0.921,
"step": 55000
},
{
"epoch": 7.55,
"eval_HasAns_exact": 21.55847436221268,
"eval_HasAns_f1": 55.80802472366072,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.4956783164224,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.46635848201745,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.50820493548791,
"eval_f1": 55.478885101083,
"eval_total": 7983,
"step": 55000
},
{
"epoch": 7.62,
"learning_rate": 5.062810400233713e-06,
"loss": 0.9311,
"step": 55500
},
{
"epoch": 7.62,
"eval_HasAns_exact": 21.962616822429908,
"eval_HasAns_f1": 56.38546877505227,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 12.307692307692308,
"eval_NoAns_f1": 12.307692307692308,
"eval_NoAns_total": 65,
"eval_best_exact": 21.88400350745334,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.02657419026227,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.88400350745334,
"eval_f1": 56.026574190262274,
"eval_total": 7983,
"step": 55500
},
{
"epoch": 7.69,
"learning_rate": 4.916739702015776e-06,
"loss": 0.9116,
"step": 56000
},
{
"epoch": 7.69,
"eval_HasAns_exact": 21.71002778479414,
"eval_HasAns_f1": 55.8268981189265,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 24.615384615384617,
"eval_NoAns_f1": 24.615384615384617,
"eval_NoAns_total": 65,
"eval_best_exact": 21.733684078667167,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.57276453785041,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.733684078667167,
"eval_f1": 55.57276453785043,
"eval_total": 7983,
"step": 56000
},
{
"epoch": 7.76,
"learning_rate": 4.770669003797838e-06,
"loss": 0.9173,
"step": 56500
},
{
"epoch": 7.76,
"eval_HasAns_exact": 21.596362717858046,
"eval_HasAns_f1": 56.19351406929686,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 23.076923076923077,
"eval_NoAns_f1": 23.076923076923077,
"eval_NoAns_total": 65,
"eval_best_exact": 21.608417888012024,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.9238687712254,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.608417888012024,
"eval_f1": 55.92386877122544,
"eval_total": 7983,
"step": 56500
},
{
"epoch": 7.83,
"learning_rate": 4.624598305579901e-06,
"loss": 0.922,
"step": 57000
},
{
"epoch": 7.83,
"eval_HasAns_exact": 22.17731750442031,
"eval_HasAns_f1": 55.756455451415086,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 24.615384615384617,
"eval_NoAns_f1": 24.615384615384617,
"eval_NoAns_total": 65,
"eval_best_exact": 22.197168984091192,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.50289543583923,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.197168984091192,
"eval_f1": 55.502895435839214,
"eval_total": 7983,
"step": 57000
},
{
"epoch": 7.9,
"learning_rate": 4.478527607361964e-06,
"loss": 0.9138,
"step": 57500
},
{
"epoch": 7.9,
"eval_HasAns_exact": 22.08891134124779,
"eval_HasAns_f1": 56.82319956291719,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.046849555305023,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.49832069888238,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.059376174370538,
"eval_f1": 56.51084731794791,
"eval_total": 7983,
"step": 57500
},
{
"epoch": 7.96,
"learning_rate": 4.332456909144026e-06,
"loss": 0.9051,
"step": 58000
},
{
"epoch": 7.96,
"eval_HasAns_exact": 21.886840111139175,
"eval_HasAns_f1": 55.728471748611895,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.871476888387825,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.437559727609774,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.871476888387825,
"eval_f1": 55.43755972760981,
"eval_total": 7983,
"step": 58000
},
{
"epoch": 8.03,
"learning_rate": 4.186386210926088e-06,
"loss": 0.8438,
"step": 58500
},
{
"epoch": 8.03,
"eval_HasAns_exact": 21.92472846678454,
"eval_HasAns_f1": 56.222570513713045,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.88400350745334,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.9025821530226,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.896530126518854,
"eval_f1": 55.91510877208819,
"eval_total": 7983,
"step": 58500
},
{
"epoch": 8.1,
"learning_rate": 4.040315512708151e-06,
"loss": 0.776,
"step": 59000
},
{
"epoch": 8.1,
"eval_HasAns_exact": 22.227835311947462,
"eval_HasAns_f1": 56.1608777793549,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.18464236502568,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.84139173956304,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.197168984091192,
"eval_f1": 55.85391835862862,
"eval_total": 7983,
"step": 59000
},
{
"epoch": 8.17,
"learning_rate": 3.894244814490214e-06,
"loss": 0.7949,
"step": 59500
},
{
"epoch": 8.17,
"eval_HasAns_exact": 22.025764081838847,
"eval_HasAns_f1": 56.274619626461195,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.959163221846424,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.92915422802447,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.97168984091194,
"eval_f1": 55.94168084709003,
"eval_total": 7983,
"step": 59500
},
{
"epoch": 8.24,
"learning_rate": 3.7481741162722763e-06,
"loss": 0.7951,
"step": 60000
},
{
"epoch": 8.24,
"eval_HasAns_exact": 21.684768881030564,
"eval_HasAns_f1": 56.08759973467501,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.671050983339597,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.79376358501269,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.671050983339597,
"eval_f1": 55.79376358501277,
"eval_total": 7983,
"step": 60000
},
{
"epoch": 8.31,
"learning_rate": 3.6021034180543385e-06,
"loss": 0.7791,
"step": 60500
},
{
"epoch": 8.31,
"eval_HasAns_exact": 22.051022985602426,
"eval_HasAns_f1": 56.14666242246213,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.996743079042965,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.81476550933922,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.996743079042965,
"eval_f1": 55.81476550933923,
"eval_total": 7983,
"step": 60500
},
{
"epoch": 8.38,
"learning_rate": 3.4560327198364012e-06,
"loss": 0.8014,
"step": 61000
},
{
"epoch": 8.38,
"eval_HasAns_exact": 22.354129830765345,
"eval_HasAns_f1": 56.44277640131104,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 22.284855317549795,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.0959418195641,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.297381936615306,
"eval_f1": 56.10846843862965,
"eval_total": 7983,
"step": 61000
},
{
"epoch": 8.44,
"learning_rate": 3.3099620216184635e-06,
"loss": 0.7841,
"step": 61500
},
{
"epoch": 8.44,
"eval_HasAns_exact": 22.215205860065673,
"eval_HasAns_f1": 56.09094279428335,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 22.172115745960166,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.77202618628775,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.172115745960166,
"eval_f1": 55.77202618628781,
"eval_total": 7983,
"step": 61500
},
{
"epoch": 8.51,
"learning_rate": 3.1638913234005257e-06,
"loss": 0.8008,
"step": 62000
},
{
"epoch": 8.51,
"eval_HasAns_exact": 22.063652437484212,
"eval_HasAns_f1": 56.17916434394415,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 22.046849555305023,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.88458264754471,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.046849555305023,
"eval_f1": 55.88458264754477,
"eval_total": 7983,
"step": 62000
},
{
"epoch": 8.58,
"learning_rate": 3.017820625182589e-06,
"loss": 0.7879,
"step": 62500
},
{
"epoch": 8.58,
"eval_HasAns_exact": 22.10154079312958,
"eval_HasAns_f1": 56.32847927477324,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 13.846153846153847,
"eval_NoAns_f1": 13.846153846153847,
"eval_NoAns_total": 65,
"eval_best_exact": 22.021796317173994,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.9700487157277,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.03432293623951,
"eval_f1": 55.98257533479327,
"eval_total": 7983,
"step": 62500
},
{
"epoch": 8.65,
"learning_rate": 2.871749926964651e-06,
"loss": 0.7893,
"step": 63000
},
{
"epoch": 8.65,
"eval_HasAns_exact": 21.811063399848447,
"eval_HasAns_f1": 55.61502667468564,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 21.53846153846154,
"eval_NoAns_f1": 21.53846153846154,
"eval_NoAns_total": 65,
"eval_best_exact": 21.79631717399474,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.32503835778039,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.80884379306025,
"eval_f1": 55.33756497684592,
"eval_total": 7983,
"step": 63000
},
{
"epoch": 8.72,
"learning_rate": 2.725679228746714e-06,
"loss": 0.8072,
"step": 63500
},
{
"epoch": 8.72,
"eval_HasAns_exact": 21.94998737054812,
"eval_HasAns_f1": 56.147388772329045,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.909056745584365,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.82801256411139,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.92158336464988,
"eval_f1": 55.84053918317692,
"eval_total": 7983,
"step": 63500
},
{
"epoch": 8.79,
"learning_rate": 2.579608530528776e-06,
"loss": 0.7824,
"step": 64000
},
{
"epoch": 8.79,
"eval_HasAns_exact": 22.038393533720637,
"eval_HasAns_f1": 56.069960647102285,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.996743079042965,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.751214882093905,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.00926969810848,
"eval_f1": 55.763741501159465,
"eval_total": 7983,
"step": 64000
},
{
"epoch": 8.86,
"learning_rate": 2.4335378323108387e-06,
"loss": 0.7966,
"step": 64500
},
{
"epoch": 8.86,
"eval_HasAns_exact": 22.10154079312958,
"eval_HasAns_f1": 56.371415222133756,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 22.059376174370538,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 56.05021492281784,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.071902793436053,
"eval_f1": 56.06274154188338,
"eval_total": 7983,
"step": 64500
},
{
"epoch": 8.92,
"learning_rate": 2.287467134092901e-06,
"loss": 0.7966,
"step": 65000
},
{
"epoch": 8.92,
"eval_HasAns_exact": 21.94998737054812,
"eval_HasAns_f1": 55.94050441592927,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.92158336464988,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.63533934176723,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.934109983715395,
"eval_f1": 55.6478659608328,
"eval_total": 7983,
"step": 65000
},
{
"epoch": 8.99,
"learning_rate": 2.1413964358749637e-06,
"loss": 0.7947,
"step": 65500
},
{
"epoch": 8.99,
"eval_HasAns_exact": 21.62162162162162,
"eval_HasAns_f1": 56.009996934703764,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.595891268946513,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.70426603143982,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.608417888012024,
"eval_f1": 55.7167926505054,
"eval_total": 7983,
"step": 65500
},
{
"epoch": 9.06,
"learning_rate": 1.9953257376570264e-06,
"loss": 0.6858,
"step": 66000
},
{
"epoch": 9.06,
"eval_HasAns_exact": 21.596362717858046,
"eval_HasAns_f1": 55.77625294716333,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.55831141174997,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.459898639062885,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.570838030815484,
"eval_f1": 55.47242525812843,
"eval_total": 7983,
"step": 66000
},
{
"epoch": 9.13,
"learning_rate": 1.8492550394390888e-06,
"loss": 0.7001,
"step": 66500
},
{
"epoch": 9.13,
"eval_HasAns_exact": 21.912099014902754,
"eval_HasAns_f1": 56.00529549829087,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.846423650256796,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.66202301834734,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.85895026932231,
"eval_f1": 55.6745496374129,
"eval_total": 7983,
"step": 66500
},
{
"epoch": 9.2,
"learning_rate": 1.7031843412211513e-06,
"loss": 0.7017,
"step": 67000
},
{
"epoch": 9.2,
"eval_HasAns_exact": 21.48269765092195,
"eval_HasAns_f1": 55.98671029097834,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.433045221094826,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.6561157564783,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.44557184016034,
"eval_f1": 55.668642375543875,
"eval_total": 7983,
"step": 67000
},
{
"epoch": 9.27,
"learning_rate": 1.5571136430032136e-06,
"loss": 0.7042,
"step": 67500
},
{
"epoch": 9.27,
"eval_HasAns_exact": 21.84895175549381,
"eval_HasAns_f1": 55.89859581000308,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 20.0,
"eval_NoAns_f1": 20.0,
"eval_NoAns_total": 65,
"eval_best_exact": 21.821370412125766,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.59377196838335,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.83389703119128,
"eval_f1": 55.60629858744889,
"eval_total": 7983,
"step": 67500
},
{
"epoch": 9.34,
"learning_rate": 1.411042944785276e-06,
"loss": 0.7119,
"step": 68000
},
{
"epoch": 9.34,
"eval_HasAns_exact": 21.899469563020965,
"eval_HasAns_f1": 56.260524050489586,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.846423650256796,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.92770004156034,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.85895026932231,
"eval_f1": 55.940226660625896,
"eval_total": 7983,
"step": 68000
},
{
"epoch": 9.41,
"learning_rate": 1.2649722465673387e-06,
"loss": 0.7158,
"step": 68500
},
{
"epoch": 9.41,
"eval_HasAns_exact": 21.242738065167973,
"eval_HasAns_f1": 55.89174064933859,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.195039458850058,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.561919386378875,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.20756607791557,
"eval_f1": 55.57444600544444,
"eval_total": 7983,
"step": 68500
},
{
"epoch": 9.47,
"learning_rate": 1.1189015483494012e-06,
"loss": 0.6944,
"step": 69000
},
{
"epoch": 9.47,
"eval_HasAns_exact": 21.672139429148775,
"eval_HasAns_f1": 55.86251843204239,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.608417888012024,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.52040848614698,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.62094450707754,
"eval_f1": 55.53293510521254,
"eval_total": 7983,
"step": 69000
},
{
"epoch": 9.54,
"learning_rate": 9.728308501314637e-07,
"loss": 0.7007,
"step": 69500
},
{
"epoch": 9.54,
"eval_HasAns_exact": 21.672139429148775,
"eval_HasAns_f1": 55.84201571688193,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 15.384615384615385,
"eval_NoAns_f1": 15.384615384615385,
"eval_NoAns_total": 65,
"eval_best_exact": 21.608417888012024,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.50007271029319,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.62094450707754,
"eval_f1": 55.51259932935878,
"eval_total": 7983,
"step": 69500
},
{
"epoch": 9.61,
"learning_rate": 8.267601519135262e-07,
"loss": 0.7084,
"step": 70000
},
{
"epoch": 9.61,
"eval_HasAns_exact": 21.747916140439504,
"eval_HasAns_f1": 56.25415794858626,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.708630840536138,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.9339123934493,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.721157459601653,
"eval_f1": 55.94643901251486,
"eval_total": 7983,
"step": 70000
},
{
"epoch": 9.68,
"learning_rate": 6.806894536955887e-07,
"loss": 0.7008,
"step": 70500
},
{
"epoch": 9.68,
"eval_HasAns_exact": 21.747916140439504,
"eval_HasAns_f1": 56.058704157634516,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 18.46153846153846,
"eval_NoAns_f1": 18.46153846153846,
"eval_NoAns_total": 65,
"eval_best_exact": 21.708630840536138,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.740050046367244,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.721157459601653,
"eval_f1": 55.75257666543282,
"eval_total": 7983,
"step": 70500
},
{
"epoch": 9.75,
"learning_rate": 5.346187554776512e-07,
"loss": 0.6984,
"step": 71000
},
{
"epoch": 9.75,
"eval_HasAns_exact": 21.78580449608487,
"eval_HasAns_f1": 56.249722496375995,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.733684078667167,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.91698643696666,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.746210697732682,
"eval_f1": 55.92951305603222,
"eval_total": 7983,
"step": 71000
},
{
"epoch": 9.82,
"learning_rate": 3.8854805725971376e-07,
"loss": 0.7118,
"step": 71500
},
{
"epoch": 9.82,
"eval_HasAns_exact": 22.051022985602426,
"eval_HasAns_f1": 56.254669133111044,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.996743079042965,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.92189279668958,
"eval_best_f1_thresh": 0.0,
"eval_exact": 22.00926969810848,
"eval_f1": 55.934419415755144,
"eval_total": 7983,
"step": 71500
},
{
"epoch": 9.89,
"learning_rate": 2.4247735904177623e-07,
"loss": 0.6861,
"step": 72000
},
{
"epoch": 9.89,
"eval_HasAns_exact": 22.025764081838847,
"eval_HasAns_f1": 56.10462500608517,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.97168984091194,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.77307037431819,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.984216459977453,
"eval_f1": 55.785596993383734,
"eval_total": 7983,
"step": 72000
},
{
"epoch": 9.95,
"learning_rate": 9.640666082383875e-08,
"loss": 0.6937,
"step": 72500
},
{
"epoch": 9.95,
"eval_HasAns_exact": 21.94998737054812,
"eval_HasAns_f1": 56.1125349455772,
"eval_HasAns_total": 7918,
"eval_NoAns_exact": 16.923076923076923,
"eval_NoAns_f1": 16.923076923076923,
"eval_NoAns_total": 65,
"eval_best_exact": 21.896530126518854,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 55.78091590869094,
"eval_best_f1_thresh": 0.0,
"eval_exact": 21.909056745584365,
"eval_f1": 55.793442527756504,
"eval_total": 7983,
"step": 72500
},
{
"epoch": 10.0,
"step": 72830,
"total_flos": 3.045026980558111e+17,
"train_loss": 1.5957024367517223,
"train_runtime": 72711.6119,
"train_samples_per_second": 16.027,
"train_steps_per_second": 1.002
}
],
"max_steps": 72830,
"num_train_epochs": 10,
"total_flos": 3.045026980558111e+17,
"trial_name": null,
"trial_params": null
}