emilys's picture
End of training
a257e1b
{
"best_metric": 0.9590143324113654,
"best_model_checkpoint": "twitter-roberta-base-dec2021-CoNLL/checkpoint-2000",
"epoch": 10.0,
"global_step": 2200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.11,
"eval_accuracy": 0.9349324403255325,
"eval_f1": 0.5845156059991893,
"eval_loss": 0.21257123351097107,
"eval_precision": 0.5638980134522134,
"eval_recall": 0.6066980814540559,
"eval_runtime": 5.9566,
"eval_samples_per_second": 545.785,
"eval_steps_per_second": 0.672,
"step": 25
},
{
"epoch": 0.23,
"eval_accuracy": 0.9765001362875277,
"eval_f1": 0.8431372549019608,
"eval_loss": 0.08492632955312729,
"eval_precision": 0.8258553905745643,
"eval_recall": 0.8611578593066308,
"eval_runtime": 5.965,
"eval_samples_per_second": 545.015,
"eval_steps_per_second": 0.671,
"step": 50
},
{
"epoch": 0.34,
"eval_accuracy": 0.9819905766909388,
"eval_f1": 0.8853031689262247,
"eval_loss": 0.06398079544305801,
"eval_precision": 0.8751850024666995,
"eval_recall": 0.8956580276001347,
"eval_runtime": 6.2595,
"eval_samples_per_second": 519.369,
"eval_steps_per_second": 0.639,
"step": 75
},
{
"epoch": 0.45,
"eval_accuracy": 0.9831587555001752,
"eval_f1": 0.8939961695395121,
"eval_loss": 0.05720128118991852,
"eval_precision": 0.88478655018955,
"eval_recall": 0.9033995287781892,
"eval_runtime": 6.1814,
"eval_samples_per_second": 525.936,
"eval_steps_per_second": 0.647,
"step": 100
},
{
"epoch": 0.57,
"eval_accuracy": 0.986585413340602,
"eval_f1": 0.9154577288644322,
"eval_loss": 0.046862851828336716,
"eval_precision": 0.9071381361533377,
"eval_recall": 0.9239313362504208,
"eval_runtime": 6.2511,
"eval_samples_per_second": 520.07,
"eval_steps_per_second": 0.64,
"step": 125
},
{
"epoch": 0.68,
"eval_accuracy": 0.987675713562556,
"eval_f1": 0.9237600536193029,
"eval_loss": 0.044157467782497406,
"eval_precision": 0.9197530864197531,
"eval_recall": 0.927802086839448,
"eval_runtime": 5.9975,
"eval_samples_per_second": 542.063,
"eval_steps_per_second": 0.667,
"step": 150
},
{
"epoch": 0.8,
"eval_accuracy": 0.9880845761457887,
"eval_f1": 0.9256350267379679,
"eval_loss": 0.04243418201804161,
"eval_precision": 0.9191835380019914,
"eval_recall": 0.9321777179400875,
"eval_runtime": 6.2444,
"eval_samples_per_second": 520.63,
"eval_steps_per_second": 0.641,
"step": 175
},
{
"epoch": 0.91,
"eval_accuracy": 0.9890775281336397,
"eval_f1": 0.9290815479156287,
"eval_loss": 0.04066213220357895,
"eval_precision": 0.9170491803278689,
"eval_recall": 0.9414338606529788,
"eval_runtime": 6.0302,
"eval_samples_per_second": 539.124,
"eval_steps_per_second": 0.663,
"step": 200
},
{
"epoch": 1.02,
"eval_accuracy": 0.9894279817764106,
"eval_f1": 0.9332665163284056,
"eval_loss": 0.0402386300265789,
"eval_precision": 0.9263803680981595,
"eval_recall": 0.9402558061258836,
"eval_runtime": 6.3589,
"eval_samples_per_second": 511.254,
"eval_steps_per_second": 0.629,
"step": 225
},
{
"epoch": 1.14,
"eval_accuracy": 0.9897394961255402,
"eval_f1": 0.9387072497700476,
"eval_loss": 0.03986027464270592,
"eval_precision": 0.932856905434602,
"eval_recall": 0.9446314372265231,
"eval_runtime": 6.1252,
"eval_samples_per_second": 530.756,
"eval_steps_per_second": 0.653,
"step": 250
},
{
"epoch": 1.25,
"eval_accuracy": 0.9896616175382579,
"eval_f1": 0.9345029239766081,
"eval_loss": 0.038380175828933716,
"eval_precision": 0.9278367617783676,
"eval_recall": 0.941265567149108,
"eval_runtime": 6.065,
"eval_samples_per_second": 536.028,
"eval_steps_per_second": 0.66,
"step": 275
},
{
"epoch": 1.36,
"eval_accuracy": 0.9905572212920057,
"eval_f1": 0.9427423405323957,
"eval_loss": 0.03632938861846924,
"eval_precision": 0.9378747501665556,
"eval_recall": 0.9476607202961965,
"eval_runtime": 6.3308,
"eval_samples_per_second": 513.519,
"eval_steps_per_second": 0.632,
"step": 300
},
{
"epoch": 1.48,
"eval_accuracy": 0.9904598730579027,
"eval_f1": 0.9436266309802609,
"eval_loss": 0.03615300729870796,
"eval_precision": 0.9379780512138344,
"eval_recall": 0.9493436553349041,
"eval_runtime": 6.0859,
"eval_samples_per_second": 534.186,
"eval_steps_per_second": 0.657,
"step": 325
},
{
"epoch": 1.59,
"eval_accuracy": 0.9905377516451852,
"eval_f1": 0.9446723026701265,
"eval_loss": 0.03641640394926071,
"eval_precision": 0.9397169025811823,
"eval_recall": 0.9496802423426456,
"eval_runtime": 6.3707,
"eval_samples_per_second": 510.303,
"eval_steps_per_second": 0.628,
"step": 350
},
{
"epoch": 1.7,
"eval_accuracy": 0.9898952533001051,
"eval_f1": 0.9398998330550917,
"eval_loss": 0.03667406737804413,
"eval_precision": 0.9324279562769129,
"eval_recall": 0.9474924267923258,
"eval_runtime": 6.0794,
"eval_samples_per_second": 534.757,
"eval_steps_per_second": 0.658,
"step": 375
},
{
"epoch": 1.82,
"eval_accuracy": 0.9898952533001051,
"eval_f1": 0.9404383469968212,
"eval_loss": 0.03719446063041687,
"eval_precision": 0.9349634065202928,
"eval_recall": 0.9459777852574891,
"eval_runtime": 6.4259,
"eval_samples_per_second": 505.925,
"eval_steps_per_second": 0.622,
"step": 400
},
{
"epoch": 1.93,
"eval_accuracy": 0.9909076749347767,
"eval_f1": 0.9461879655201272,
"eval_loss": 0.033916592597961426,
"eval_precision": 0.9410687531213584,
"eval_recall": 0.9513631773813531,
"eval_runtime": 6.1497,
"eval_samples_per_second": 528.643,
"eval_steps_per_second": 0.65,
"step": 425
},
{
"epoch": 2.05,
"eval_accuracy": 0.9911413106966239,
"eval_f1": 0.9473772274742742,
"eval_loss": 0.03361179679632187,
"eval_precision": 0.9419397770753618,
"eval_recall": 0.9528778189161898,
"eval_runtime": 6.1538,
"eval_samples_per_second": 528.288,
"eval_steps_per_second": 0.65,
"step": 450
},
{
"epoch": 2.16,
"eval_accuracy": 0.9913554768116506,
"eval_f1": 0.9491667364542332,
"eval_loss": 0.03356914222240448,
"eval_precision": 0.9446574429071511,
"eval_recall": 0.9537192864355436,
"eval_runtime": 6.3848,
"eval_samples_per_second": 509.18,
"eval_steps_per_second": 0.626,
"step": 475
},
{
"epoch": 2.27,
"learning_rate": 3.8636363636363636e-05,
"loss": 0.079,
"step": 500
},
{
"epoch": 2.27,
"eval_accuracy": 0.9913749464584712,
"eval_f1": 0.9492317969271877,
"eval_loss": 0.03446485847234726,
"eval_precision": 0.9419953596287703,
"eval_recall": 0.9565802760013463,
"eval_runtime": 6.1351,
"eval_samples_per_second": 529.902,
"eval_steps_per_second": 0.652,
"step": 500
},
{
"epoch": 2.39,
"eval_accuracy": 0.9912970678711888,
"eval_f1": 0.9478974702630256,
"eval_loss": 0.03643050789833069,
"eval_precision": 0.9436290860573716,
"eval_recall": 0.9522046449007069,
"eval_runtime": 6.3303,
"eval_samples_per_second": 513.56,
"eval_steps_per_second": 0.632,
"step": 525
},
{
"epoch": 2.5,
"eval_accuracy": 0.9916085822203186,
"eval_f1": 0.9496052410549304,
"eval_loss": 0.03402611240744591,
"eval_precision": 0.9478537894030852,
"eval_recall": 0.9513631773813531,
"eval_runtime": 6.2277,
"eval_samples_per_second": 522.02,
"eval_steps_per_second": 0.642,
"step": 550
},
{
"epoch": 2.61,
"eval_accuracy": 0.9917254001012422,
"eval_f1": 0.9519818989357244,
"eval_loss": 0.03392445296049118,
"eval_precision": 0.9480887998664663,
"eval_recall": 0.9559071019858634,
"eval_runtime": 6.3207,
"eval_samples_per_second": 514.343,
"eval_steps_per_second": 0.633,
"step": 575
},
{
"epoch": 2.73,
"eval_accuracy": 0.9901872980024142,
"eval_f1": 0.9414020171709594,
"eval_loss": 0.039618950337171555,
"eval_precision": 0.932617671345995,
"eval_recall": 0.9503534163581285,
"eval_runtime": 6.1153,
"eval_samples_per_second": 531.622,
"eval_steps_per_second": 0.654,
"step": 600
},
{
"epoch": 2.84,
"eval_accuracy": 0.9914722946925743,
"eval_f1": 0.9502345844504022,
"eval_loss": 0.03481649234890938,
"eval_precision": 0.9461127794461128,
"eval_recall": 0.9543924604510265,
"eval_runtime": 6.3663,
"eval_samples_per_second": 510.659,
"eval_steps_per_second": 0.628,
"step": 625
},
{
"epoch": 2.95,
"eval_accuracy": 0.9907908570538531,
"eval_f1": 0.9472891566265059,
"eval_loss": 0.03590630739927292,
"eval_precision": 0.9419301164725458,
"eval_recall": 0.9527095254123191,
"eval_runtime": 6.1326,
"eval_samples_per_second": 530.121,
"eval_steps_per_second": 0.652,
"step": 650
},
{
"epoch": 3.07,
"eval_accuracy": 0.9916475215139597,
"eval_f1": 0.9502965499958232,
"eval_loss": 0.03470408916473389,
"eval_precision": 0.9434400398075966,
"eval_recall": 0.9572534500168294,
"eval_runtime": 6.3596,
"eval_samples_per_second": 511.198,
"eval_steps_per_second": 0.629,
"step": 675
},
{
"epoch": 3.18,
"eval_accuracy": 0.9918227483353452,
"eval_f1": 0.9514563106796117,
"eval_loss": 0.03510947525501251,
"eval_precision": 0.9463869463869464,
"eval_recall": 0.9565802760013463,
"eval_runtime": 6.0809,
"eval_samples_per_second": 534.622,
"eval_steps_per_second": 0.658,
"step": 700
},
{
"epoch": 3.3,
"eval_accuracy": 0.9910634321093416,
"eval_f1": 0.9490787269681741,
"eval_loss": 0.03696366772055626,
"eval_precision": 0.944648216072024,
"eval_recall": 0.9535509929316729,
"eval_runtime": 6.1802,
"eval_samples_per_second": 526.033,
"eval_steps_per_second": 0.647,
"step": 725
},
{
"epoch": 3.41,
"eval_accuracy": 0.9916669911607804,
"eval_f1": 0.9521739130434784,
"eval_loss": 0.03580446541309357,
"eval_precision": 0.9461615154536391,
"eval_recall": 0.9582632110400539,
"eval_runtime": 6.3604,
"eval_samples_per_second": 511.128,
"eval_steps_per_second": 0.629,
"step": 750
},
{
"epoch": 3.52,
"eval_accuracy": 0.9919785055099101,
"eval_f1": 0.9523250942605781,
"eval_loss": 0.03529668599367142,
"eval_precision": 0.9482729851493409,
"eval_recall": 0.9564119824974756,
"eval_runtime": 6.1111,
"eval_samples_per_second": 531.982,
"eval_steps_per_second": 0.655,
"step": 775
},
{
"epoch": 3.64,
"eval_accuracy": 0.9915696429266773,
"eval_f1": 0.9516075016744809,
"eval_loss": 0.035107776522636414,
"eval_precision": 0.9468510496501167,
"eval_recall": 0.9564119824974756,
"eval_runtime": 6.1664,
"eval_samples_per_second": 527.215,
"eval_steps_per_second": 0.649,
"step": 800
},
{
"epoch": 3.75,
"eval_accuracy": 0.9918811572758071,
"eval_f1": 0.9528751987946764,
"eval_loss": 0.036074355244636536,
"eval_precision": 0.9478767693588677,
"eval_recall": 0.9579266240323123,
"eval_runtime": 6.3953,
"eval_samples_per_second": 508.343,
"eval_steps_per_second": 0.625,
"step": 825
},
{
"epoch": 3.86,
"eval_accuracy": 0.9918032786885246,
"eval_f1": 0.9539209115281501,
"eval_loss": 0.0369994230568409,
"eval_precision": 0.9497831164497831,
"eval_recall": 0.9580949175361831,
"eval_runtime": 6.198,
"eval_samples_per_second": 524.528,
"eval_steps_per_second": 0.645,
"step": 850
},
{
"epoch": 3.98,
"eval_accuracy": 0.9915112339862155,
"eval_f1": 0.9516560722649716,
"eval_loss": 0.03739459067583084,
"eval_precision": 0.9459594280013303,
"eval_recall": 0.9574217435207001,
"eval_runtime": 6.4107,
"eval_samples_per_second": 507.122,
"eval_steps_per_second": 0.624,
"step": 875
},
{
"epoch": 4.09,
"eval_accuracy": 0.9921732019781161,
"eval_f1": 0.9550213585727447,
"eval_loss": 0.03806319832801819,
"eval_precision": 0.9506419876604969,
"eval_recall": 0.9594412655671491,
"eval_runtime": 6.1503,
"eval_samples_per_second": 528.594,
"eval_steps_per_second": 0.65,
"step": 900
},
{
"epoch": 4.2,
"eval_accuracy": 0.9911997196370858,
"eval_f1": 0.9508580996232734,
"eval_loss": 0.041537731885910034,
"eval_precision": 0.9460269865067467,
"eval_recall": 0.9557388084819926,
"eval_runtime": 6.222,
"eval_samples_per_second": 522.501,
"eval_steps_per_second": 0.643,
"step": 925
},
{
"epoch": 4.32,
"eval_accuracy": 0.9916864608076009,
"eval_f1": 0.9524448544829321,
"eval_loss": 0.03895916789770126,
"eval_precision": 0.9493395753218525,
"eval_recall": 0.9555705149781218,
"eval_runtime": 6.4146,
"eval_samples_per_second": 506.815,
"eval_steps_per_second": 0.624,
"step": 950
},
{
"epoch": 4.43,
"eval_accuracy": 0.9919200965694482,
"eval_f1": 0.9536479250334672,
"eval_loss": 0.038863833993673325,
"eval_precision": 0.9482529118136439,
"eval_recall": 0.9591046785594076,
"eval_runtime": 6.2052,
"eval_samples_per_second": 523.911,
"eval_steps_per_second": 0.645,
"step": 975
},
{
"epoch": 4.55,
"learning_rate": 2.7272727272727273e-05,
"loss": 0.0123,
"step": 1000
},
{
"epoch": 4.55,
"eval_accuracy": 0.9918227483353452,
"eval_f1": 0.95163179916318,
"eval_loss": 0.03789864480495453,
"eval_precision": 0.9464047936085219,
"eval_recall": 0.9569168630090878,
"eval_runtime": 6.4251,
"eval_samples_per_second": 505.987,
"eval_steps_per_second": 0.623,
"step": 1000
},
{
"epoch": 4.66,
"eval_accuracy": 0.9919785055099101,
"eval_f1": 0.9520782805051433,
"eval_loss": 0.037610627710819244,
"eval_precision": 0.9463009143807148,
"eval_recall": 0.9579266240323123,
"eval_runtime": 5.9694,
"eval_samples_per_second": 544.608,
"eval_steps_per_second": 0.67,
"step": 1025
},
{
"epoch": 4.77,
"eval_accuracy": 0.9917059304544216,
"eval_f1": 0.9534747254589656,
"eval_loss": 0.03730636462569237,
"eval_precision": 0.9498914314347754,
"eval_recall": 0.9570851565129586,
"eval_runtime": 6.4491,
"eval_samples_per_second": 504.105,
"eval_steps_per_second": 0.62,
"step": 1050
},
{
"epoch": 4.89,
"eval_accuracy": 0.9922510805653986,
"eval_f1": 0.9552163703455216,
"eval_loss": 0.03659652918577194,
"eval_precision": 0.9520227348712805,
"eval_recall": 0.9584315045439246,
"eval_runtime": 6.1088,
"eval_samples_per_second": 532.187,
"eval_steps_per_second": 0.655,
"step": 1075
},
{
"epoch": 5.0,
"eval_accuracy": 0.9922705502122191,
"eval_f1": 0.9546746947650109,
"eval_loss": 0.03736859932541847,
"eval_precision": 0.9488031914893617,
"eval_recall": 0.9606193200942443,
"eval_runtime": 6.1341,
"eval_samples_per_second": 529.989,
"eval_steps_per_second": 0.652,
"step": 1100
},
{
"epoch": 5.11,
"eval_accuracy": 0.9920369144503719,
"eval_f1": 0.9552388935456831,
"eval_loss": 0.039282701909542084,
"eval_precision": 0.9515698062792252,
"eval_recall": 0.9589363850555369,
"eval_runtime": 6.409,
"eval_samples_per_second": 507.255,
"eval_steps_per_second": 0.624,
"step": 1125
},
{
"epoch": 5.23,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.9570613887957062,
"eval_loss": 0.038866784423589706,
"eval_precision": 0.9538615847542627,
"eval_recall": 0.9602827330865029,
"eval_runtime": 6.1822,
"eval_samples_per_second": 525.868,
"eval_steps_per_second": 0.647,
"step": 1150
},
{
"epoch": 5.34,
"eval_accuracy": 0.9916864608076009,
"eval_f1": 0.9530988274706869,
"eval_loss": 0.039710164070129395,
"eval_precision": 0.94864954984995,
"eval_recall": 0.9575900370245709,
"eval_runtime": 6.3284,
"eval_samples_per_second": 513.715,
"eval_steps_per_second": 0.632,
"step": 1175
},
{
"epoch": 5.45,
"eval_accuracy": 0.9919395662162689,
"eval_f1": 0.9523490494933422,
"eval_loss": 0.03970210626721382,
"eval_precision": 0.9478246374395732,
"eval_recall": 0.9569168630090878,
"eval_runtime": 6.2875,
"eval_samples_per_second": 517.058,
"eval_steps_per_second": 0.636,
"step": 1200
},
{
"epoch": 5.57,
"eval_accuracy": 0.9920174448035513,
"eval_f1": 0.9537354639002761,
"eval_loss": 0.03881015256047249,
"eval_precision": 0.9482615205456663,
"eval_recall": 0.9592729720632783,
"eval_runtime": 6.0937,
"eval_samples_per_second": 533.498,
"eval_steps_per_second": 0.656,
"step": 1225
},
{
"epoch": 5.68,
"eval_accuracy": 0.9922900198590398,
"eval_f1": 0.9553937567997322,
"eval_loss": 0.038882434368133545,
"eval_precision": 0.9502247378058931,
"eval_recall": 0.9606193200942443,
"eval_runtime": 6.4419,
"eval_samples_per_second": 504.662,
"eval_steps_per_second": 0.621,
"step": 1250
},
{
"epoch": 5.8,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.958162153098013,
"eval_loss": 0.038017645478248596,
"eval_precision": 0.9547201336675021,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.1177,
"eval_samples_per_second": 531.411,
"eval_steps_per_second": 0.654,
"step": 1275
},
{
"epoch": 5.91,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.954899171617438,
"eval_loss": 0.03911532089114189,
"eval_precision": 0.9495756365451822,
"eval_recall": 0.9602827330865029,
"eval_runtime": 6.3742,
"eval_samples_per_second": 510.022,
"eval_steps_per_second": 0.628,
"step": 1300
},
{
"epoch": 6.02,
"eval_accuracy": 0.9924457770336046,
"eval_f1": 0.9575432119483135,
"eval_loss": 0.038087744265794754,
"eval_precision": 0.9548192771084337,
"eval_recall": 0.9602827330865029,
"eval_runtime": 6.0894,
"eval_samples_per_second": 533.875,
"eval_steps_per_second": 0.657,
"step": 1325
},
{
"epoch": 6.14,
"eval_accuracy": 0.9921926716249367,
"eval_f1": 0.9562300855274191,
"eval_loss": 0.03999880701303482,
"eval_precision": 0.9528743315508021,
"eval_recall": 0.9596095590710199,
"eval_runtime": 6.1345,
"eval_samples_per_second": 529.956,
"eval_steps_per_second": 0.652,
"step": 1350
},
{
"epoch": 6.25,
"eval_accuracy": 0.9927378217359137,
"eval_f1": 0.958001508927823,
"eval_loss": 0.03927755728363991,
"eval_precision": 0.9544012026056455,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.3512,
"eval_samples_per_second": 511.868,
"eval_steps_per_second": 0.63,
"step": 1375
},
{
"epoch": 6.36,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.9567400217555017,
"eval_loss": 0.04191247373819351,
"eval_precision": 0.9514062239973373,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.1376,
"eval_samples_per_second": 529.682,
"eval_steps_per_second": 0.652,
"step": 1400
},
{
"epoch": 6.48,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.9578832789081471,
"eval_loss": 0.04148797690868378,
"eval_precision": 0.9531744709215131,
"eval_recall": 0.9626388421406934,
"eval_runtime": 6.379,
"eval_samples_per_second": 509.643,
"eval_steps_per_second": 0.627,
"step": 1425
},
{
"epoch": 6.59,
"eval_accuracy": 0.9923289591526809,
"eval_f1": 0.9566236811254396,
"eval_loss": 0.04145730286836624,
"eval_precision": 0.952,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.1372,
"eval_samples_per_second": 529.721,
"eval_steps_per_second": 0.652,
"step": 1450
},
{
"epoch": 6.7,
"eval_accuracy": 0.9925236556208871,
"eval_f1": 0.9576590928146222,
"eval_loss": 0.03992067277431488,
"eval_precision": 0.95421888053467,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.4046,
"eval_samples_per_second": 507.601,
"eval_steps_per_second": 0.625,
"step": 1475
},
{
"epoch": 6.82,
"learning_rate": 1.590909090909091e-05,
"loss": 0.0052,
"step": 1500
},
{
"epoch": 6.82,
"eval_accuracy": 0.9920563840971924,
"eval_f1": 0.9556468516810598,
"eval_loss": 0.0415743812918663,
"eval_precision": 0.9522138680033417,
"eval_recall": 0.9591046785594076,
"eval_runtime": 6.2338,
"eval_samples_per_second": 521.515,
"eval_steps_per_second": 0.642,
"step": 1500
},
{
"epoch": 6.93,
"eval_accuracy": 0.9919006269226276,
"eval_f1": 0.9550439514441188,
"eval_loss": 0.04101209715008736,
"eval_precision": 0.9501915708812261,
"eval_recall": 0.9599461460787614,
"eval_runtime": 5.9759,
"eval_samples_per_second": 544.016,
"eval_steps_per_second": 0.669,
"step": 1525
},
{
"epoch": 7.05,
"eval_accuracy": 0.9920758537440131,
"eval_f1": 0.9559832635983264,
"eval_loss": 0.040564827620983124,
"eval_precision": 0.9507323568575233,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.3076,
"eval_samples_per_second": 515.41,
"eval_steps_per_second": 0.634,
"step": 1550
},
{
"epoch": 7.16,
"eval_accuracy": 0.9922705502122191,
"eval_f1": 0.9555388093443858,
"eval_loss": 0.039956897497177124,
"eval_precision": 0.9508415264122646,
"eval_recall": 0.9602827330865029,
"eval_runtime": 6.1016,
"eval_samples_per_second": 532.811,
"eval_steps_per_second": 0.656,
"step": 1575
},
{
"epoch": 7.27,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.957126109529392,
"eval_loss": 0.04024273902177811,
"eval_precision": 0.9525,
"eval_recall": 0.9617973746213396,
"eval_runtime": 6.1018,
"eval_samples_per_second": 532.791,
"eval_steps_per_second": 0.656,
"step": 1600
},
{
"epoch": 7.39,
"eval_accuracy": 0.9924847163272458,
"eval_f1": 0.9591152815013404,
"eval_loss": 0.04005241021513939,
"eval_precision": 0.954954954954955,
"eval_recall": 0.9633120161561763,
"eval_runtime": 6.4344,
"eval_samples_per_second": 505.253,
"eval_steps_per_second": 0.622,
"step": 1625
},
{
"epoch": 7.5,
"eval_accuracy": 0.9927183520890931,
"eval_f1": 0.9600535968511849,
"eval_loss": 0.039704449474811554,
"eval_precision": 0.9554925820970162,
"eval_recall": 0.9646583641871423,
"eval_runtime": 6.185,
"eval_samples_per_second": 525.625,
"eval_steps_per_second": 0.647,
"step": 1650
},
{
"epoch": 7.61,
"eval_accuracy": 0.9921732019781161,
"eval_f1": 0.956769436997319,
"eval_loss": 0.04118635505437851,
"eval_precision": 0.9526192859526192,
"eval_recall": 0.9609559071019859,
"eval_runtime": 6.2989,
"eval_samples_per_second": 516.125,
"eval_steps_per_second": 0.635,
"step": 1675
},
{
"epoch": 7.73,
"eval_accuracy": 0.9923289591526809,
"eval_f1": 0.9573594705537405,
"eval_loss": 0.041853681206703186,
"eval_precision": 0.9531276063386155,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.0836,
"eval_samples_per_second": 534.391,
"eval_steps_per_second": 0.658,
"step": 1700
},
{
"epoch": 7.84,
"eval_accuracy": 0.9927378217359137,
"eval_f1": 0.9588259958071279,
"eval_loss": 0.040749866515398026,
"eval_precision": 0.9555406986461641,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.3737,
"eval_samples_per_second": 510.067,
"eval_steps_per_second": 0.628,
"step": 1725
},
{
"epoch": 7.95,
"eval_accuracy": 0.9926988824422724,
"eval_f1": 0.9589339591015756,
"eval_loss": 0.04090812802314758,
"eval_precision": 0.9550918196994992,
"eval_recall": 0.9628071356445641,
"eval_runtime": 6.1325,
"eval_samples_per_second": 530.13,
"eval_steps_per_second": 0.652,
"step": 1750
},
{
"epoch": 8.07,
"eval_accuracy": 0.9923873680931428,
"eval_f1": 0.9567983924983255,
"eval_loss": 0.041253186762332916,
"eval_precision": 0.9520159946684439,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.1524,
"eval_samples_per_second": 528.415,
"eval_steps_per_second": 0.65,
"step": 1775
},
{
"epoch": 8.18,
"eval_accuracy": 0.9922510805653986,
"eval_f1": 0.95546626485853,
"eval_loss": 0.041376810520887375,
"eval_precision": 0.9505329780146569,
"eval_recall": 0.9604510265903736,
"eval_runtime": 6.3306,
"eval_samples_per_second": 513.537,
"eval_steps_per_second": 0.632,
"step": 1800
},
{
"epoch": 8.3,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.957309401996142,
"eval_loss": 0.04096854478120804,
"eval_precision": 0.9541882628323023,
"eval_recall": 0.9604510265903736,
"eval_runtime": 6.092,
"eval_samples_per_second": 533.646,
"eval_steps_per_second": 0.657,
"step": 1825
},
{
"epoch": 8.41,
"eval_accuracy": 0.9924457770336046,
"eval_f1": 0.9576093343406362,
"eval_loss": 0.04169493913650513,
"eval_precision": 0.9552838720482332,
"eval_recall": 0.9599461460787614,
"eval_runtime": 6.3572,
"eval_samples_per_second": 511.386,
"eval_steps_per_second": 0.629,
"step": 1850
},
{
"epoch": 8.52,
"eval_accuracy": 0.9923289591526809,
"eval_f1": 0.9575574568025499,
"eval_loss": 0.04175976663827896,
"eval_precision": 0.954515050167224,
"eval_recall": 0.9606193200942443,
"eval_runtime": 6.2169,
"eval_samples_per_second": 522.929,
"eval_steps_per_second": 0.643,
"step": 1875
},
{
"epoch": 8.64,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.958001508927823,
"eval_loss": 0.04138173907995224,
"eval_precision": 0.9544012026056455,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.4751,
"eval_samples_per_second": 502.077,
"eval_steps_per_second": 0.618,
"step": 1900
},
{
"epoch": 8.75,
"eval_accuracy": 0.9925236556208871,
"eval_f1": 0.9587386782958739,
"eval_loss": 0.04193359240889549,
"eval_precision": 0.9555332664660648,
"eval_recall": 0.9619656681252103,
"eval_runtime": 6.1398,
"eval_samples_per_second": 529.492,
"eval_steps_per_second": 0.651,
"step": 1925
},
{
"epoch": 8.86,
"eval_accuracy": 0.9925625949145283,
"eval_f1": 0.9577393929230252,
"eval_loss": 0.04151003435254097,
"eval_precision": 0.9543783422459893,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.1314,
"eval_samples_per_second": 530.223,
"eval_steps_per_second": 0.652,
"step": 1950
},
{
"epoch": 8.98,
"eval_accuracy": 0.9926210038549901,
"eval_f1": 0.9576590928146222,
"eval_loss": 0.041335199028253555,
"eval_precision": 0.95421888053467,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.4106,
"eval_samples_per_second": 507.128,
"eval_steps_per_second": 0.624,
"step": 1975
},
{
"epoch": 9.09,
"learning_rate": 4.5454545454545455e-06,
"loss": 0.0027,
"step": 2000
},
{
"epoch": 9.09,
"eval_accuracy": 0.9926599431486313,
"eval_f1": 0.9590143324113654,
"eval_loss": 0.0412251353263855,
"eval_precision": 0.9552512940390716,
"eval_recall": 0.9628071356445641,
"eval_runtime": 6.2732,
"eval_samples_per_second": 518.239,
"eval_steps_per_second": 0.638,
"step": 2000
},
{
"epoch": 9.2,
"eval_accuracy": 0.9926599431486313,
"eval_f1": 0.9591819629536502,
"eval_loss": 0.04075352102518082,
"eval_precision": 0.955418266822508,
"eval_recall": 0.9629754291484349,
"eval_runtime": 6.2741,
"eval_samples_per_second": 518.162,
"eval_steps_per_second": 0.638,
"step": 2025
},
{
"epoch": 9.32,
"eval_accuracy": 0.9926210038549901,
"eval_f1": 0.9579070937447594,
"eval_loss": 0.040350958704948425,
"eval_precision": 0.9545454545454546,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.0983,
"eval_samples_per_second": 533.103,
"eval_steps_per_second": 0.656,
"step": 2050
},
{
"epoch": 9.43,
"eval_accuracy": 0.9926404735018107,
"eval_f1": 0.9587317564167085,
"eval_loss": 0.040736954659223557,
"eval_precision": 0.955685618729097,
"eval_recall": 0.9617973746213396,
"eval_runtime": 6.0517,
"eval_samples_per_second": 537.203,
"eval_steps_per_second": 0.661,
"step": 2075
},
{
"epoch": 9.55,
"eval_accuracy": 0.9926015342081694,
"eval_f1": 0.9584905660377357,
"eval_loss": 0.04098973423242569,
"eval_precision": 0.9552064181848571,
"eval_recall": 0.9617973746213396,
"eval_runtime": 6.3854,
"eval_samples_per_second": 509.128,
"eval_steps_per_second": 0.626,
"step": 2100
},
{
"epoch": 9.66,
"eval_accuracy": 0.9925041859740664,
"eval_f1": 0.9585778970316955,
"eval_loss": 0.04119739308953285,
"eval_precision": 0.9552139037433155,
"eval_recall": 0.9619656681252103,
"eval_runtime": 6.1845,
"eval_samples_per_second": 525.672,
"eval_steps_per_second": 0.647,
"step": 2125
},
{
"epoch": 9.77,
"eval_accuracy": 0.9924847163272458,
"eval_f1": 0.9589064072458906,
"eval_loss": 0.04128846526145935,
"eval_precision": 0.9557004346372451,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.444,
"eval_samples_per_second": 504.5,
"eval_steps_per_second": 0.621,
"step": 2150
},
{
"epoch": 9.89,
"eval_accuracy": 0.9925041859740664,
"eval_f1": 0.9589064072458906,
"eval_loss": 0.04132496938109398,
"eval_precision": 0.9557004346372451,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.0985,
"eval_samples_per_second": 533.086,
"eval_steps_per_second": 0.656,
"step": 2175
},
{
"epoch": 10.0,
"eval_accuracy": 0.9925041859740664,
"eval_f1": 0.9589064072458906,
"eval_loss": 0.041328806430101395,
"eval_precision": 0.9557004346372451,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.1664,
"eval_samples_per_second": 527.211,
"eval_steps_per_second": 0.649,
"step": 2200
},
{
"epoch": 10.0,
"step": 2200,
"total_flos": 4144211411102244.0,
"train_loss": 0.022697925716638565,
"train_runtime": 1311.4885,
"train_samples_per_second": 107.069,
"train_steps_per_second": 1.677
}
],
"max_steps": 2200,
"num_train_epochs": 10,
"total_flos": 4144211411102244.0,
"trial_name": null,
"trial_params": null
}