{ "best_metric": 0.9590143324113654, "best_model_checkpoint": "twitter-roberta-base-dec2021-CoNLL/checkpoint-2000", "epoch": 10.0, "global_step": 2200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.11, "eval_accuracy": 0.9349324403255325, "eval_f1": 0.5845156059991893, "eval_loss": 0.21257123351097107, "eval_precision": 0.5638980134522134, "eval_recall": 0.6066980814540559, "eval_runtime": 5.9566, "eval_samples_per_second": 545.785, "eval_steps_per_second": 0.672, "step": 25 }, { "epoch": 0.23, "eval_accuracy": 0.9765001362875277, "eval_f1": 0.8431372549019608, "eval_loss": 0.08492632955312729, "eval_precision": 0.8258553905745643, "eval_recall": 0.8611578593066308, "eval_runtime": 5.965, "eval_samples_per_second": 545.015, "eval_steps_per_second": 0.671, "step": 50 }, { "epoch": 0.34, "eval_accuracy": 0.9819905766909388, "eval_f1": 0.8853031689262247, "eval_loss": 0.06398079544305801, "eval_precision": 0.8751850024666995, "eval_recall": 0.8956580276001347, "eval_runtime": 6.2595, "eval_samples_per_second": 519.369, "eval_steps_per_second": 0.639, "step": 75 }, { "epoch": 0.45, "eval_accuracy": 0.9831587555001752, "eval_f1": 0.8939961695395121, "eval_loss": 0.05720128118991852, "eval_precision": 0.88478655018955, "eval_recall": 0.9033995287781892, "eval_runtime": 6.1814, "eval_samples_per_second": 525.936, "eval_steps_per_second": 0.647, "step": 100 }, { "epoch": 0.57, "eval_accuracy": 0.986585413340602, "eval_f1": 0.9154577288644322, "eval_loss": 0.046862851828336716, "eval_precision": 0.9071381361533377, "eval_recall": 0.9239313362504208, "eval_runtime": 6.2511, "eval_samples_per_second": 520.07, "eval_steps_per_second": 0.64, "step": 125 }, { "epoch": 0.68, "eval_accuracy": 0.987675713562556, "eval_f1": 0.9237600536193029, "eval_loss": 0.044157467782497406, "eval_precision": 0.9197530864197531, "eval_recall": 0.927802086839448, "eval_runtime": 5.9975, "eval_samples_per_second": 542.063, "eval_steps_per_second": 0.667, "step": 150 }, { "epoch": 0.8, "eval_accuracy": 0.9880845761457887, "eval_f1": 0.9256350267379679, "eval_loss": 0.04243418201804161, "eval_precision": 0.9191835380019914, "eval_recall": 0.9321777179400875, "eval_runtime": 6.2444, "eval_samples_per_second": 520.63, "eval_steps_per_second": 0.641, "step": 175 }, { "epoch": 0.91, "eval_accuracy": 0.9890775281336397, "eval_f1": 0.9290815479156287, "eval_loss": 0.04066213220357895, "eval_precision": 0.9170491803278689, "eval_recall": 0.9414338606529788, "eval_runtime": 6.0302, "eval_samples_per_second": 539.124, "eval_steps_per_second": 0.663, "step": 200 }, { "epoch": 1.02, "eval_accuracy": 0.9894279817764106, "eval_f1": 0.9332665163284056, "eval_loss": 0.0402386300265789, "eval_precision": 0.9263803680981595, "eval_recall": 0.9402558061258836, "eval_runtime": 6.3589, "eval_samples_per_second": 511.254, "eval_steps_per_second": 0.629, "step": 225 }, { "epoch": 1.14, "eval_accuracy": 0.9897394961255402, "eval_f1": 0.9387072497700476, "eval_loss": 0.03986027464270592, "eval_precision": 0.932856905434602, "eval_recall": 0.9446314372265231, "eval_runtime": 6.1252, "eval_samples_per_second": 530.756, "eval_steps_per_second": 0.653, "step": 250 }, { "epoch": 1.25, "eval_accuracy": 0.9896616175382579, "eval_f1": 0.9345029239766081, "eval_loss": 0.038380175828933716, "eval_precision": 0.9278367617783676, "eval_recall": 0.941265567149108, "eval_runtime": 6.065, "eval_samples_per_second": 536.028, "eval_steps_per_second": 0.66, "step": 275 }, { "epoch": 1.36, "eval_accuracy": 0.9905572212920057, "eval_f1": 0.9427423405323957, "eval_loss": 0.03632938861846924, "eval_precision": 0.9378747501665556, "eval_recall": 0.9476607202961965, "eval_runtime": 6.3308, "eval_samples_per_second": 513.519, "eval_steps_per_second": 0.632, "step": 300 }, { "epoch": 1.48, "eval_accuracy": 0.9904598730579027, "eval_f1": 0.9436266309802609, "eval_loss": 0.03615300729870796, "eval_precision": 0.9379780512138344, "eval_recall": 0.9493436553349041, "eval_runtime": 6.0859, "eval_samples_per_second": 534.186, "eval_steps_per_second": 0.657, "step": 325 }, { "epoch": 1.59, "eval_accuracy": 0.9905377516451852, "eval_f1": 0.9446723026701265, "eval_loss": 0.03641640394926071, "eval_precision": 0.9397169025811823, "eval_recall": 0.9496802423426456, "eval_runtime": 6.3707, "eval_samples_per_second": 510.303, "eval_steps_per_second": 0.628, "step": 350 }, { "epoch": 1.7, "eval_accuracy": 0.9898952533001051, "eval_f1": 0.9398998330550917, "eval_loss": 0.03667406737804413, "eval_precision": 0.9324279562769129, "eval_recall": 0.9474924267923258, "eval_runtime": 6.0794, "eval_samples_per_second": 534.757, "eval_steps_per_second": 0.658, "step": 375 }, { "epoch": 1.82, "eval_accuracy": 0.9898952533001051, "eval_f1": 0.9404383469968212, "eval_loss": 0.03719446063041687, "eval_precision": 0.9349634065202928, "eval_recall": 0.9459777852574891, "eval_runtime": 6.4259, "eval_samples_per_second": 505.925, "eval_steps_per_second": 0.622, "step": 400 }, { "epoch": 1.93, "eval_accuracy": 0.9909076749347767, "eval_f1": 0.9461879655201272, "eval_loss": 0.033916592597961426, "eval_precision": 0.9410687531213584, "eval_recall": 0.9513631773813531, "eval_runtime": 6.1497, "eval_samples_per_second": 528.643, "eval_steps_per_second": 0.65, "step": 425 }, { "epoch": 2.05, "eval_accuracy": 0.9911413106966239, "eval_f1": 0.9473772274742742, "eval_loss": 0.03361179679632187, "eval_precision": 0.9419397770753618, "eval_recall": 0.9528778189161898, "eval_runtime": 6.1538, "eval_samples_per_second": 528.288, "eval_steps_per_second": 0.65, "step": 450 }, { "epoch": 2.16, "eval_accuracy": 0.9913554768116506, "eval_f1": 0.9491667364542332, "eval_loss": 0.03356914222240448, "eval_precision": 0.9446574429071511, "eval_recall": 0.9537192864355436, "eval_runtime": 6.3848, "eval_samples_per_second": 509.18, "eval_steps_per_second": 0.626, "step": 475 }, { "epoch": 2.27, "learning_rate": 3.8636363636363636e-05, "loss": 0.079, "step": 500 }, { "epoch": 2.27, "eval_accuracy": 0.9913749464584712, "eval_f1": 0.9492317969271877, "eval_loss": 0.03446485847234726, "eval_precision": 0.9419953596287703, "eval_recall": 0.9565802760013463, "eval_runtime": 6.1351, "eval_samples_per_second": 529.902, "eval_steps_per_second": 0.652, "step": 500 }, { "epoch": 2.39, "eval_accuracy": 0.9912970678711888, "eval_f1": 0.9478974702630256, "eval_loss": 0.03643050789833069, "eval_precision": 0.9436290860573716, "eval_recall": 0.9522046449007069, "eval_runtime": 6.3303, "eval_samples_per_second": 513.56, "eval_steps_per_second": 0.632, "step": 525 }, { "epoch": 2.5, "eval_accuracy": 0.9916085822203186, "eval_f1": 0.9496052410549304, "eval_loss": 0.03402611240744591, "eval_precision": 0.9478537894030852, "eval_recall": 0.9513631773813531, "eval_runtime": 6.2277, "eval_samples_per_second": 522.02, "eval_steps_per_second": 0.642, "step": 550 }, { "epoch": 2.61, "eval_accuracy": 0.9917254001012422, "eval_f1": 0.9519818989357244, "eval_loss": 0.03392445296049118, "eval_precision": 0.9480887998664663, "eval_recall": 0.9559071019858634, "eval_runtime": 6.3207, "eval_samples_per_second": 514.343, "eval_steps_per_second": 0.633, "step": 575 }, { "epoch": 2.73, "eval_accuracy": 0.9901872980024142, "eval_f1": 0.9414020171709594, "eval_loss": 0.039618950337171555, "eval_precision": 0.932617671345995, "eval_recall": 0.9503534163581285, "eval_runtime": 6.1153, "eval_samples_per_second": 531.622, "eval_steps_per_second": 0.654, "step": 600 }, { "epoch": 2.84, "eval_accuracy": 0.9914722946925743, "eval_f1": 0.9502345844504022, "eval_loss": 0.03481649234890938, "eval_precision": 0.9461127794461128, "eval_recall": 0.9543924604510265, "eval_runtime": 6.3663, "eval_samples_per_second": 510.659, "eval_steps_per_second": 0.628, "step": 625 }, { "epoch": 2.95, "eval_accuracy": 0.9907908570538531, "eval_f1": 0.9472891566265059, "eval_loss": 0.03590630739927292, "eval_precision": 0.9419301164725458, "eval_recall": 0.9527095254123191, "eval_runtime": 6.1326, "eval_samples_per_second": 530.121, "eval_steps_per_second": 0.652, "step": 650 }, { "epoch": 3.07, "eval_accuracy": 0.9916475215139597, "eval_f1": 0.9502965499958232, "eval_loss": 0.03470408916473389, "eval_precision": 0.9434400398075966, "eval_recall": 0.9572534500168294, "eval_runtime": 6.3596, "eval_samples_per_second": 511.198, "eval_steps_per_second": 0.629, "step": 675 }, { "epoch": 3.18, "eval_accuracy": 0.9918227483353452, "eval_f1": 0.9514563106796117, "eval_loss": 0.03510947525501251, "eval_precision": 0.9463869463869464, "eval_recall": 0.9565802760013463, "eval_runtime": 6.0809, "eval_samples_per_second": 534.622, "eval_steps_per_second": 0.658, "step": 700 }, { "epoch": 3.3, "eval_accuracy": 0.9910634321093416, "eval_f1": 0.9490787269681741, "eval_loss": 0.03696366772055626, "eval_precision": 0.944648216072024, "eval_recall": 0.9535509929316729, "eval_runtime": 6.1802, "eval_samples_per_second": 526.033, "eval_steps_per_second": 0.647, "step": 725 }, { "epoch": 3.41, "eval_accuracy": 0.9916669911607804, "eval_f1": 0.9521739130434784, "eval_loss": 0.03580446541309357, "eval_precision": 0.9461615154536391, "eval_recall": 0.9582632110400539, "eval_runtime": 6.3604, "eval_samples_per_second": 511.128, "eval_steps_per_second": 0.629, "step": 750 }, { "epoch": 3.52, "eval_accuracy": 0.9919785055099101, "eval_f1": 0.9523250942605781, "eval_loss": 0.03529668599367142, "eval_precision": 0.9482729851493409, "eval_recall": 0.9564119824974756, "eval_runtime": 6.1111, "eval_samples_per_second": 531.982, "eval_steps_per_second": 0.655, "step": 775 }, { "epoch": 3.64, "eval_accuracy": 0.9915696429266773, "eval_f1": 0.9516075016744809, "eval_loss": 0.035107776522636414, "eval_precision": 0.9468510496501167, "eval_recall": 0.9564119824974756, "eval_runtime": 6.1664, "eval_samples_per_second": 527.215, "eval_steps_per_second": 0.649, "step": 800 }, { "epoch": 3.75, "eval_accuracy": 0.9918811572758071, "eval_f1": 0.9528751987946764, "eval_loss": 0.036074355244636536, "eval_precision": 0.9478767693588677, "eval_recall": 0.9579266240323123, "eval_runtime": 6.3953, "eval_samples_per_second": 508.343, "eval_steps_per_second": 0.625, "step": 825 }, { "epoch": 3.86, "eval_accuracy": 0.9918032786885246, "eval_f1": 0.9539209115281501, "eval_loss": 0.0369994230568409, "eval_precision": 0.9497831164497831, "eval_recall": 0.9580949175361831, "eval_runtime": 6.198, "eval_samples_per_second": 524.528, "eval_steps_per_second": 0.645, "step": 850 }, { "epoch": 3.98, "eval_accuracy": 0.9915112339862155, "eval_f1": 0.9516560722649716, "eval_loss": 0.03739459067583084, "eval_precision": 0.9459594280013303, "eval_recall": 0.9574217435207001, "eval_runtime": 6.4107, "eval_samples_per_second": 507.122, "eval_steps_per_second": 0.624, "step": 875 }, { "epoch": 4.09, "eval_accuracy": 0.9921732019781161, "eval_f1": 0.9550213585727447, "eval_loss": 0.03806319832801819, "eval_precision": 0.9506419876604969, "eval_recall": 0.9594412655671491, "eval_runtime": 6.1503, "eval_samples_per_second": 528.594, "eval_steps_per_second": 0.65, "step": 900 }, { "epoch": 4.2, "eval_accuracy": 0.9911997196370858, "eval_f1": 0.9508580996232734, "eval_loss": 0.041537731885910034, "eval_precision": 0.9460269865067467, "eval_recall": 0.9557388084819926, "eval_runtime": 6.222, "eval_samples_per_second": 522.501, "eval_steps_per_second": 0.643, "step": 925 }, { "epoch": 4.32, "eval_accuracy": 0.9916864608076009, "eval_f1": 0.9524448544829321, "eval_loss": 0.03895916789770126, "eval_precision": 0.9493395753218525, "eval_recall": 0.9555705149781218, "eval_runtime": 6.4146, "eval_samples_per_second": 506.815, "eval_steps_per_second": 0.624, "step": 950 }, { "epoch": 4.43, "eval_accuracy": 0.9919200965694482, "eval_f1": 0.9536479250334672, "eval_loss": 0.038863833993673325, "eval_precision": 0.9482529118136439, "eval_recall": 0.9591046785594076, "eval_runtime": 6.2052, "eval_samples_per_second": 523.911, "eval_steps_per_second": 0.645, "step": 975 }, { "epoch": 4.55, "learning_rate": 2.7272727272727273e-05, "loss": 0.0123, "step": 1000 }, { "epoch": 4.55, "eval_accuracy": 0.9918227483353452, "eval_f1": 0.95163179916318, "eval_loss": 0.03789864480495453, "eval_precision": 0.9464047936085219, "eval_recall": 0.9569168630090878, "eval_runtime": 6.4251, "eval_samples_per_second": 505.987, "eval_steps_per_second": 0.623, "step": 1000 }, { "epoch": 4.66, "eval_accuracy": 0.9919785055099101, "eval_f1": 0.9520782805051433, "eval_loss": 0.037610627710819244, "eval_precision": 0.9463009143807148, "eval_recall": 0.9579266240323123, "eval_runtime": 5.9694, "eval_samples_per_second": 544.608, "eval_steps_per_second": 0.67, "step": 1025 }, { "epoch": 4.77, "eval_accuracy": 0.9917059304544216, "eval_f1": 0.9534747254589656, "eval_loss": 0.03730636462569237, "eval_precision": 0.9498914314347754, "eval_recall": 0.9570851565129586, "eval_runtime": 6.4491, "eval_samples_per_second": 504.105, "eval_steps_per_second": 0.62, "step": 1050 }, { "epoch": 4.89, "eval_accuracy": 0.9922510805653986, "eval_f1": 0.9552163703455216, "eval_loss": 0.03659652918577194, "eval_precision": 0.9520227348712805, "eval_recall": 0.9584315045439246, "eval_runtime": 6.1088, "eval_samples_per_second": 532.187, "eval_steps_per_second": 0.655, "step": 1075 }, { "epoch": 5.0, "eval_accuracy": 0.9922705502122191, "eval_f1": 0.9546746947650109, "eval_loss": 0.03736859932541847, "eval_precision": 0.9488031914893617, "eval_recall": 0.9606193200942443, "eval_runtime": 6.1341, "eval_samples_per_second": 529.989, "eval_steps_per_second": 0.652, "step": 1100 }, { "epoch": 5.11, "eval_accuracy": 0.9920369144503719, "eval_f1": 0.9552388935456831, "eval_loss": 0.039282701909542084, "eval_precision": 0.9515698062792252, "eval_recall": 0.9589363850555369, "eval_runtime": 6.409, "eval_samples_per_second": 507.255, "eval_steps_per_second": 0.624, "step": 1125 }, { "epoch": 5.23, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.9570613887957062, "eval_loss": 0.038866784423589706, "eval_precision": 0.9538615847542627, "eval_recall": 0.9602827330865029, "eval_runtime": 6.1822, "eval_samples_per_second": 525.868, "eval_steps_per_second": 0.647, "step": 1150 }, { "epoch": 5.34, "eval_accuracy": 0.9916864608076009, "eval_f1": 0.9530988274706869, "eval_loss": 0.039710164070129395, "eval_precision": 0.94864954984995, "eval_recall": 0.9575900370245709, "eval_runtime": 6.3284, "eval_samples_per_second": 513.715, "eval_steps_per_second": 0.632, "step": 1175 }, { "epoch": 5.45, "eval_accuracy": 0.9919395662162689, "eval_f1": 0.9523490494933422, "eval_loss": 0.03970210626721382, "eval_precision": 0.9478246374395732, "eval_recall": 0.9569168630090878, "eval_runtime": 6.2875, "eval_samples_per_second": 517.058, "eval_steps_per_second": 0.636, "step": 1200 }, { "epoch": 5.57, "eval_accuracy": 0.9920174448035513, "eval_f1": 0.9537354639002761, "eval_loss": 0.03881015256047249, "eval_precision": 0.9482615205456663, "eval_recall": 0.9592729720632783, "eval_runtime": 6.0937, "eval_samples_per_second": 533.498, "eval_steps_per_second": 0.656, "step": 1225 }, { "epoch": 5.68, "eval_accuracy": 0.9922900198590398, "eval_f1": 0.9553937567997322, "eval_loss": 0.038882434368133545, "eval_precision": 0.9502247378058931, "eval_recall": 0.9606193200942443, "eval_runtime": 6.4419, "eval_samples_per_second": 504.662, "eval_steps_per_second": 0.621, "step": 1250 }, { "epoch": 5.8, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.958162153098013, "eval_loss": 0.038017645478248596, "eval_precision": 0.9547201336675021, "eval_recall": 0.9616290811174689, "eval_runtime": 6.1177, "eval_samples_per_second": 531.411, "eval_steps_per_second": 0.654, "step": 1275 }, { "epoch": 5.91, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.954899171617438, "eval_loss": 0.03911532089114189, "eval_precision": 0.9495756365451822, "eval_recall": 0.9602827330865029, "eval_runtime": 6.3742, "eval_samples_per_second": 510.022, "eval_steps_per_second": 0.628, "step": 1300 }, { "epoch": 6.02, "eval_accuracy": 0.9924457770336046, "eval_f1": 0.9575432119483135, "eval_loss": 0.038087744265794754, "eval_precision": 0.9548192771084337, "eval_recall": 0.9602827330865029, "eval_runtime": 6.0894, "eval_samples_per_second": 533.875, "eval_steps_per_second": 0.657, "step": 1325 }, { "epoch": 6.14, "eval_accuracy": 0.9921926716249367, "eval_f1": 0.9562300855274191, "eval_loss": 0.03999880701303482, "eval_precision": 0.9528743315508021, "eval_recall": 0.9596095590710199, "eval_runtime": 6.1345, "eval_samples_per_second": 529.956, "eval_steps_per_second": 0.652, "step": 1350 }, { "epoch": 6.25, "eval_accuracy": 0.9927378217359137, "eval_f1": 0.958001508927823, "eval_loss": 0.03927755728363991, "eval_precision": 0.9544012026056455, "eval_recall": 0.9616290811174689, "eval_runtime": 6.3512, "eval_samples_per_second": 511.868, "eval_steps_per_second": 0.63, "step": 1375 }, { "epoch": 6.36, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.9567400217555017, "eval_loss": 0.04191247373819351, "eval_precision": 0.9514062239973373, "eval_recall": 0.9621339616290812, "eval_runtime": 6.1376, "eval_samples_per_second": 529.682, "eval_steps_per_second": 0.652, "step": 1400 }, { "epoch": 6.48, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.9578832789081471, "eval_loss": 0.04148797690868378, "eval_precision": 0.9531744709215131, "eval_recall": 0.9626388421406934, "eval_runtime": 6.379, "eval_samples_per_second": 509.643, "eval_steps_per_second": 0.627, "step": 1425 }, { "epoch": 6.59, "eval_accuracy": 0.9923289591526809, "eval_f1": 0.9566236811254396, "eval_loss": 0.04145730286836624, "eval_precision": 0.952, "eval_recall": 0.9612924941097274, "eval_runtime": 6.1372, "eval_samples_per_second": 529.721, "eval_steps_per_second": 0.652, "step": 1450 }, { "epoch": 6.7, "eval_accuracy": 0.9925236556208871, "eval_f1": 0.9576590928146222, "eval_loss": 0.03992067277431488, "eval_precision": 0.95421888053467, "eval_recall": 0.9611242006058566, "eval_runtime": 6.4046, "eval_samples_per_second": 507.601, "eval_steps_per_second": 0.625, "step": 1475 }, { "epoch": 6.82, "learning_rate": 1.590909090909091e-05, "loss": 0.0052, "step": 1500 }, { "epoch": 6.82, "eval_accuracy": 0.9920563840971924, "eval_f1": 0.9556468516810598, "eval_loss": 0.0415743812918663, "eval_precision": 0.9522138680033417, "eval_recall": 0.9591046785594076, "eval_runtime": 6.2338, "eval_samples_per_second": 521.515, "eval_steps_per_second": 0.642, "step": 1500 }, { "epoch": 6.93, "eval_accuracy": 0.9919006269226276, "eval_f1": 0.9550439514441188, "eval_loss": 0.04101209715008736, "eval_precision": 0.9501915708812261, "eval_recall": 0.9599461460787614, "eval_runtime": 5.9759, "eval_samples_per_second": 544.016, "eval_steps_per_second": 0.669, "step": 1525 }, { "epoch": 7.05, "eval_accuracy": 0.9920758537440131, "eval_f1": 0.9559832635983264, "eval_loss": 0.040564827620983124, "eval_precision": 0.9507323568575233, "eval_recall": 0.9612924941097274, "eval_runtime": 6.3076, "eval_samples_per_second": 515.41, "eval_steps_per_second": 0.634, "step": 1550 }, { "epoch": 7.16, "eval_accuracy": 0.9922705502122191, "eval_f1": 0.9555388093443858, "eval_loss": 0.039956897497177124, "eval_precision": 0.9508415264122646, "eval_recall": 0.9602827330865029, "eval_runtime": 6.1016, "eval_samples_per_second": 532.811, "eval_steps_per_second": 0.656, "step": 1575 }, { "epoch": 7.27, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.957126109529392, "eval_loss": 0.04024273902177811, "eval_precision": 0.9525, "eval_recall": 0.9617973746213396, "eval_runtime": 6.1018, "eval_samples_per_second": 532.791, "eval_steps_per_second": 0.656, "step": 1600 }, { "epoch": 7.39, "eval_accuracy": 0.9924847163272458, "eval_f1": 0.9591152815013404, "eval_loss": 0.04005241021513939, "eval_precision": 0.954954954954955, "eval_recall": 0.9633120161561763, "eval_runtime": 6.4344, "eval_samples_per_second": 505.253, "eval_steps_per_second": 0.622, "step": 1625 }, { "epoch": 7.5, "eval_accuracy": 0.9927183520890931, "eval_f1": 0.9600535968511849, "eval_loss": 0.039704449474811554, "eval_precision": 0.9554925820970162, "eval_recall": 0.9646583641871423, "eval_runtime": 6.185, "eval_samples_per_second": 525.625, "eval_steps_per_second": 0.647, "step": 1650 }, { "epoch": 7.61, "eval_accuracy": 0.9921732019781161, "eval_f1": 0.956769436997319, "eval_loss": 0.04118635505437851, "eval_precision": 0.9526192859526192, "eval_recall": 0.9609559071019859, "eval_runtime": 6.2989, "eval_samples_per_second": 516.125, "eval_steps_per_second": 0.635, "step": 1675 }, { "epoch": 7.73, "eval_accuracy": 0.9923289591526809, "eval_f1": 0.9573594705537405, "eval_loss": 0.041853681206703186, "eval_precision": 0.9531276063386155, "eval_recall": 0.9616290811174689, "eval_runtime": 6.0836, "eval_samples_per_second": 534.391, "eval_steps_per_second": 0.658, "step": 1700 }, { "epoch": 7.84, "eval_accuracy": 0.9927378217359137, "eval_f1": 0.9588259958071279, "eval_loss": 0.040749866515398026, "eval_precision": 0.9555406986461641, "eval_recall": 0.9621339616290812, "eval_runtime": 6.3737, "eval_samples_per_second": 510.067, "eval_steps_per_second": 0.628, "step": 1725 }, { "epoch": 7.95, "eval_accuracy": 0.9926988824422724, "eval_f1": 0.9589339591015756, "eval_loss": 0.04090812802314758, "eval_precision": 0.9550918196994992, "eval_recall": 0.9628071356445641, "eval_runtime": 6.1325, "eval_samples_per_second": 530.13, "eval_steps_per_second": 0.652, "step": 1750 }, { "epoch": 8.07, "eval_accuracy": 0.9923873680931428, "eval_f1": 0.9567983924983255, "eval_loss": 0.041253186762332916, "eval_precision": 0.9520159946684439, "eval_recall": 0.9616290811174689, "eval_runtime": 6.1524, "eval_samples_per_second": 528.415, "eval_steps_per_second": 0.65, "step": 1775 }, { "epoch": 8.18, "eval_accuracy": 0.9922510805653986, "eval_f1": 0.95546626485853, "eval_loss": 0.041376810520887375, "eval_precision": 0.9505329780146569, "eval_recall": 0.9604510265903736, "eval_runtime": 6.3306, "eval_samples_per_second": 513.537, "eval_steps_per_second": 0.632, "step": 1800 }, { "epoch": 8.3, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.957309401996142, "eval_loss": 0.04096854478120804, "eval_precision": 0.9541882628323023, "eval_recall": 0.9604510265903736, "eval_runtime": 6.092, "eval_samples_per_second": 533.646, "eval_steps_per_second": 0.657, "step": 1825 }, { "epoch": 8.41, "eval_accuracy": 0.9924457770336046, "eval_f1": 0.9576093343406362, "eval_loss": 0.04169493913650513, "eval_precision": 0.9552838720482332, "eval_recall": 0.9599461460787614, "eval_runtime": 6.3572, "eval_samples_per_second": 511.386, "eval_steps_per_second": 0.629, "step": 1850 }, { "epoch": 8.52, "eval_accuracy": 0.9923289591526809, "eval_f1": 0.9575574568025499, "eval_loss": 0.04175976663827896, "eval_precision": 0.954515050167224, "eval_recall": 0.9606193200942443, "eval_runtime": 6.2169, "eval_samples_per_second": 522.929, "eval_steps_per_second": 0.643, "step": 1875 }, { "epoch": 8.64, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.958001508927823, "eval_loss": 0.04138173907995224, "eval_precision": 0.9544012026056455, "eval_recall": 0.9616290811174689, "eval_runtime": 6.4751, "eval_samples_per_second": 502.077, "eval_steps_per_second": 0.618, "step": 1900 }, { "epoch": 8.75, "eval_accuracy": 0.9925236556208871, "eval_f1": 0.9587386782958739, "eval_loss": 0.04193359240889549, "eval_precision": 0.9555332664660648, "eval_recall": 0.9619656681252103, "eval_runtime": 6.1398, "eval_samples_per_second": 529.492, "eval_steps_per_second": 0.651, "step": 1925 }, { "epoch": 8.86, "eval_accuracy": 0.9925625949145283, "eval_f1": 0.9577393929230252, "eval_loss": 0.04151003435254097, "eval_precision": 0.9543783422459893, "eval_recall": 0.9611242006058566, "eval_runtime": 6.1314, "eval_samples_per_second": 530.223, "eval_steps_per_second": 0.652, "step": 1950 }, { "epoch": 8.98, "eval_accuracy": 0.9926210038549901, "eval_f1": 0.9576590928146222, "eval_loss": 0.041335199028253555, "eval_precision": 0.95421888053467, "eval_recall": 0.9611242006058566, "eval_runtime": 6.4106, "eval_samples_per_second": 507.128, "eval_steps_per_second": 0.624, "step": 1975 }, { "epoch": 9.09, "learning_rate": 4.5454545454545455e-06, "loss": 0.0027, "step": 2000 }, { "epoch": 9.09, "eval_accuracy": 0.9926599431486313, "eval_f1": 0.9590143324113654, "eval_loss": 0.0412251353263855, "eval_precision": 0.9552512940390716, "eval_recall": 0.9628071356445641, "eval_runtime": 6.2732, "eval_samples_per_second": 518.239, "eval_steps_per_second": 0.638, "step": 2000 }, { "epoch": 9.2, "eval_accuracy": 0.9926599431486313, "eval_f1": 0.9591819629536502, "eval_loss": 0.04075352102518082, "eval_precision": 0.955418266822508, "eval_recall": 0.9629754291484349, "eval_runtime": 6.2741, "eval_samples_per_second": 518.162, "eval_steps_per_second": 0.638, "step": 2025 }, { "epoch": 9.32, "eval_accuracy": 0.9926210038549901, "eval_f1": 0.9579070937447594, "eval_loss": 0.040350958704948425, "eval_precision": 0.9545454545454546, "eval_recall": 0.9612924941097274, "eval_runtime": 6.0983, "eval_samples_per_second": 533.103, "eval_steps_per_second": 0.656, "step": 2050 }, { "epoch": 9.43, "eval_accuracy": 0.9926404735018107, "eval_f1": 0.9587317564167085, "eval_loss": 0.040736954659223557, "eval_precision": 0.955685618729097, "eval_recall": 0.9617973746213396, "eval_runtime": 6.0517, "eval_samples_per_second": 537.203, "eval_steps_per_second": 0.661, "step": 2075 }, { "epoch": 9.55, "eval_accuracy": 0.9926015342081694, "eval_f1": 0.9584905660377357, "eval_loss": 0.04098973423242569, "eval_precision": 0.9552064181848571, "eval_recall": 0.9617973746213396, "eval_runtime": 6.3854, "eval_samples_per_second": 509.128, "eval_steps_per_second": 0.626, "step": 2100 }, { "epoch": 9.66, "eval_accuracy": 0.9925041859740664, "eval_f1": 0.9585778970316955, "eval_loss": 0.04119739308953285, "eval_precision": 0.9552139037433155, "eval_recall": 0.9619656681252103, "eval_runtime": 6.1845, "eval_samples_per_second": 525.672, "eval_steps_per_second": 0.647, "step": 2125 }, { "epoch": 9.77, "eval_accuracy": 0.9924847163272458, "eval_f1": 0.9589064072458906, "eval_loss": 0.04128846526145935, "eval_precision": 0.9557004346372451, "eval_recall": 0.9621339616290812, "eval_runtime": 6.444, "eval_samples_per_second": 504.5, "eval_steps_per_second": 0.621, "step": 2150 }, { "epoch": 9.89, "eval_accuracy": 0.9925041859740664, "eval_f1": 0.9589064072458906, "eval_loss": 0.04132496938109398, "eval_precision": 0.9557004346372451, "eval_recall": 0.9621339616290812, "eval_runtime": 6.0985, "eval_samples_per_second": 533.086, "eval_steps_per_second": 0.656, "step": 2175 }, { "epoch": 10.0, "eval_accuracy": 0.9925041859740664, "eval_f1": 0.9589064072458906, "eval_loss": 0.041328806430101395, "eval_precision": 0.9557004346372451, "eval_recall": 0.9621339616290812, "eval_runtime": 6.1664, "eval_samples_per_second": 527.211, "eval_steps_per_second": 0.649, "step": 2200 }, { "epoch": 10.0, "step": 2200, "total_flos": 4144211411102244.0, "train_loss": 0.022697925716638565, "train_runtime": 1311.4885, "train_samples_per_second": 107.069, "train_steps_per_second": 1.677 } ], "max_steps": 2200, "num_train_epochs": 10, "total_flos": 4144211411102244.0, "trial_name": null, "trial_params": null }