{ "best_metric": 0.9571847507331379, "best_model_checkpoint": "twitter-roberta-base-CoNLL/checkpoint-2000", "epoch": 10.0, "global_step": 2200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.11, "eval_accuracy": 0.9385927339278065, "eval_f1": 0.6587314799400699, "eval_loss": 0.2062799483537674, "eval_precision": 0.6516798418972332, "eval_recall": 0.6659373948165601, "eval_runtime": 5.976, "eval_samples_per_second": 544.011, "eval_steps_per_second": 0.669, "step": 25 }, { "epoch": 0.23, "eval_accuracy": 0.9771231649857871, "eval_f1": 0.8565321055660609, "eval_loss": 0.08096875995397568, "eval_precision": 0.8373251888763864, "eval_recall": 0.8766408616627398, "eval_runtime": 6.2407, "eval_samples_per_second": 520.938, "eval_steps_per_second": 0.641, "step": 50 }, { "epoch": 0.34, "eval_accuracy": 0.9826914839764807, "eval_f1": 0.8996990972918756, "eval_loss": 0.06511491537094116, "eval_precision": 0.8937230156094321, "eval_recall": 0.9057556378323797, "eval_runtime": 6.0069, "eval_samples_per_second": 541.208, "eval_steps_per_second": 0.666, "step": 75 }, { "epoch": 0.45, "eval_accuracy": 0.9849110237140298, "eval_f1": 0.907388833166165, "eval_loss": 0.05366199463605881, "eval_precision": 0.9013616738625041, "eval_recall": 0.9134971390104342, "eval_runtime": 6.3828, "eval_samples_per_second": 509.335, "eval_steps_per_second": 0.627, "step": 100 }, { "epoch": 0.57, "eval_accuracy": 0.986682761574705, "eval_f1": 0.9170283806343906, "eval_loss": 0.04637985676527023, "eval_precision": 0.9097383239483272, "eval_recall": 0.924436216762033, "eval_runtime": 6.0475, "eval_samples_per_second": 537.576, "eval_steps_per_second": 0.661, "step": 125 }, { "epoch": 0.68, "eval_accuracy": 0.9884544994353802, "eval_f1": 0.9296410942859533, "eval_loss": 0.042301442474126816, "eval_precision": 0.9243054400266179, "eval_recall": 0.9350387075058902, "eval_runtime": 6.0733, "eval_samples_per_second": 535.298, "eval_steps_per_second": 0.659, "step": 150 }, { "epoch": 0.8, "eval_accuracy": 0.9899731318873876, "eval_f1": 0.934277384423157, "eval_loss": 0.038059305399656296, "eval_precision": 0.9249546429160481, "eval_recall": 0.9437899697071693, "eval_runtime": 6.3028, "eval_samples_per_second": 515.805, "eval_steps_per_second": 0.635, "step": 175 }, { "epoch": 0.91, "eval_accuracy": 0.9895642693041549, "eval_f1": 0.9354220481626531, "eval_loss": 0.038840554654598236, "eval_precision": 0.9263904934807724, "eval_recall": 0.9446314372265231, "eval_runtime": 6.0497, "eval_samples_per_second": 537.384, "eval_steps_per_second": 0.661, "step": 200 }, { "epoch": 1.02, "eval_accuracy": 0.9898368443596434, "eval_f1": 0.9384409501505521, "eval_loss": 0.03943933546543121, "eval_precision": 0.9328234120385767, "eval_recall": 0.9441265567149109, "eval_runtime": 6.4439, "eval_samples_per_second": 504.505, "eval_steps_per_second": 0.621, "step": 225 }, { "epoch": 1.14, "eval_accuracy": 0.9895837389509754, "eval_f1": 0.9402710389827672, "eval_loss": 0.042259786278009415, "eval_precision": 0.9347970725216235, "eval_recall": 0.9458094917536183, "eval_runtime": 6.16, "eval_samples_per_second": 527.761, "eval_steps_per_second": 0.649, "step": 250 }, { "epoch": 1.25, "eval_accuracy": 0.9892138156613839, "eval_f1": 0.9354757720311323, "eval_loss": 0.04323225095868111, "eval_precision": 0.9304145163975363, "eval_recall": 0.9405923931336251, "eval_runtime": 6.3592, "eval_samples_per_second": 511.225, "eval_steps_per_second": 0.629, "step": 275 }, { "epoch": 1.36, "eval_accuracy": 0.9900899497683112, "eval_f1": 0.9432760787599497, "eval_loss": 0.03824295476078987, "eval_precision": 0.9392624728850325, "eval_recall": 0.9473241332884551, "eval_runtime": 6.1034, "eval_samples_per_second": 532.654, "eval_steps_per_second": 0.655, "step": 300 }, { "epoch": 1.48, "eval_accuracy": 0.99005101047467, "eval_f1": 0.9414020171709594, "eval_loss": 0.0380987711250782, "eval_precision": 0.932617671345995, "eval_recall": 0.9503534163581285, "eval_runtime": 6.1204, "eval_samples_per_second": 531.176, "eval_steps_per_second": 0.654, "step": 325 }, { "epoch": 1.59, "eval_accuracy": 0.9902262372960554, "eval_f1": 0.9429309339331834, "eval_loss": 0.03868376836180687, "eval_precision": 0.933674311169774, "eval_recall": 0.9523729384045776, "eval_runtime": 6.3273, "eval_samples_per_second": 513.801, "eval_steps_per_second": 0.632, "step": 350 }, { "epoch": 1.7, "eval_accuracy": 0.990148358708773, "eval_f1": 0.9439181825802665, "eval_loss": 0.03645554929971695, "eval_precision": 0.9403708034073827, "eval_recall": 0.9474924267923258, "eval_runtime": 6.2492, "eval_samples_per_second": 520.224, "eval_steps_per_second": 0.64, "step": 375 }, { "epoch": 1.82, "eval_accuracy": 0.9905182819983646, "eval_f1": 0.9473948735131512, "eval_loss": 0.0382225401699543, "eval_precision": 0.9431287525016678, "eval_recall": 0.9516997643890945, "eval_runtime": 6.4588, "eval_samples_per_second": 503.348, "eval_steps_per_second": 0.619, "step": 400 }, { "epoch": 1.93, "eval_accuracy": 0.9903235855301585, "eval_f1": 0.9460837582546184, "eval_loss": 0.03733981028199196, "eval_precision": 0.9398770968277694, "eval_recall": 0.9523729384045776, "eval_runtime": 6.1594, "eval_samples_per_second": 527.813, "eval_steps_per_second": 0.649, "step": 425 }, { "epoch": 2.05, "eval_accuracy": 0.9910439624625209, "eval_f1": 0.9497365559923059, "eval_loss": 0.03666611388325691, "eval_precision": 0.943973399833749, "eval_recall": 0.9555705149781218, "eval_runtime": 6.4014, "eval_samples_per_second": 507.859, "eval_steps_per_second": 0.625, "step": 450 }, { "epoch": 2.16, "eval_accuracy": 0.99069350881975, "eval_f1": 0.9474914433592119, "eval_loss": 0.03960287570953369, "eval_precision": 0.9400364419413616, "eval_recall": 0.9550656344665096, "eval_runtime": 6.2344, "eval_samples_per_second": 521.465, "eval_steps_per_second": 0.642, "step": 475 }, { "epoch": 2.27, "learning_rate": 4.636363636363636e-05, "loss": 0.0771, "step": 500 }, { "epoch": 2.27, "eval_accuracy": 0.991238658930727, "eval_f1": 0.9507813152836967, "eval_loss": 0.035283163189888, "eval_precision": 0.9442323651452282, "eval_recall": 0.9574217435207001, "eval_runtime": 6.1631, "eval_samples_per_second": 527.493, "eval_steps_per_second": 0.649, "step": 500 }, { "epoch": 2.39, "eval_accuracy": 0.9905572212920057, "eval_f1": 0.9453602209020165, "eval_loss": 0.03937030956149101, "eval_precision": 0.9400898652021967, "eval_recall": 0.9506900033658701, "eval_runtime": 6.243, "eval_samples_per_second": 520.742, "eval_steps_per_second": 0.641, "step": 525 }, { "epoch": 2.5, "eval_accuracy": 0.9909660838752385, "eval_f1": 0.9484536082474228, "eval_loss": 0.036998968571424484, "eval_precision": 0.9447320086825848, "eval_recall": 0.9522046449007069, "eval_runtime": 6.0773, "eval_samples_per_second": 534.945, "eval_steps_per_second": 0.658, "step": 550 }, { "epoch": 2.61, "eval_accuracy": 0.9908492659943149, "eval_f1": 0.9472013366750209, "eval_loss": 0.035233963280916214, "eval_precision": 0.940444591904446, "eval_recall": 0.9540558734432851, "eval_runtime": 6.3038, "eval_samples_per_second": 515.72, "eval_steps_per_second": 0.635, "step": 575 }, { "epoch": 2.73, "eval_accuracy": 0.9908103267006737, "eval_f1": 0.9448281601065159, "eval_loss": 0.0385683998465538, "eval_precision": 0.9344855967078189, "eval_recall": 0.9554022214742511, "eval_runtime": 6.1499, "eval_samples_per_second": 528.629, "eval_steps_per_second": 0.65, "step": 600 }, { "epoch": 2.84, "eval_accuracy": 0.9916280518671391, "eval_f1": 0.9501544627202138, "eval_loss": 0.036591168493032455, "eval_precision": 0.9428334714167357, "eval_recall": 0.9575900370245709, "eval_runtime": 6.1996, "eval_samples_per_second": 524.389, "eval_steps_per_second": 0.645, "step": 625 }, { "epoch": 2.95, "eval_accuracy": 0.9913360071648301, "eval_f1": 0.948574295509658, "eval_loss": 0.035347189754247665, "eval_precision": 0.9426624563736081, "eval_recall": 0.9545607539548974, "eval_runtime": 6.4287, "eval_samples_per_second": 505.702, "eval_steps_per_second": 0.622, "step": 650 }, { "epoch": 3.07, "eval_accuracy": 0.9911023714029827, "eval_f1": 0.9477730425336343, "eval_loss": 0.035899706184864044, "eval_precision": 0.9412448132780084, "eval_recall": 0.9543924604510265, "eval_runtime": 6.1591, "eval_samples_per_second": 527.837, "eval_steps_per_second": 0.649, "step": 675 }, { "epoch": 3.18, "eval_accuracy": 0.9919979751567306, "eval_f1": 0.9534164087981936, "eval_loss": 0.0355631485581398, "eval_precision": 0.9476309226932669, "eval_recall": 0.9592729720632783, "eval_runtime": 6.1923, "eval_samples_per_second": 525.005, "eval_steps_per_second": 0.646, "step": 700 }, { "epoch": 3.3, "eval_accuracy": 0.9918422179821658, "eval_f1": 0.953465015065283, "eval_loss": 0.03445196524262428, "eval_precision": 0.9483849483849484, "eval_recall": 0.9585997980477954, "eval_runtime": 6.3335, "eval_samples_per_second": 513.302, "eval_steps_per_second": 0.632, "step": 725 }, { "epoch": 3.41, "eval_accuracy": 0.9915696429266773, "eval_f1": 0.9491893698813304, "eval_loss": 0.03445504605770111, "eval_precision": 0.9427290836653387, "eval_recall": 0.9557388084819926, "eval_runtime": 6.1661, "eval_samples_per_second": 527.234, "eval_steps_per_second": 0.649, "step": 750 }, { "epoch": 3.52, "eval_accuracy": 0.9913944161052919, "eval_f1": 0.9478246374395733, "eval_loss": 0.03635535016655922, "eval_precision": 0.9389035667107001, "eval_recall": 0.9569168630090878, "eval_runtime": 6.4373, "eval_samples_per_second": 505.028, "eval_steps_per_second": 0.621, "step": 775 }, { "epoch": 3.64, "eval_accuracy": 0.9914917643393949, "eval_f1": 0.95067189717052, "eval_loss": 0.03599384054541588, "eval_precision": 0.943036926643484, "eval_recall": 0.9584315045439246, "eval_runtime": 6.1546, "eval_samples_per_second": 528.219, "eval_steps_per_second": 0.65, "step": 800 }, { "epoch": 3.75, "eval_accuracy": 0.9914528250457537, "eval_f1": 0.950514945993469, "eval_loss": 0.03866244852542877, "eval_precision": 0.9458423596067322, "eval_recall": 0.9552339279703803, "eval_runtime": 6.3798, "eval_samples_per_second": 509.575, "eval_steps_per_second": 0.627, "step": 825 }, { "epoch": 3.86, "eval_accuracy": 0.9917059304544216, "eval_f1": 0.9521419009370816, "eval_loss": 0.034695982933044434, "eval_precision": 0.9467554076539102, "eval_recall": 0.9575900370245709, "eval_runtime": 6.175, "eval_samples_per_second": 526.482, "eval_steps_per_second": 0.648, "step": 850 }, { "epoch": 3.98, "eval_accuracy": 0.9915307036330361, "eval_f1": 0.9509402423735897, "eval_loss": 0.03567422926425934, "eval_precision": 0.9445459073551387, "eval_recall": 0.9574217435207001, "eval_runtime": 6.2028, "eval_samples_per_second": 524.119, "eval_steps_per_second": 0.645, "step": 875 }, { "epoch": 4.09, "eval_accuracy": 0.9918032786885246, "eval_f1": 0.9520702634880803, "eval_loss": 0.03815401718020439, "eval_precision": 0.9464493597206054, "eval_recall": 0.9577583305284416, "eval_runtime": 6.4111, "eval_samples_per_second": 507.091, "eval_steps_per_second": 0.624, "step": 900 }, { "epoch": 4.2, "eval_accuracy": 0.9917643393948834, "eval_f1": 0.9518385124382277, "eval_loss": 0.03912338241934776, "eval_precision": 0.9474737368684342, "eval_recall": 0.9562436889936049, "eval_runtime": 6.1023, "eval_samples_per_second": 532.748, "eval_steps_per_second": 0.655, "step": 925 }, { "epoch": 4.32, "eval_accuracy": 0.9911802499902652, "eval_f1": 0.9506493506493505, "eval_loss": 0.0428401380777359, "eval_precision": 0.9466043717670616, "eval_recall": 0.9547290474587681, "eval_runtime": 6.3492, "eval_samples_per_second": 512.03, "eval_steps_per_second": 0.63, "step": 950 }, { "epoch": 4.43, "eval_accuracy": 0.9913360071648301, "eval_f1": 0.9506028131279304, "eval_loss": 0.04035865515470505, "eval_precision": 0.9458513828723759, "eval_recall": 0.9554022214742511, "eval_runtime": 6.1625, "eval_samples_per_second": 527.542, "eval_steps_per_second": 0.649, "step": 975 }, { "epoch": 4.55, "learning_rate": 3.2727272727272725e-05, "loss": 0.0118, "step": 1000 }, { "epoch": 4.55, "eval_accuracy": 0.9908687356411354, "eval_f1": 0.9461397365349341, "eval_loss": 0.04028761386871338, "eval_precision": 0.9375413086582948, "eval_recall": 0.9548973409626389, "eval_runtime": 6.261, "eval_samples_per_second": 519.243, "eval_steps_per_second": 0.639, "step": 1000 }, { "epoch": 4.66, "eval_accuracy": 0.9919200965694482, "eval_f1": 0.9533852205205458, "eval_loss": 0.036938250064849854, "eval_precision": 0.9482270684201765, "eval_recall": 0.9585997980477954, "eval_runtime": 6.1962, "eval_samples_per_second": 524.674, "eval_steps_per_second": 0.646, "step": 1025 }, { "epoch": 4.77, "eval_accuracy": 0.9918032786885246, "eval_f1": 0.9520227348712804, "eval_loss": 0.037420712411403656, "eval_precision": 0.9456991032879442, "eval_recall": 0.9584315045439246, "eval_runtime": 5.9766, "eval_samples_per_second": 543.958, "eval_steps_per_second": 0.669, "step": 1050 }, { "epoch": 4.89, "eval_accuracy": 0.9922900198590398, "eval_f1": 0.9538745387453874, "eval_loss": 0.035940222442150116, "eval_precision": 0.9506853895018389, "eval_recall": 0.9570851565129586, "eval_runtime": 6.2768, "eval_samples_per_second": 517.943, "eval_steps_per_second": 0.637, "step": 1075 }, { "epoch": 5.0, "eval_accuracy": 0.9919006269226276, "eval_f1": 0.9523093627328155, "eval_loss": 0.03730743005871773, "eval_precision": 0.9452827060189023, "eval_recall": 0.9594412655671491, "eval_runtime": 6.0853, "eval_samples_per_second": 534.236, "eval_steps_per_second": 0.657, "step": 1100 }, { "epoch": 5.11, "eval_accuracy": 0.9923873680931428, "eval_f1": 0.9546215673141327, "eval_loss": 0.037039875984191895, "eval_precision": 0.9498500499833389, "eval_recall": 0.9594412655671491, "eval_runtime": 6.3128, "eval_samples_per_second": 514.986, "eval_steps_per_second": 0.634, "step": 1125 }, { "epoch": 5.23, "eval_accuracy": 0.9922316109185779, "eval_f1": 0.9555313625324512, "eval_loss": 0.038839343935251236, "eval_precision": 0.9509918319719953, "eval_recall": 0.9601144395826321, "eval_runtime": 6.1584, "eval_samples_per_second": 527.897, "eval_steps_per_second": 0.65, "step": 1150 }, { "epoch": 5.34, "eval_accuracy": 0.9919785055099101, "eval_f1": 0.9522212908633696, "eval_loss": 0.03950090706348419, "eval_precision": 0.948563794255177, "eval_recall": 0.9559071019858634, "eval_runtime": 6.084, "eval_samples_per_second": 534.349, "eval_steps_per_second": 0.657, "step": 1175 }, { "epoch": 5.45, "eval_accuracy": 0.9923678984463222, "eval_f1": 0.9542866711319491, "eval_loss": 0.03910110890865326, "eval_precision": 0.949516827724092, "eval_recall": 0.9591046785594076, "eval_runtime": 6.3281, "eval_samples_per_second": 513.744, "eval_steps_per_second": 0.632, "step": 1200 }, { "epoch": 5.57, "eval_accuracy": 0.9923289591526809, "eval_f1": 0.9552313883299799, "eval_loss": 0.037824589759111404, "eval_precision": 0.9517206815903776, "eval_recall": 0.9587680915516661, "eval_runtime": 6.1901, "eval_samples_per_second": 525.192, "eval_steps_per_second": 0.646, "step": 1225 }, { "epoch": 5.68, "eval_accuracy": 0.9923678984463222, "eval_f1": 0.956470785200067, "eval_loss": 0.038752481341362, "eval_precision": 0.9515323117921386, "eval_recall": 0.9614607876135981, "eval_runtime": 6.178, "eval_samples_per_second": 526.219, "eval_steps_per_second": 0.647, "step": 1250 }, { "epoch": 5.8, "eval_accuracy": 0.9924457770336046, "eval_f1": 0.9560485558811219, "eval_loss": 0.03838498517870903, "eval_precision": 0.9511910711311011, "eval_recall": 0.9609559071019859, "eval_runtime": 6.3664, "eval_samples_per_second": 510.65, "eval_steps_per_second": 0.628, "step": 1275 }, { "epoch": 5.91, "eval_accuracy": 0.9924068377399634, "eval_f1": 0.9571045576407506, "eval_loss": 0.03946718946099281, "eval_precision": 0.9529529529529529, "eval_recall": 0.9612924941097274, "eval_runtime": 6.1196, "eval_samples_per_second": 531.242, "eval_steps_per_second": 0.654, "step": 1300 }, { "epoch": 6.02, "eval_accuracy": 0.9919200965694482, "eval_f1": 0.9533869885982562, "eval_loss": 0.04075756296515465, "eval_precision": 0.9498830604744404, "eval_recall": 0.9569168630090878, "eval_runtime": 6.1927, "eval_samples_per_second": 524.974, "eval_steps_per_second": 0.646, "step": 1325 }, { "epoch": 6.14, "eval_accuracy": 0.9921732019781161, "eval_f1": 0.9547998997409975, "eval_loss": 0.04120802879333496, "eval_precision": 0.948067031690725, "eval_recall": 0.9616290811174689, "eval_runtime": 6.3552, "eval_samples_per_second": 511.548, "eval_steps_per_second": 0.629, "step": 1350 }, { "epoch": 6.25, "eval_accuracy": 0.9923873680931428, "eval_f1": 0.9555667337357477, "eval_loss": 0.0413355678319931, "eval_precision": 0.952054794520548, "eval_recall": 0.9591046785594076, "eval_runtime": 6.2847, "eval_samples_per_second": 517.288, "eval_steps_per_second": 0.636, "step": 1375 }, { "epoch": 6.36, "eval_accuracy": 0.9917448697480628, "eval_f1": 0.9525004181301221, "eval_loss": 0.04124680161476135, "eval_precision": 0.9466422872340425, "eval_recall": 0.9584315045439246, "eval_runtime": 6.4524, "eval_samples_per_second": 503.841, "eval_steps_per_second": 0.62, "step": 1400 }, { "epoch": 6.48, "eval_accuracy": 0.9920953233908337, "eval_f1": 0.9555611348229978, "eval_loss": 0.040540654212236404, "eval_precision": 0.9503912102547029, "eval_recall": 0.9607876135981152, "eval_runtime": 6.1266, "eval_samples_per_second": 530.638, "eval_steps_per_second": 0.653, "step": 1425 }, { "epoch": 6.59, "eval_accuracy": 0.9925041859740664, "eval_f1": 0.9565508580996233, "eval_loss": 0.04004018381237984, "eval_precision": 0.9516908212560387, "eval_recall": 0.9614607876135981, "eval_runtime": 6.4161, "eval_samples_per_second": 506.697, "eval_steps_per_second": 0.623, "step": 1450 }, { "epoch": 6.7, "eval_accuracy": 0.9922900198590398, "eval_f1": 0.9551813688531458, "eval_loss": 0.039815619587898254, "eval_precision": 0.9509591326105088, "eval_recall": 0.9594412655671491, "eval_runtime": 6.2578, "eval_samples_per_second": 519.511, "eval_steps_per_second": 0.639, "step": 1475 }, { "epoch": 6.82, "learning_rate": 1.909090909090909e-05, "loss": 0.0049, "step": 1500 }, { "epoch": 6.82, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.956871283812076, "eval_loss": 0.03951007500290871, "eval_precision": 0.9523253875645941, "eval_recall": 0.9614607876135981, "eval_runtime": 6.2854, "eval_samples_per_second": 517.232, "eval_steps_per_second": 0.636, "step": 1500 }, { "epoch": 6.93, "eval_accuracy": 0.9927183520890931, "eval_f1": 0.9571476397723468, "eval_loss": 0.03918459266424179, "eval_precision": 0.952047952047952, "eval_recall": 0.9623022551329519, "eval_runtime": 6.1825, "eval_samples_per_second": 525.837, "eval_steps_per_second": 0.647, "step": 1525 }, { "epoch": 7.05, "eval_accuracy": 0.9923484287995016, "eval_f1": 0.9551738583996647, "eval_loss": 0.03897989168763161, "eval_precision": 0.9511096278992157, "eval_recall": 0.9592729720632783, "eval_runtime": 6.0468, "eval_samples_per_second": 537.641, "eval_steps_per_second": 0.662, "step": 1550 }, { "epoch": 7.16, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.9565363034921699, "eval_loss": 0.03931865468621254, "eval_precision": 0.9519919986664445, "eval_recall": 0.9611242006058566, "eval_runtime": 6.2528, "eval_samples_per_second": 519.93, "eval_steps_per_second": 0.64, "step": 1575 }, { "epoch": 7.27, "eval_accuracy": 0.9925236556208871, "eval_f1": 0.9562233196618398, "eval_loss": 0.03892602398991585, "eval_precision": 0.9512073272273106, "eval_recall": 0.9612924941097274, "eval_runtime": 6.0818, "eval_samples_per_second": 534.544, "eval_steps_per_second": 0.658, "step": 1600 }, { "epoch": 7.39, "eval_accuracy": 0.9923678984463222, "eval_f1": 0.9565435820145692, "eval_loss": 0.0404973067343235, "eval_precision": 0.9518413597733711, "eval_recall": 0.9612924941097274, "eval_runtime": 6.1086, "eval_samples_per_second": 532.197, "eval_steps_per_second": 0.655, "step": 1625 }, { "epoch": 7.5, "eval_accuracy": 0.9924847163272458, "eval_f1": 0.9558737335677803, "eval_loss": 0.04104885458946228, "eval_precision": 0.9511748041993001, "eval_recall": 0.9606193200942443, "eval_runtime": 6.3603, "eval_samples_per_second": 511.14, "eval_steps_per_second": 0.629, "step": 1650 }, { "epoch": 7.61, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.9569442117607639, "eval_loss": 0.04079214483499527, "eval_precision": 0.95263509006004, "eval_recall": 0.9612924941097274, "eval_runtime": 6.0876, "eval_samples_per_second": 534.04, "eval_steps_per_second": 0.657, "step": 1675 }, { "epoch": 7.73, "eval_accuracy": 0.9921732019781161, "eval_f1": 0.9545302574389837, "eval_loss": 0.043598320335149765, "eval_precision": 0.9481899701095982, "eval_recall": 0.9609559071019859, "eval_runtime": 6.3314, "eval_samples_per_second": 513.469, "eval_steps_per_second": 0.632, "step": 1700 }, { "epoch": 7.84, "eval_accuracy": 0.9924068377399634, "eval_f1": 0.9559548683660676, "eval_loss": 0.0419035442173481, "eval_precision": 0.9495268138801262, "eval_recall": 0.9624705486368226, "eval_runtime": 6.237, "eval_samples_per_second": 521.246, "eval_steps_per_second": 0.641, "step": 1725 }, { "epoch": 7.95, "eval_accuracy": 0.9925625949145283, "eval_f1": 0.957126109529392, "eval_loss": 0.04293340817093849, "eval_precision": 0.9525, "eval_recall": 0.9617973746213396, "eval_runtime": 6.1487, "eval_samples_per_second": 528.734, "eval_steps_per_second": 0.651, "step": 1750 }, { "epoch": 8.07, "eval_accuracy": 0.9924068377399634, "eval_f1": 0.9561506276150629, "eval_loss": 0.041886329650878906, "eval_precision": 0.9508988015978695, "eval_recall": 0.9614607876135981, "eval_runtime": 6.3754, "eval_samples_per_second": 509.93, "eval_steps_per_second": 0.627, "step": 1775 }, { "epoch": 8.18, "eval_accuracy": 0.9922900198590398, "eval_f1": 0.9555313625324512, "eval_loss": 0.04220963269472122, "eval_precision": 0.9509918319719953, "eval_recall": 0.9601144395826321, "eval_runtime": 6.1129, "eval_samples_per_second": 531.828, "eval_steps_per_second": 0.654, "step": 1800 }, { "epoch": 8.3, "eval_accuracy": 0.9923873680931428, "eval_f1": 0.9561793045664014, "eval_loss": 0.041702426970005035, "eval_precision": 0.9521107959285834, "eval_recall": 0.9602827330865029, "eval_runtime": 6.3543, "eval_samples_per_second": 511.618, "eval_steps_per_second": 0.629, "step": 1825 }, { "epoch": 8.41, "eval_accuracy": 0.9924652466804252, "eval_f1": 0.9570171763720151, "eval_loss": 0.04150727763772011, "eval_precision": 0.952945102619723, "eval_recall": 0.9611242006058566, "eval_runtime": 6.1032, "eval_samples_per_second": 532.671, "eval_steps_per_second": 0.655, "step": 1850 }, { "epoch": 8.52, "eval_accuracy": 0.9924263073867841, "eval_f1": 0.9566965407488064, "eval_loss": 0.04162871465086937, "eval_precision": 0.952309488077372, "eval_recall": 0.9611242006058566, "eval_runtime": 6.1162, "eval_samples_per_second": 531.542, "eval_steps_per_second": 0.654, "step": 1875 }, { "epoch": 8.64, "eval_accuracy": 0.9922316109185779, "eval_f1": 0.9555611348229978, "eval_loss": 0.04189736768603325, "eval_precision": 0.9503912102547029, "eval_recall": 0.9607876135981152, "eval_runtime": 6.4808, "eval_samples_per_second": 501.634, "eval_steps_per_second": 0.617, "step": 1900 }, { "epoch": 8.75, "eval_accuracy": 0.9923873680931428, "eval_f1": 0.9564489112227805, "eval_loss": 0.04165585711598396, "eval_precision": 0.9519839946648883, "eval_recall": 0.9609559071019859, "eval_runtime": 6.2132, "eval_samples_per_second": 523.242, "eval_steps_per_second": 0.644, "step": 1925 }, { "epoch": 8.86, "eval_accuracy": 0.9926015342081694, "eval_f1": 0.9577818730105546, "eval_loss": 0.041886311024427414, "eval_precision": 0.9534689793195463, "eval_recall": 0.9621339616290812, "eval_runtime": 6.5243, "eval_samples_per_second": 498.291, "eval_steps_per_second": 0.613, "step": 1950 }, { "epoch": 8.98, "eval_accuracy": 0.9926599431486313, "eval_f1": 0.9575341318368372, "eval_loss": 0.04215257614850998, "eval_precision": 0.9531432382858096, "eval_recall": 0.9619656681252103, "eval_runtime": 6.2104, "eval_samples_per_second": 523.476, "eval_steps_per_second": 0.644, "step": 1975 }, { "epoch": 9.09, "learning_rate": 5.4545454545454545e-06, "loss": 0.0022, "step": 2000 }, { "epoch": 9.09, "eval_accuracy": 0.9925820645613489, "eval_f1": 0.9571847507331379, "eval_loss": 0.04227477312088013, "eval_precision": 0.953111963957951, "eval_recall": 0.9612924941097274, "eval_runtime": 6.1893, "eval_samples_per_second": 525.265, "eval_steps_per_second": 0.646, "step": 2000 }, { "epoch": 9.2, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.9567110441262665, "eval_loss": 0.042577099055051804, "eval_precision": 0.9520079986668889, "eval_recall": 0.9614607876135981, "eval_runtime": 6.2434, "eval_samples_per_second": 520.71, "eval_steps_per_second": 0.641, "step": 2025 }, { "epoch": 9.32, "eval_accuracy": 0.9924652466804252, "eval_f1": 0.9560338330123105, "eval_loss": 0.04250513017177582, "eval_precision": 0.9514919153192198, "eval_recall": 0.9606193200942443, "eval_runtime": 5.9913, "eval_samples_per_second": 542.619, "eval_steps_per_second": 0.668, "step": 2050 }, { "epoch": 9.43, "eval_accuracy": 0.9925431252677076, "eval_f1": 0.956463496316142, "eval_loss": 0.0422191396355629, "eval_precision": 0.951682772409197, "eval_recall": 0.9612924941097274, "eval_runtime": 6.2812, "eval_samples_per_second": 517.58, "eval_steps_per_second": 0.637, "step": 2075 }, { "epoch": 9.55, "eval_accuracy": 0.9924847163272458, "eval_f1": 0.9559537765868363, "eval_loss": 0.0423436276614666, "eval_precision": 0.9513333333333334, "eval_recall": 0.9606193200942443, "eval_runtime": 6.0529, "eval_samples_per_second": 537.095, "eval_steps_per_second": 0.661, "step": 2100 }, { "epoch": 9.66, "eval_accuracy": 0.9924652466804252, "eval_f1": 0.9558663428523575, "eval_loss": 0.04235740005970001, "eval_precision": 0.951325220870145, "eval_recall": 0.9604510265903736, "eval_runtime": 6.0731, "eval_samples_per_second": 535.315, "eval_steps_per_second": 0.659, "step": 2125 }, { "epoch": 9.77, "eval_accuracy": 0.9924652466804252, "eval_f1": 0.9566164154103852, "eval_loss": 0.042295120656490326, "eval_precision": 0.9521507169056352, "eval_recall": 0.9611242006058566, "eval_runtime": 6.3348, "eval_samples_per_second": 513.197, "eval_steps_per_second": 0.631, "step": 2150 }, { "epoch": 9.89, "eval_accuracy": 0.9924847163272458, "eval_f1": 0.9567037936521229, "eval_loss": 0.04226445034146309, "eval_precision": 0.9521586931155193, "eval_recall": 0.9612924941097274, "eval_runtime": 6.1145, "eval_samples_per_second": 531.688, "eval_steps_per_second": 0.654, "step": 2175 }, { "epoch": 10.0, "eval_accuracy": 0.9925236556208871, "eval_f1": 0.9570387739720292, "eval_loss": 0.04224075376987457, "eval_precision": 0.952492082013669, "eval_recall": 0.9616290811174689, "eval_runtime": 6.3677, "eval_samples_per_second": 510.543, "eval_steps_per_second": 0.628, "step": 2200 }, { "epoch": 10.0, "step": 2200, "total_flos": 4144211411102244.0, "train_loss": 0.021953743980689482, "train_runtime": 1324.4932, "train_samples_per_second": 106.018, "train_steps_per_second": 1.661 } ], "max_steps": 2200, "num_train_epochs": 10, "total_flos": 4144211411102244.0, "trial_name": null, "trial_params": null }