{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "global_step": 4600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.531720741599073, "eval_f1": 0.022944550669216066, "eval_loss": 1.042980432510376, "eval_precision": 0.013824884792626729, "eval_recall": 0.06741573033707865, "eval_runtime": 2.6201, "eval_samples_per_second": 52.67, "eval_steps_per_second": 4.58, "step": 46 }, { "epoch": 2.0, "eval_accuracy": 0.5824159907300116, "eval_f1": 0.05216284987277353, "eval_loss": 0.9423891305923462, "eval_precision": 0.03637976929902396, "eval_recall": 0.09213483146067415, "eval_runtime": 2.6433, "eval_samples_per_second": 52.207, "eval_steps_per_second": 4.54, "step": 92 }, { "epoch": 3.0, "eval_accuracy": 0.6006662804171495, "eval_f1": 0.06494287432351173, "eval_loss": 0.8916851282119751, "eval_precision": 0.04433497536945813, "eval_recall": 0.12134831460674157, "eval_runtime": 2.6927, "eval_samples_per_second": 51.249, "eval_steps_per_second": 4.456, "step": 138 }, { "epoch": 4.0, "eval_accuracy": 0.6420191193511008, "eval_f1": 0.10659560293137908, "eval_loss": 0.826358437538147, "eval_precision": 0.07575757575757576, "eval_recall": 0.1797752808988764, "eval_runtime": 2.6923, "eval_samples_per_second": 51.257, "eval_steps_per_second": 4.457, "step": 184 }, { "epoch": 5.0, "eval_accuracy": 0.6395567786790266, "eval_f1": 0.17535903250188964, "eval_loss": 0.9059988260269165, "eval_precision": 0.13211845102505695, "eval_recall": 0.2606741573033708, "eval_runtime": 2.718, "eval_samples_per_second": 50.774, "eval_steps_per_second": 4.415, "step": 230 }, { "epoch": 6.0, "eval_accuracy": 0.6408603707995365, "eval_f1": 0.16282420749279541, "eval_loss": 0.9093501567840576, "eval_precision": 0.11983032873807, "eval_recall": 0.2539325842696629, "eval_runtime": 2.7417, "eval_samples_per_second": 50.334, "eval_steps_per_second": 4.377, "step": 276 }, { "epoch": 7.0, "eval_accuracy": 0.6427433371958285, "eval_f1": 0.17168481742472771, "eval_loss": 1.0060389041900635, "eval_precision": 0.12007168458781362, "eval_recall": 0.30112359550561796, "eval_runtime": 2.7409, "eval_samples_per_second": 50.348, "eval_steps_per_second": 4.378, "step": 322 }, { "epoch": 8.0, "eval_accuracy": 0.6558516801853997, "eval_f1": 0.17363344051446947, "eval_loss": 1.1526994705200195, "eval_precision": 0.12162162162162163, "eval_recall": 0.30337078651685395, "eval_runtime": 2.7362, "eval_samples_per_second": 50.435, "eval_steps_per_second": 4.386, "step": 368 }, { "epoch": 9.0, "eval_accuracy": 0.6541859791425261, "eval_f1": 0.16133004926108374, "eval_loss": 1.0466786623001099, "eval_precision": 0.1111111111111111, "eval_recall": 0.2943820224719101, "eval_runtime": 2.7242, "eval_samples_per_second": 50.657, "eval_steps_per_second": 4.405, "step": 414 }, { "epoch": 10.0, "eval_accuracy": 0.6379634994206257, "eval_f1": 0.19889502762430938, "eval_loss": 1.185328722000122, "eval_precision": 0.14356929212362912, "eval_recall": 0.3235955056179775, "eval_runtime": 2.7468, "eval_samples_per_second": 50.24, "eval_steps_per_second": 4.369, "step": 460 }, { "epoch": 10.87, "learning_rate": 1.782608695652174e-05, "loss": 0.5814, "step": 500 }, { "epoch": 11.0, "eval_accuracy": 0.6622972190034763, "eval_f1": 0.24944974321349964, "eval_loss": 1.2020127773284912, "eval_precision": 0.18518518518518517, "eval_recall": 0.38202247191011235, "eval_runtime": 2.7642, "eval_samples_per_second": 49.924, "eval_steps_per_second": 4.341, "step": 506 }, { "epoch": 12.0, "eval_accuracy": 0.6589658169177288, "eval_f1": 0.2267481330617787, "eval_loss": 1.3076611757278442, "eval_precision": 0.16245136186770429, "eval_recall": 0.3752808988764045, "eval_runtime": 2.7844, "eval_samples_per_second": 49.562, "eval_steps_per_second": 4.31, "step": 552 }, { "epoch": 13.0, "eval_accuracy": 0.6307213209733488, "eval_f1": 0.2636015325670498, "eval_loss": 1.294709324836731, "eval_precision": 0.2, "eval_recall": 0.3865168539325843, "eval_runtime": 2.7404, "eval_samples_per_second": 50.358, "eval_steps_per_second": 4.379, "step": 598 }, { "epoch": 14.0, "eval_accuracy": 0.6591830822711472, "eval_f1": 0.3390663390663391, "eval_loss": 1.4205528497695923, "eval_precision": 0.2667525773195876, "eval_recall": 0.4651685393258427, "eval_runtime": 2.7797, "eval_samples_per_second": 49.646, "eval_steps_per_second": 4.317, "step": 644 }, { "epoch": 15.0, "eval_accuracy": 0.6625869061413673, "eval_f1": 0.33782712133227594, "eval_loss": 1.475420355796814, "eval_precision": 0.2610294117647059, "eval_recall": 0.4786516853932584, "eval_runtime": 2.7429, "eval_samples_per_second": 50.312, "eval_steps_per_second": 4.375, "step": 690 }, { "epoch": 16.0, "eval_accuracy": 0.6528099652375434, "eval_f1": 0.3605728727885425, "eval_loss": 1.6823292970657349, "eval_precision": 0.2884097035040431, "eval_recall": 0.48089887640449436, "eval_runtime": 2.7637, "eval_samples_per_second": 49.933, "eval_steps_per_second": 4.342, "step": 736 }, { "epoch": 17.0, "eval_accuracy": 0.662369640787949, "eval_f1": 0.3175832687838885, "eval_loss": 1.6413644552230835, "eval_precision": 0.24231678486997635, "eval_recall": 0.4606741573033708, "eval_runtime": 2.7668, "eval_samples_per_second": 49.877, "eval_steps_per_second": 4.337, "step": 782 }, { "epoch": 18.0, "eval_accuracy": 0.6634559675550405, "eval_f1": 0.2549647661755285, "eval_loss": 1.5539870262145996, "eval_precision": 0.17831541218637992, "eval_recall": 0.44719101123595506, "eval_runtime": 2.7564, "eval_samples_per_second": 50.065, "eval_steps_per_second": 4.353, "step": 828 }, { "epoch": 19.0, "eval_accuracy": 0.65454808806489, "eval_f1": 0.32420429311621024, "eval_loss": 1.7641867399215698, "eval_precision": 0.24172185430463577, "eval_recall": 0.49213483146067416, "eval_runtime": 2.7607, "eval_samples_per_second": 49.987, "eval_steps_per_second": 4.347, "step": 874 }, { "epoch": 20.0, "eval_accuracy": 0.6743192352259559, "eval_f1": 0.29172510518934086, "eval_loss": 1.6112134456634521, "eval_precision": 0.21202854230377166, "eval_recall": 0.46741573033707867, "eval_runtime": 2.7419, "eval_samples_per_second": 50.331, "eval_steps_per_second": 4.377, "step": 920 }, { "epoch": 21.0, "eval_accuracy": 0.6320973348783314, "eval_f1": 0.2980225988700565, "eval_loss": 1.9230778217315674, "eval_precision": 0.21730175077239958, "eval_recall": 0.47415730337078654, "eval_runtime": 2.7602, "eval_samples_per_second": 49.997, "eval_steps_per_second": 4.348, "step": 966 }, { "epoch": 21.74, "learning_rate": 1.565217391304348e-05, "loss": 0.1098, "step": 1000 }, { "epoch": 22.0, "eval_accuracy": 0.6402085747392816, "eval_f1": 0.3536776212832551, "eval_loss": 2.1778900623321533, "eval_precision": 0.27130852340936373, "eval_recall": 0.5078651685393258, "eval_runtime": 2.7589, "eval_samples_per_second": 50.021, "eval_steps_per_second": 4.35, "step": 1012 }, { "epoch": 23.0, "eval_accuracy": 0.6542584009269988, "eval_f1": 0.31053351573187415, "eval_loss": 1.8866859674453735, "eval_precision": 0.2232055063913471, "eval_recall": 0.5101123595505618, "eval_runtime": 2.7457, "eval_samples_per_second": 50.26, "eval_steps_per_second": 4.37, "step": 1058 }, { "epoch": 24.0, "eval_accuracy": 0.6286935110081112, "eval_f1": 0.29891304347826086, "eval_loss": 2.057832956314087, "eval_precision": 0.21421616358325218, "eval_recall": 0.4943820224719101, "eval_runtime": 2.7704, "eval_samples_per_second": 49.813, "eval_steps_per_second": 4.332, "step": 1104 }, { "epoch": 25.0, "eval_accuracy": 0.6264484356894554, "eval_f1": 0.2706571242680546, "eval_loss": 2.031670093536377, "eval_precision": 0.19047619047619047, "eval_recall": 0.46741573033707867, "eval_runtime": 2.7593, "eval_samples_per_second": 50.013, "eval_steps_per_second": 4.349, "step": 1150 }, { "epoch": 26.0, "eval_accuracy": 0.6575898030127463, "eval_f1": 0.34562211981566826, "eval_loss": 1.8547980785369873, "eval_precision": 0.26254375729288215, "eval_recall": 0.5056179775280899, "eval_runtime": 2.745, "eval_samples_per_second": 50.273, "eval_steps_per_second": 4.372, "step": 1196 }, { "epoch": 27.0, "eval_accuracy": 0.6420915411355735, "eval_f1": 0.3376230128690386, "eval_loss": 2.0632588863372803, "eval_precision": 0.2545662100456621, "eval_recall": 0.501123595505618, "eval_runtime": 2.7583, "eval_samples_per_second": 50.03, "eval_steps_per_second": 4.35, "step": 1242 }, { "epoch": 28.0, "eval_accuracy": 0.666787369640788, "eval_f1": 0.36335160532498045, "eval_loss": 1.943156123161316, "eval_precision": 0.27884615384615385, "eval_recall": 0.5213483146067416, "eval_runtime": 2.7624, "eval_samples_per_second": 49.957, "eval_steps_per_second": 4.344, "step": 1288 }, { "epoch": 29.0, "eval_accuracy": 0.6518684820393974, "eval_f1": 0.32880629020729096, "eval_loss": 1.9604640007019043, "eval_precision": 0.24109014675052412, "eval_recall": 0.5168539325842697, "eval_runtime": 2.7551, "eval_samples_per_second": 50.089, "eval_steps_per_second": 4.356, "step": 1334 }, { "epoch": 30.0, "eval_accuracy": 0.6587485515643106, "eval_f1": 0.3465045592705167, "eval_loss": 2.0531818866729736, "eval_precision": 0.2617680826636051, "eval_recall": 0.5123595505617977, "eval_runtime": 2.7577, "eval_samples_per_second": 50.042, "eval_steps_per_second": 4.352, "step": 1380 }, { "epoch": 31.0, "eval_accuracy": 0.6528099652375434, "eval_f1": 0.30739045127534337, "eval_loss": 1.9861180782318115, "eval_precision": 0.21678966789667897, "eval_recall": 0.5280898876404494, "eval_runtime": 2.7639, "eval_samples_per_second": 49.929, "eval_steps_per_second": 4.342, "step": 1426 }, { "epoch": 32.0, "eval_accuracy": 0.6265932792584009, "eval_f1": 0.25979112271540467, "eval_loss": 2.3644657135009766, "eval_precision": 0.18307267709291627, "eval_recall": 0.44719101123595506, "eval_runtime": 2.7617, "eval_samples_per_second": 49.969, "eval_steps_per_second": 4.345, "step": 1472 }, { "epoch": 32.61, "learning_rate": 1.3478260869565218e-05, "loss": 0.0461, "step": 1500 }, { "epoch": 33.0, "eval_accuracy": 0.6571552723059096, "eval_f1": 0.2733908427339084, "eval_loss": 2.0718517303466797, "eval_precision": 0.19397363465160075, "eval_recall": 0.46292134831460674, "eval_runtime": 2.7478, "eval_samples_per_second": 50.223, "eval_steps_per_second": 4.367, "step": 1518 }, { "epoch": 34.0, "eval_accuracy": 0.6454953650057937, "eval_f1": 0.2763246143527833, "eval_loss": 2.050283193588257, "eval_precision": 0.19694072657743786, "eval_recall": 0.46292134831460674, "eval_runtime": 2.7452, "eval_samples_per_second": 50.27, "eval_steps_per_second": 4.371, "step": 1564 }, { "epoch": 35.0, "eval_accuracy": 0.6310110081112399, "eval_f1": 0.26170622193713916, "eval_loss": 2.261981964111328, "eval_precision": 0.18312387791741472, "eval_recall": 0.4584269662921348, "eval_runtime": 2.7577, "eval_samples_per_second": 50.041, "eval_steps_per_second": 4.351, "step": 1610 }, { "epoch": 36.0, "eval_accuracy": 0.6399188876013905, "eval_f1": 0.3131313131313131, "eval_loss": 2.217377185821533, "eval_precision": 0.230605738575983, "eval_recall": 0.48764044943820223, "eval_runtime": 2.7643, "eval_samples_per_second": 49.922, "eval_steps_per_second": 4.341, "step": 1656 }, { "epoch": 37.0, "eval_accuracy": 0.6441917728852838, "eval_f1": 0.314410480349345, "eval_loss": 2.3862390518188477, "eval_precision": 0.232508073196986, "eval_recall": 0.4853932584269663, "eval_runtime": 2.7654, "eval_samples_per_second": 49.903, "eval_steps_per_second": 4.339, "step": 1702 }, { "epoch": 38.0, "eval_accuracy": 0.6550550405561993, "eval_f1": 0.3128571428571429, "eval_loss": 2.0702590942382812, "eval_precision": 0.2293193717277487, "eval_recall": 0.49213483146067416, "eval_runtime": 2.7536, "eval_samples_per_second": 50.116, "eval_steps_per_second": 4.358, "step": 1748 }, { "epoch": 39.0, "eval_accuracy": 0.6577346465816918, "eval_f1": 0.343939393939394, "eval_loss": 2.151489019393921, "eval_precision": 0.25942857142857145, "eval_recall": 0.5101123595505618, "eval_runtime": 2.7686, "eval_samples_per_second": 49.844, "eval_steps_per_second": 4.334, "step": 1794 }, { "epoch": 40.0, "eval_accuracy": 0.647595596755504, "eval_f1": 0.3431151241534989, "eval_loss": 2.1895194053649902, "eval_precision": 0.2579185520361991, "eval_recall": 0.5123595505617977, "eval_runtime": 2.7697, "eval_samples_per_second": 49.825, "eval_steps_per_second": 4.333, "step": 1840 }, { "epoch": 41.0, "eval_accuracy": 0.6629490150637312, "eval_f1": 0.3240810202550638, "eval_loss": 2.175402879714966, "eval_precision": 0.24324324324324326, "eval_recall": 0.4853932584269663, "eval_runtime": 2.7386, "eval_samples_per_second": 50.39, "eval_steps_per_second": 4.382, "step": 1886 }, { "epoch": 42.0, "eval_accuracy": 0.650130359212051, "eval_f1": 0.31381055676066527, "eval_loss": 2.3337295055389404, "eval_precision": 0.23134328358208955, "eval_recall": 0.48764044943820223, "eval_runtime": 2.775, "eval_samples_per_second": 49.729, "eval_steps_per_second": 4.324, "step": 1932 }, { "epoch": 43.0, "eval_accuracy": 0.6625869061413673, "eval_f1": 0.312180889861415, "eval_loss": 2.1595537662506104, "eval_precision": 0.23110151187904968, "eval_recall": 0.48089887640449436, "eval_runtime": 2.7514, "eval_samples_per_second": 50.156, "eval_steps_per_second": 4.361, "step": 1978 }, { "epoch": 43.48, "learning_rate": 1.1304347826086957e-05, "loss": 0.0323, "step": 2000 }, { "epoch": 44.0, "eval_accuracy": 0.6530272305909618, "eval_f1": 0.3159379407616361, "eval_loss": 2.2453536987304688, "eval_precision": 0.2302158273381295, "eval_recall": 0.503370786516854, "eval_runtime": 2.7499, "eval_samples_per_second": 50.184, "eval_steps_per_second": 4.364, "step": 2024 }, { "epoch": 45.0, "eval_accuracy": 0.6525926998841252, "eval_f1": 0.2999299229152067, "eval_loss": 2.1538333892822266, "eval_precision": 0.21792260692464357, "eval_recall": 0.48089887640449436, "eval_runtime": 2.772, "eval_samples_per_second": 49.784, "eval_steps_per_second": 4.329, "step": 2070 }, { "epoch": 46.0, "eval_accuracy": 0.6556344148319815, "eval_f1": 0.2761290322580645, "eval_loss": 2.1632461547851562, "eval_precision": 0.19366515837104073, "eval_recall": 0.48089887640449436, "eval_runtime": 2.7668, "eval_samples_per_second": 49.877, "eval_steps_per_second": 4.337, "step": 2116 }, { "epoch": 47.0, "eval_accuracy": 0.6575898030127463, "eval_f1": 0.2993762993762994, "eval_loss": 2.178040027618408, "eval_precision": 0.21643286573146292, "eval_recall": 0.4853932584269663, "eval_runtime": 2.7774, "eval_samples_per_second": 49.686, "eval_steps_per_second": 4.321, "step": 2162 }, { "epoch": 48.0, "eval_accuracy": 0.6502027809965237, "eval_f1": 0.29047949965253644, "eval_loss": 2.3481132984161377, "eval_precision": 0.21026156941649898, "eval_recall": 0.4696629213483146, "eval_runtime": 2.758, "eval_samples_per_second": 50.036, "eval_steps_per_second": 4.351, "step": 2208 }, { "epoch": 49.0, "eval_accuracy": 0.6594003476245655, "eval_f1": 0.2608695652173913, "eval_loss": 2.1968982219696045, "eval_precision": 0.18452935694315004, "eval_recall": 0.4449438202247191, "eval_runtime": 2.7601, "eval_samples_per_second": 49.997, "eval_steps_per_second": 4.348, "step": 2254 }, { "epoch": 50.0, "eval_accuracy": 0.6613557358053302, "eval_f1": 0.27965540092776675, "eval_loss": 2.1524665355682373, "eval_precision": 0.19830827067669174, "eval_recall": 0.47415730337078654, "eval_runtime": 2.7622, "eval_samples_per_second": 49.96, "eval_steps_per_second": 4.344, "step": 2300 }, { "epoch": 51.0, "eval_accuracy": 0.6413673232908459, "eval_f1": 0.26915647134578236, "eval_loss": 2.244340658187866, "eval_precision": 0.18862815884476533, "eval_recall": 0.4696629213483146, "eval_runtime": 2.7474, "eval_samples_per_second": 50.229, "eval_steps_per_second": 4.368, "step": 2346 }, { "epoch": 52.0, "eval_accuracy": 0.6659907300115875, "eval_f1": 0.29979181124219295, "eval_loss": 2.1262786388397217, "eval_precision": 0.21686746987951808, "eval_recall": 0.4853932584269663, "eval_runtime": 2.7827, "eval_samples_per_second": 49.592, "eval_steps_per_second": 4.312, "step": 2392 }, { "epoch": 53.0, "eval_accuracy": 0.6543308227114716, "eval_f1": 0.27220447284345045, "eval_loss": 2.178636074066162, "eval_precision": 0.19017857142857142, "eval_recall": 0.4786516853932584, "eval_runtime": 2.7405, "eval_samples_per_second": 50.356, "eval_steps_per_second": 4.379, "step": 2438 }, { "epoch": 54.0, "eval_accuracy": 0.6599797219003476, "eval_f1": 0.3191800878477306, "eval_loss": 2.2686634063720703, "eval_precision": 0.23669923995656894, "eval_recall": 0.4898876404494382, "eval_runtime": 2.7587, "eval_samples_per_second": 50.024, "eval_steps_per_second": 4.35, "step": 2484 }, { "epoch": 54.35, "learning_rate": 9.130434782608697e-06, "loss": 0.0289, "step": 2500 }, { "epoch": 55.0, "eval_accuracy": 0.6491164542294322, "eval_f1": 0.3539412673879443, "eval_loss": 2.4480252265930176, "eval_precision": 0.2697290930506478, "eval_recall": 0.5146067415730337, "eval_runtime": 2.7586, "eval_samples_per_second": 50.026, "eval_steps_per_second": 4.35, "step": 2530 }, { "epoch": 56.0, "eval_accuracy": 0.658603707995365, "eval_f1": 0.32152974504249293, "eval_loss": 2.241455078125, "eval_precision": 0.23474663908996898, "eval_recall": 0.5101123595505618, "eval_runtime": 2.7669, "eval_samples_per_second": 49.875, "eval_steps_per_second": 4.337, "step": 2576 }, { "epoch": 57.0, "eval_accuracy": 0.6625144843568945, "eval_f1": 0.33824670287044223, "eval_loss": 2.2077813148498535, "eval_precision": 0.25829383886255924, "eval_recall": 0.4898876404494382, "eval_runtime": 2.7555, "eval_samples_per_second": 50.082, "eval_steps_per_second": 4.355, "step": 2622 }, { "epoch": 58.0, "eval_accuracy": 0.6491164542294322, "eval_f1": 0.30736240171551105, "eval_loss": 2.3162100315093994, "eval_precision": 0.22536687631027252, "eval_recall": 0.48314606741573035, "eval_runtime": 2.7573, "eval_samples_per_second": 50.049, "eval_steps_per_second": 4.352, "step": 2668 }, { "epoch": 59.0, "eval_accuracy": 0.654837775202781, "eval_f1": 0.35776201733648544, "eval_loss": 2.3420791625976562, "eval_precision": 0.27548543689320387, "eval_recall": 0.5101123595505618, "eval_runtime": 2.7605, "eval_samples_per_second": 49.991, "eval_steps_per_second": 4.347, "step": 2714 }, { "epoch": 60.0, "eval_accuracy": 0.6544032444959443, "eval_f1": 0.3475609756097561, "eval_loss": 2.3971171379089355, "eval_precision": 0.2629757785467128, "eval_recall": 0.5123595505617977, "eval_runtime": 2.7631, "eval_samples_per_second": 49.943, "eval_steps_per_second": 4.343, "step": 2760 }, { "epoch": 61.0, "eval_accuracy": 0.6589658169177288, "eval_f1": 0.356979405034325, "eval_loss": 2.2836458683013916, "eval_precision": 0.2702078521939954, "eval_recall": 0.5258426966292135, "eval_runtime": 2.7541, "eval_samples_per_second": 50.107, "eval_steps_per_second": 4.357, "step": 2806 }, { "epoch": 62.0, "eval_accuracy": 0.6542584009269988, "eval_f1": 0.35784685367702807, "eval_loss": 2.3359830379486084, "eval_precision": 0.2700228832951945, "eval_recall": 0.5303370786516854, "eval_runtime": 2.7479, "eval_samples_per_second": 50.22, "eval_steps_per_second": 4.367, "step": 2852 }, { "epoch": 63.0, "eval_accuracy": 0.6491164542294322, "eval_f1": 0.36519036519036524, "eval_loss": 2.386730194091797, "eval_precision": 0.27909738717339666, "eval_recall": 0.5280898876404494, "eval_runtime": 2.7514, "eval_samples_per_second": 50.155, "eval_steps_per_second": 4.361, "step": 2898 }, { "epoch": 64.0, "eval_accuracy": 0.6441917728852838, "eval_f1": 0.35186595582635183, "eval_loss": 2.383052349090576, "eval_precision": 0.2661290322580645, "eval_recall": 0.5191011235955056, "eval_runtime": 2.7602, "eval_samples_per_second": 49.996, "eval_steps_per_second": 4.347, "step": 2944 }, { "epoch": 65.0, "eval_accuracy": 0.6536790266512167, "eval_f1": 0.3841166936790924, "eval_loss": 2.5153658390045166, "eval_precision": 0.30038022813688214, "eval_recall": 0.5325842696629214, "eval_runtime": 2.7644, "eval_samples_per_second": 49.92, "eval_steps_per_second": 4.341, "step": 2990 }, { "epoch": 65.22, "learning_rate": 6.956521739130435e-06, "loss": 0.0147, "step": 3000 }, { "epoch": 66.0, "eval_accuracy": 0.664904403244496, "eval_f1": 0.37846655791190864, "eval_loss": 2.3971505165100098, "eval_precision": 0.2970550576184379, "eval_recall": 0.5213483146067416, "eval_runtime": 2.7665, "eval_samples_per_second": 49.882, "eval_steps_per_second": 4.338, "step": 3036 }, { "epoch": 67.0, "eval_accuracy": 0.6633835457705678, "eval_f1": 0.36391912908242613, "eval_loss": 2.3396737575531006, "eval_precision": 0.27824019024970276, "eval_recall": 0.5258426966292135, "eval_runtime": 2.7947, "eval_samples_per_second": 49.379, "eval_steps_per_second": 4.294, "step": 3082 }, { "epoch": 68.0, "eval_accuracy": 0.6564310544611819, "eval_f1": 0.35294117647058826, "eval_loss": 2.459906816482544, "eval_precision": 0.269185360094451, "eval_recall": 0.5123595505617977, "eval_runtime": 2.748, "eval_samples_per_second": 50.218, "eval_steps_per_second": 4.367, "step": 3128 }, { "epoch": 69.0, "eval_accuracy": 0.6593279258400927, "eval_f1": 0.36205533596837947, "eval_loss": 2.3763880729675293, "eval_precision": 0.27926829268292686, "eval_recall": 0.5146067415730337, "eval_runtime": 2.7664, "eval_samples_per_second": 49.884, "eval_steps_per_second": 4.338, "step": 3174 }, { "epoch": 70.0, "eval_accuracy": 0.654837775202781, "eval_f1": 0.3348148148148148, "eval_loss": 2.368340492248535, "eval_precision": 0.24972375690607734, "eval_recall": 0.5078651685393258, "eval_runtime": 2.7667, "eval_samples_per_second": 49.878, "eval_steps_per_second": 4.337, "step": 3220 }, { "epoch": 71.0, "eval_accuracy": 0.6617902665121669, "eval_f1": 0.32901751713632904, "eval_loss": 2.3155479431152344, "eval_precision": 0.2488479262672811, "eval_recall": 0.4853932584269663, "eval_runtime": 2.7611, "eval_samples_per_second": 49.981, "eval_steps_per_second": 4.346, "step": 3266 }, { "epoch": 72.0, "eval_accuracy": 0.6662804171494786, "eval_f1": 0.3543307086614173, "eval_loss": 2.3285837173461914, "eval_precision": 0.2727272727272727, "eval_recall": 0.5056179775280899, "eval_runtime": 2.7664, "eval_samples_per_second": 49.885, "eval_steps_per_second": 4.338, "step": 3312 }, { "epoch": 73.0, "eval_accuracy": 0.6607763615295481, "eval_f1": 0.33206397562833206, "eval_loss": 2.3957254886627197, "eval_precision": 0.2511520737327189, "eval_recall": 0.4898876404494382, "eval_runtime": 2.7653, "eval_samples_per_second": 49.905, "eval_steps_per_second": 4.34, "step": 3358 }, { "epoch": 74.0, "eval_accuracy": 0.6594727694090382, "eval_f1": 0.3111432706222865, "eval_loss": 2.3470306396484375, "eval_precision": 0.2294557097118463, "eval_recall": 0.48314606741573035, "eval_runtime": 2.7615, "eval_samples_per_second": 49.973, "eval_steps_per_second": 4.345, "step": 3404 }, { "epoch": 75.0, "eval_accuracy": 0.6536066048667439, "eval_f1": 0.32770022042615726, "eval_loss": 2.451366424560547, "eval_precision": 0.24344978165938866, "eval_recall": 0.501123595505618, "eval_runtime": 2.7612, "eval_samples_per_second": 49.977, "eval_steps_per_second": 4.346, "step": 3450 }, { "epoch": 76.0, "eval_accuracy": 0.659545191193511, "eval_f1": 0.3306152705707932, "eval_loss": 2.346513271331787, "eval_precision": 0.24668141592920353, "eval_recall": 0.501123595505618, "eval_runtime": 2.7429, "eval_samples_per_second": 50.311, "eval_steps_per_second": 4.375, "step": 3496 }, { "epoch": 76.09, "learning_rate": 4.782608695652174e-06, "loss": 0.0156, "step": 3500 }, { "epoch": 77.0, "eval_accuracy": 0.6538238702201622, "eval_f1": 0.3167746580273578, "eval_loss": 2.42856502532959, "eval_precision": 0.2330508474576271, "eval_recall": 0.4943820224719101, "eval_runtime": 2.7674, "eval_samples_per_second": 49.867, "eval_steps_per_second": 4.336, "step": 3542 }, { "epoch": 78.0, "eval_accuracy": 0.6603418308227115, "eval_f1": 0.336559940431869, "eval_loss": 2.3454573154449463, "eval_precision": 0.2516703786191537, "eval_recall": 0.5078651685393258, "eval_runtime": 2.7701, "eval_samples_per_second": 49.818, "eval_steps_per_second": 4.332, "step": 3588 }, { "epoch": 79.0, "eval_accuracy": 0.655489571263036, "eval_f1": 0.3257520176082172, "eval_loss": 2.332895040512085, "eval_precision": 0.24183006535947713, "eval_recall": 0.49887640449438203, "eval_runtime": 2.7724, "eval_samples_per_second": 49.776, "eval_steps_per_second": 4.328, "step": 3634 }, { "epoch": 80.0, "eval_accuracy": 0.6509269988412515, "eval_f1": 0.3096960926193922, "eval_loss": 2.4176864624023438, "eval_precision": 0.22838847385272146, "eval_recall": 0.48089887640449436, "eval_runtime": 2.7816, "eval_samples_per_second": 49.612, "eval_steps_per_second": 4.314, "step": 3680 }, { "epoch": 81.0, "eval_accuracy": 0.663311123986095, "eval_f1": 0.31703703703703706, "eval_loss": 2.322171926498413, "eval_precision": 0.23646408839779007, "eval_recall": 0.48089887640449436, "eval_runtime": 2.7495, "eval_samples_per_second": 50.191, "eval_steps_per_second": 4.364, "step": 3726 }, { "epoch": 82.0, "eval_accuracy": 0.6552723059096176, "eval_f1": 0.3291512915129151, "eval_loss": 2.358896493911743, "eval_precision": 0.24505494505494504, "eval_recall": 0.501123595505618, "eval_runtime": 2.7748, "eval_samples_per_second": 49.733, "eval_steps_per_second": 4.325, "step": 3772 }, { "epoch": 83.0, "eval_accuracy": 0.6573001158748552, "eval_f1": 0.3404907975460122, "eval_loss": 2.3836281299591064, "eval_precision": 0.25844004656577413, "eval_recall": 0.49887640449438203, "eval_runtime": 2.7586, "eval_samples_per_second": 50.025, "eval_steps_per_second": 4.35, "step": 3818 }, { "epoch": 84.0, "eval_accuracy": 0.6519409038238703, "eval_f1": 0.35154394299287417, "eval_loss": 2.417782783508301, "eval_precision": 0.2713936430317848, "eval_recall": 0.49887640449438203, "eval_runtime": 2.751, "eval_samples_per_second": 50.164, "eval_steps_per_second": 4.362, "step": 3864 }, { "epoch": 85.0, "eval_accuracy": 0.6506373117033604, "eval_f1": 0.35266084193804603, "eval_loss": 2.494265079498291, "eval_precision": 0.2727272727272727, "eval_recall": 0.49887640449438203, "eval_runtime": 2.791, "eval_samples_per_second": 49.444, "eval_steps_per_second": 4.299, "step": 3910 }, { "epoch": 86.0, "eval_accuracy": 0.6568655851680185, "eval_f1": 0.34029389017788086, "eval_loss": 2.3840575218200684, "eval_precision": 0.25943396226415094, "eval_recall": 0.4943820224719101, "eval_runtime": 2.7591, "eval_samples_per_second": 50.016, "eval_steps_per_second": 4.349, "step": 3956 }, { "epoch": 86.96, "learning_rate": 2.6086956521739132e-06, "loss": 0.0172, "step": 4000 }, { "epoch": 87.0, "eval_accuracy": 0.6472334878331402, "eval_f1": 0.3413498836307215, "eval_loss": 2.444718599319458, "eval_precision": 0.26066350710900477, "eval_recall": 0.4943820224719101, "eval_runtime": 2.7661, "eval_samples_per_second": 49.89, "eval_steps_per_second": 4.338, "step": 4002 }, { "epoch": 88.0, "eval_accuracy": 0.6479577056778679, "eval_f1": 0.36450079239302696, "eval_loss": 2.4771909713745117, "eval_precision": 0.28151774785801714, "eval_recall": 0.5168539325842697, "eval_runtime": 2.7594, "eval_samples_per_second": 50.01, "eval_steps_per_second": 4.349, "step": 4048 }, { "epoch": 89.0, "eval_accuracy": 0.6564310544611819, "eval_f1": 0.36450839328537166, "eval_loss": 2.3940951824188232, "eval_precision": 0.28287841191067, "eval_recall": 0.5123595505617977, "eval_runtime": 2.766, "eval_samples_per_second": 49.892, "eval_steps_per_second": 4.338, "step": 4094 }, { "epoch": 90.0, "eval_accuracy": 0.664904403244496, "eval_f1": 0.36421725239616615, "eval_loss": 2.3723766803741455, "eval_precision": 0.2825278810408922, "eval_recall": 0.5123595505617977, "eval_runtime": 2.7724, "eval_samples_per_second": 49.776, "eval_steps_per_second": 4.328, "step": 4140 }, { "epoch": 91.0, "eval_accuracy": 0.6589658169177288, "eval_f1": 0.35759493670886083, "eval_loss": 2.412285566329956, "eval_precision": 0.27594627594627597, "eval_recall": 0.5078651685393258, "eval_runtime": 2.7583, "eval_samples_per_second": 50.03, "eval_steps_per_second": 4.35, "step": 4186 }, { "epoch": 92.0, "eval_accuracy": 0.6568655851680185, "eval_f1": 0.3537735849056604, "eval_loss": 2.4169280529022217, "eval_precision": 0.2720677146311971, "eval_recall": 0.5056179775280899, "eval_runtime": 2.7606, "eval_samples_per_second": 49.989, "eval_steps_per_second": 4.347, "step": 4232 }, { "epoch": 93.0, "eval_accuracy": 0.6580243337195828, "eval_f1": 0.34843749999999996, "eval_loss": 2.4057414531707764, "eval_precision": 0.26706586826347306, "eval_recall": 0.501123595505618, "eval_runtime": 2.7672, "eval_samples_per_second": 49.87, "eval_steps_per_second": 4.337, "step": 4278 }, { "epoch": 94.0, "eval_accuracy": 0.6558516801853997, "eval_f1": 0.34493426140757927, "eval_loss": 2.417436361312866, "eval_precision": 0.26297169811320753, "eval_recall": 0.501123595505618, "eval_runtime": 2.7713, "eval_samples_per_second": 49.796, "eval_steps_per_second": 4.33, "step": 4324 }, { "epoch": 95.0, "eval_accuracy": 0.6587485515643106, "eval_f1": 0.3555555555555556, "eval_loss": 2.4058446884155273, "eval_precision": 0.2748466257668712, "eval_recall": 0.503370786516854, "eval_runtime": 2.7567, "eval_samples_per_second": 50.06, "eval_steps_per_second": 4.353, "step": 4370 }, { "epoch": 96.0, "eval_accuracy": 0.6549101969872537, "eval_f1": 0.3468118195956454, "eval_loss": 2.423997163772583, "eval_precision": 0.26516052318668254, "eval_recall": 0.501123595505618, "eval_runtime": 2.7522, "eval_samples_per_second": 50.142, "eval_steps_per_second": 4.36, "step": 4416 }, { "epoch": 97.0, "eval_accuracy": 0.6596900347624566, "eval_f1": 0.3534956794972506, "eval_loss": 2.406991720199585, "eval_precision": 0.2717391304347826, "eval_recall": 0.5056179775280899, "eval_runtime": 2.765, "eval_samples_per_second": 49.91, "eval_steps_per_second": 4.34, "step": 4462 }, { "epoch": 97.83, "learning_rate": 4.347826086956522e-07, "loss": 0.0106, "step": 4500 }, { "epoch": 98.0, "eval_accuracy": 0.6607763615295481, "eval_f1": 0.34850863422292, "eval_loss": 2.402587413787842, "eval_precision": 0.2677925211097708, "eval_recall": 0.49887640449438203, "eval_runtime": 2.7737, "eval_samples_per_second": 49.753, "eval_steps_per_second": 4.326, "step": 4508 }, { "epoch": 99.0, "eval_accuracy": 0.6622247972190035, "eval_f1": 0.35062893081761004, "eval_loss": 2.4004111289978027, "eval_precision": 0.26964933494558646, "eval_recall": 0.501123595505618, "eval_runtime": 2.7443, "eval_samples_per_second": 50.286, "eval_steps_per_second": 4.373, "step": 4554 }, { "epoch": 100.0, "eval_accuracy": 0.6621523754345308, "eval_f1": 0.35035349567949725, "eval_loss": 2.4005491733551025, "eval_precision": 0.2693236714975845, "eval_recall": 0.501123595505618, "eval_runtime": 2.749, "eval_samples_per_second": 50.2, "eval_steps_per_second": 4.365, "step": 4600 } ], "max_steps": 4600, "num_train_epochs": 100, "total_flos": 8533183236037200.0, "trial_name": null, "trial_params": null }