diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,6016 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 500.0, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "eval_accuracy": 0.45396600566572237, + "eval_f1": 0.01754385964912281, + "eval_loss": 0.7190675735473633, + "eval_precision": 0.012232415902140673, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.214, + "eval_steps_per_second": 10.354, + "step": 2 + }, + { + "epoch": 2.0, + "eval_accuracy": 0.45396600566572237, + "eval_f1": 0.01754385964912281, + "eval_loss": 0.7185351252555847, + "eval_precision": 0.012232415902140673, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.471, + "eval_steps_per_second": 10.441, + "step": 4 + }, + { + "epoch": 3.0, + "eval_accuracy": 0.45538243626062325, + "eval_f1": 0.017621145374449337, + "eval_loss": 0.7175477743148804, + "eval_precision": 0.012307692307692308, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.846, + "eval_steps_per_second": 10.456, + "step": 6 + }, + { + "epoch": 4.0, + "eval_accuracy": 0.4603399433427762, + "eval_f1": 0.0178173719376392, + "eval_loss": 0.7160851359367371, + "eval_precision": 0.0125, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.395, + "eval_steps_per_second": 10.4, + "step": 8 + }, + { + "epoch": 5.0, + "eval_accuracy": 0.46388101983002833, + "eval_f1": 0.017777777777777778, + "eval_loss": 0.7141746282577515, + "eval_precision": 0.012461059190031152, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.199, + "eval_steps_per_second": 10.354, + "step": 10 + }, + { + "epoch": 6.0, + "eval_accuracy": 0.476628895184136, + "eval_f1": 0.017797552836484983, + "eval_loss": 0.7118393182754517, + "eval_precision": 0.0124804992199688, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.613, + "eval_steps_per_second": 10.408, + "step": 12 + }, + { + "epoch": 7.0, + "eval_accuracy": 0.48371104815864024, + "eval_f1": 0.01797752808988764, + "eval_loss": 0.7090863585472107, + "eval_precision": 0.012658227848101266, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.244, + "eval_steps_per_second": 10.509, + "step": 14 + }, + { + "epoch": 8.0, + "eval_accuracy": 0.4943342776203966, + "eval_f1": 0.017937219730941704, + "eval_loss": 0.706073522567749, + "eval_precision": 0.012618296529968454, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.101, + "eval_steps_per_second": 10.465, + "step": 16 + }, + { + "epoch": 9.0, + "eval_accuracy": 0.5, + "eval_f1": 0.017937219730941704, + "eval_loss": 0.7027165293693542, + "eval_precision": 0.012618296529968454, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.213, + "eval_steps_per_second": 10.431, + "step": 18 + }, + { + "epoch": 10.0, + "eval_accuracy": 0.5056657223796034, + "eval_f1": 0.01791713325867861, + "eval_loss": 0.6989853382110596, + "eval_precision": 0.012598425196850394, + "eval_recall": 0.031007751937984496, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.566, + "eval_steps_per_second": 10.445, + "step": 20 + }, + { + "epoch": 11.0, + "eval_accuracy": 0.5134560906515581, + "eval_f1": 0.020134228187919462, + "eval_loss": 0.6949517726898193, + "eval_precision": 0.014150943396226415, + "eval_recall": 0.03488372093023256, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.801, + "eval_steps_per_second": 10.262, + "step": 22 + }, + { + "epoch": 12.0, + "eval_accuracy": 0.5226628895184136, + "eval_f1": 0.02252252252252252, + "eval_loss": 0.6908299922943115, + "eval_precision": 0.015873015873015872, + "eval_recall": 0.03875968992248062, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.659, + "eval_steps_per_second": 10.448, + "step": 24 + }, + { + "epoch": 13.0, + "eval_accuracy": 0.5375354107648725, + "eval_f1": 0.02711864406779661, + "eval_loss": 0.6863293051719666, + "eval_precision": 0.019138755980861243, + "eval_recall": 0.046511627906976744, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.704, + "eval_steps_per_second": 10.45, + "step": 26 + }, + { + "epoch": 14.0, + "eval_accuracy": 0.5524079320113314, + "eval_f1": 0.02531645569620253, + "eval_loss": 0.6815844774246216, + "eval_precision": 0.01800327332242226, + "eval_recall": 0.04263565891472868, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.22, + "eval_steps_per_second": 10.432, + "step": 28 + }, + { + "epoch": 15.0, + "eval_accuracy": 0.5793201133144475, + "eval_f1": 0.02790697674418605, + "eval_loss": 0.6764630079269409, + "eval_precision": 0.019933554817275746, + "eval_recall": 0.046511627906976744, + "eval_runtime": 0.1983, + "eval_samples_per_second": 262.168, + "eval_steps_per_second": 10.083, + "step": 30 + }, + { + "epoch": 16.0, + "eval_accuracy": 0.589943342776204, + "eval_f1": 0.026410564225690273, + "eval_loss": 0.6708706617355347, + "eval_precision": 0.019130434782608695, + "eval_recall": 0.04263565891472868, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.854, + "eval_steps_per_second": 10.264, + "step": 32 + }, + { + "epoch": 17.0, + "eval_accuracy": 0.6062322946175638, + "eval_f1": 0.026634382566585957, + "eval_loss": 0.6652079820632935, + "eval_precision": 0.01936619718309859, + "eval_recall": 0.04263565891472868, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.778, + "eval_steps_per_second": 10.376, + "step": 34 + }, + { + "epoch": 18.0, + "eval_accuracy": 0.6175637393767706, + "eval_f1": 0.024906600249066, + "eval_loss": 0.6591846942901611, + "eval_precision": 0.01834862385321101, + "eval_recall": 0.03875968992248062, + "eval_runtime": 0.1924, + "eval_samples_per_second": 270.301, + "eval_steps_per_second": 10.396, + "step": 36 + }, + { + "epoch": 19.0, + "eval_accuracy": 0.6345609065155807, + "eval_f1": 0.028025477707006374, + "eval_loss": 0.6527013778686523, + "eval_precision": 0.020872865275142316, + "eval_recall": 0.04263565891472868, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.99, + "eval_steps_per_second": 10.384, + "step": 38 + }, + { + "epoch": 20.0, + "eval_accuracy": 0.6536827195467422, + "eval_f1": 0.03743315508021391, + "eval_loss": 0.6457828283309937, + "eval_precision": 0.02857142857142857, + "eval_recall": 0.05426356589147287, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.029, + "eval_steps_per_second": 10.424, + "step": 40 + }, + { + "epoch": 21.0, + "eval_accuracy": 0.6657223796033994, + "eval_f1": 0.0326530612244898, + "eval_loss": 0.6385125517845154, + "eval_precision": 0.025157232704402517, + "eval_recall": 0.046511627906976744, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.093, + "eval_steps_per_second": 10.427, + "step": 42 + }, + { + "epoch": 22.0, + "eval_accuracy": 0.6841359773371105, + "eval_f1": 0.03888888888888889, + "eval_loss": 0.6314576864242554, + "eval_precision": 0.030303030303030304, + "eval_recall": 0.05426356589147287, + "eval_runtime": 0.1931, + "eval_samples_per_second": 269.344, + "eval_steps_per_second": 10.359, + "step": 44 + }, + { + "epoch": 23.0, + "eval_accuracy": 0.6926345609065155, + "eval_f1": 0.03977272727272728, + "eval_loss": 0.6241943836212158, + "eval_precision": 0.03139013452914798, + "eval_recall": 0.05426356589147287, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.395, + "eval_steps_per_second": 10.515, + "step": 46 + }, + { + "epoch": 24.0, + "eval_accuracy": 0.7096317280453258, + "eval_f1": 0.050445103857566766, + "eval_loss": 0.6164193749427795, + "eval_precision": 0.040865384615384616, + "eval_recall": 0.06589147286821706, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.651, + "eval_steps_per_second": 10.371, + "step": 48 + }, + { + "epoch": 25.0, + "eval_accuracy": 0.7273371104815864, + "eval_f1": 0.053973013493253376, + "eval_loss": 0.6084094047546387, + "eval_precision": 0.044009779951100246, + "eval_recall": 0.06976744186046512, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.214, + "eval_steps_per_second": 10.47, + "step": 50 + }, + { + "epoch": 26.0, + "eval_accuracy": 0.7407932011331445, + "eval_f1": 0.05581395348837209, + "eval_loss": 0.6001141667366028, + "eval_precision": 0.046511627906976744, + "eval_recall": 0.06976744186046512, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.284, + "eval_steps_per_second": 10.434, + "step": 52 + }, + { + "epoch": 27.0, + "eval_accuracy": 0.7471671388101983, + "eval_f1": 0.05778491171749598, + "eval_loss": 0.5918445587158203, + "eval_precision": 0.049315068493150684, + "eval_recall": 0.06976744186046512, + "eval_runtime": 0.1899, + "eval_samples_per_second": 273.835, + "eval_steps_per_second": 10.532, + "step": 54 + }, + { + "epoch": 28.0, + "eval_accuracy": 0.7528328611898017, + "eval_f1": 0.06988352745424294, + "eval_loss": 0.5830296874046326, + "eval_precision": 0.061224489795918366, + "eval_recall": 0.08139534883720931, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.728, + "eval_steps_per_second": 10.374, + "step": 56 + }, + { + "epoch": 29.0, + "eval_accuracy": 0.7648725212464589, + "eval_f1": 0.08275862068965517, + "eval_loss": 0.5733291506767273, + "eval_precision": 0.07453416149068323, + "eval_recall": 0.09302325581395349, + "eval_runtime": 0.1893, + "eval_samples_per_second": 274.728, + "eval_steps_per_second": 10.566, + "step": 58 + }, + { + "epoch": 30.0, + "eval_accuracy": 0.773371104815864, + "eval_f1": 0.08376963350785341, + "eval_loss": 0.5631821155548096, + "eval_precision": 0.0761904761904762, + "eval_recall": 0.09302325581395349, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.547, + "eval_steps_per_second": 10.483, + "step": 60 + }, + { + "epoch": 31.0, + "eval_accuracy": 0.7776203966005666, + "eval_f1": 0.09424083769633508, + "eval_loss": 0.5525625348091125, + "eval_precision": 0.08571428571428572, + "eval_recall": 0.10465116279069768, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.262, + "eval_steps_per_second": 10.51, + "step": 62 + }, + { + "epoch": 32.0, + "eval_accuracy": 0.7889518413597734, + "eval_f1": 0.1107142857142857, + "eval_loss": 0.5411368012428284, + "eval_precision": 0.10264900662251655, + "eval_recall": 0.12015503875968993, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.658, + "eval_steps_per_second": 10.448, + "step": 64 + }, + { + "epoch": 33.0, + "eval_accuracy": 0.7988668555240793, + "eval_f1": 0.11567164179104478, + "eval_loss": 0.5295829176902771, + "eval_precision": 0.11151079136690648, + "eval_recall": 0.12015503875968993, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.075, + "eval_steps_per_second": 10.503, + "step": 66 + }, + { + "epoch": 34.0, + "eval_accuracy": 0.8045325779036827, + "eval_f1": 0.13152804642166346, + "eval_loss": 0.5174781084060669, + "eval_precision": 0.13127413127413126, + "eval_recall": 0.13178294573643412, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.083, + "eval_steps_per_second": 10.503, + "step": 68 + }, + { + "epoch": 35.0, + "eval_accuracy": 0.8080736543909348, + "eval_f1": 0.13999999999999999, + "eval_loss": 0.5051134824752808, + "eval_precision": 0.1446280991735537, + "eval_recall": 0.13565891472868216, + "eval_runtime": 0.1896, + "eval_samples_per_second": 274.199, + "eval_steps_per_second": 10.546, + "step": 70 + }, + { + "epoch": 36.0, + "eval_accuracy": 0.8101983002832861, + "eval_f1": 0.1294363256784969, + "eval_loss": 0.4926650822162628, + "eval_precision": 0.14027149321266968, + "eval_recall": 0.12015503875968993, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.301, + "eval_steps_per_second": 10.473, + "step": 72 + }, + { + "epoch": 37.0, + "eval_accuracy": 0.8137393767705382, + "eval_f1": 0.1564482029598309, + "eval_loss": 0.4799807667732239, + "eval_precision": 0.17209302325581396, + "eval_recall": 0.1434108527131783, + "eval_runtime": 0.1898, + "eval_samples_per_second": 274.018, + "eval_steps_per_second": 10.539, + "step": 74 + }, + { + "epoch": 38.0, + "eval_accuracy": 0.8151558073654391, + "eval_f1": 0.15578947368421053, + "eval_loss": 0.46721795201301575, + "eval_precision": 0.17050691244239632, + "eval_recall": 0.1434108527131783, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.058, + "eval_steps_per_second": 10.502, + "step": 76 + }, + { + "epoch": 39.0, + "eval_accuracy": 0.8222379603399433, + "eval_f1": 0.1694915254237288, + "eval_loss": 0.45428818464279175, + "eval_precision": 0.18691588785046728, + "eval_recall": 0.15503875968992248, + "eval_runtime": 0.1894, + "eval_samples_per_second": 274.546, + "eval_steps_per_second": 10.559, + "step": 78 + }, + { + "epoch": 40.0, + "eval_accuracy": 0.8279036827195467, + "eval_f1": 0.18415417558886507, + "eval_loss": 0.442182332277298, + "eval_precision": 0.20574162679425836, + "eval_recall": 0.16666666666666666, + "eval_runtime": 0.1899, + "eval_samples_per_second": 273.899, + "eval_steps_per_second": 10.535, + "step": 80 + }, + { + "epoch": 41.0, + "eval_accuracy": 0.8328611898016998, + "eval_f1": 0.18064516129032257, + "eval_loss": 0.4300879240036011, + "eval_precision": 0.2028985507246377, + "eval_recall": 0.16279069767441862, + "eval_runtime": 0.1899, + "eval_samples_per_second": 273.884, + "eval_steps_per_second": 10.534, + "step": 82 + }, + { + "epoch": 42.0, + "eval_accuracy": 0.8335694050991501, + "eval_f1": 0.18181818181818182, + "eval_loss": 0.41832053661346436, + "eval_precision": 0.20588235294117646, + "eval_recall": 0.16279069767441862, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.181, + "eval_steps_per_second": 10.315, + "step": 84 + }, + { + "epoch": 43.0, + "eval_accuracy": 0.839943342776204, + "eval_f1": 0.18843683083511778, + "eval_loss": 0.40713071823120117, + "eval_precision": 0.21052631578947367, + "eval_recall": 0.17054263565891473, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.938, + "eval_steps_per_second": 10.421, + "step": 86 + }, + { + "epoch": 44.0, + "eval_accuracy": 0.8470254957507082, + "eval_f1": 0.19742489270386268, + "eval_loss": 0.39543262124061584, + "eval_precision": 0.22115384615384615, + "eval_recall": 0.17829457364341086, + "eval_runtime": 0.1888, + "eval_samples_per_second": 275.394, + "eval_steps_per_second": 10.592, + "step": 88 + }, + { + "epoch": 45.0, + "eval_accuracy": 0.8512747875354107, + "eval_f1": 0.2012847965738758, + "eval_loss": 0.38278087973594666, + "eval_precision": 0.22488038277511962, + "eval_recall": 0.1821705426356589, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.564, + "eval_steps_per_second": 10.522, + "step": 90 + }, + { + "epoch": 46.0, + "eval_accuracy": 0.8661473087818697, + "eval_f1": 0.2629310344827586, + "eval_loss": 0.370393306016922, + "eval_precision": 0.2961165048543689, + "eval_recall": 0.2364341085271318, + "eval_runtime": 0.1894, + "eval_samples_per_second": 274.622, + "eval_steps_per_second": 10.562, + "step": 92 + }, + { + "epoch": 47.0, + "eval_accuracy": 0.8682719546742209, + "eval_f1": 0.26898047722342733, + "eval_loss": 0.35816633701324463, + "eval_precision": 0.3054187192118227, + "eval_recall": 0.24031007751937986, + "eval_runtime": 0.1892, + "eval_samples_per_second": 274.795, + "eval_steps_per_second": 10.569, + "step": 94 + }, + { + "epoch": 48.0, + "eval_accuracy": 0.8654390934844193, + "eval_f1": 0.26495726495726496, + "eval_loss": 0.3456425368785858, + "eval_precision": 0.29523809523809524, + "eval_recall": 0.24031007751937986, + "eval_runtime": 0.1896, + "eval_samples_per_second": 274.243, + "eval_steps_per_second": 10.548, + "step": 96 + }, + { + "epoch": 49.0, + "eval_accuracy": 0.8703966005665722, + "eval_f1": 0.27015250544662306, + "eval_loss": 0.3332156538963318, + "eval_precision": 0.30845771144278605, + "eval_recall": 0.24031007751937986, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.247, + "eval_steps_per_second": 10.317, + "step": 98 + }, + { + "epoch": 50.0, + "eval_accuracy": 0.8739376770538244, + "eval_f1": 0.29694323144104806, + "eval_loss": 0.321566104888916, + "eval_precision": 0.34, + "eval_recall": 0.26356589147286824, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.499, + "eval_steps_per_second": 10.481, + "step": 100 + }, + { + "epoch": 51.0, + "eval_accuracy": 0.8796033994334278, + "eval_f1": 0.30042918454935624, + "eval_loss": 0.3097538650035858, + "eval_precision": 0.33653846153846156, + "eval_recall": 0.2713178294573643, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.754, + "eval_steps_per_second": 10.491, + "step": 102 + }, + { + "epoch": 52.0, + "eval_accuracy": 0.8852691218130312, + "eval_f1": 0.3177966101694915, + "eval_loss": 0.29793235659599304, + "eval_precision": 0.35046728971962615, + "eval_recall": 0.29069767441860467, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.675, + "eval_steps_per_second": 10.488, + "step": 104 + }, + { + "epoch": 53.0, + "eval_accuracy": 0.8916430594900849, + "eval_f1": 0.351931330472103, + "eval_loss": 0.2854478657245636, + "eval_precision": 0.3942307692307692, + "eval_recall": 0.3178294573643411, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.444, + "eval_steps_per_second": 10.517, + "step": 106 + }, + { + "epoch": 54.0, + "eval_accuracy": 0.8994334277620396, + "eval_f1": 0.3836206896551724, + "eval_loss": 0.27312982082366943, + "eval_precision": 0.4320388349514563, + "eval_recall": 0.3449612403100775, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.685, + "eval_steps_per_second": 10.488, + "step": 108 + }, + { + "epoch": 55.0, + "eval_accuracy": 0.9065155807365439, + "eval_f1": 0.3803418803418804, + "eval_loss": 0.26105964183807373, + "eval_precision": 0.4238095238095238, + "eval_recall": 0.3449612403100775, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.166, + "eval_steps_per_second": 10.506, + "step": 110 + }, + { + "epoch": 56.0, + "eval_accuracy": 0.9114730878186968, + "eval_f1": 0.41188959660297236, + "eval_loss": 0.24857781827449799, + "eval_precision": 0.45539906103286387, + "eval_recall": 0.375968992248062, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.447, + "eval_steps_per_second": 10.402, + "step": 112 + }, + { + "epoch": 57.0, + "eval_accuracy": 0.9178470254957507, + "eval_f1": 0.4340425531914893, + "eval_loss": 0.23573735356330872, + "eval_precision": 0.4811320754716981, + "eval_recall": 0.3953488372093023, + "eval_runtime": 0.1895, + "eval_samples_per_second": 274.34, + "eval_steps_per_second": 10.552, + "step": 114 + }, + { + "epoch": 58.0, + "eval_accuracy": 0.9242209631728046, + "eval_f1": 0.4651162790697675, + "eval_loss": 0.2240147441625595, + "eval_precision": 0.5116279069767442, + "eval_recall": 0.4263565891472868, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.427, + "eval_steps_per_second": 10.478, + "step": 116 + }, + { + "epoch": 59.0, + "eval_accuracy": 0.9341359773371105, + "eval_f1": 0.51931330472103, + "eval_loss": 0.21279525756835938, + "eval_precision": 0.5817307692307693, + "eval_recall": 0.4689922480620155, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.618, + "eval_steps_per_second": 10.524, + "step": 118 + }, + { + "epoch": 60.0, + "eval_accuracy": 0.9362606232294618, + "eval_f1": 0.5159914712153518, + "eval_loss": 0.2014358937740326, + "eval_precision": 0.5734597156398105, + "eval_recall": 0.4689922480620155, + "eval_runtime": 0.1905, + "eval_samples_per_second": 272.975, + "eval_steps_per_second": 10.499, + "step": 120 + }, + { + "epoch": 61.0, + "eval_accuracy": 0.9376770538243626, + "eval_f1": 0.5290322580645161, + "eval_loss": 0.1877969652414322, + "eval_precision": 0.5942028985507246, + "eval_recall": 0.47674418604651164, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.72, + "eval_steps_per_second": 10.528, + "step": 122 + }, + { + "epoch": 62.0, + "eval_accuracy": 0.9454674220963173, + "eval_f1": 0.5623678646934461, + "eval_loss": 0.17463728785514832, + "eval_precision": 0.6186046511627907, + "eval_recall": 0.5155038759689923, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.747, + "eval_steps_per_second": 10.529, + "step": 124 + }, + { + "epoch": 63.0, + "eval_accuracy": 0.9461756373937678, + "eval_f1": 0.5660377358490567, + "eval_loss": 0.16446256637573242, + "eval_precision": 0.6164383561643836, + "eval_recall": 0.5232558139534884, + "eval_runtime": 0.1967, + "eval_samples_per_second": 264.347, + "eval_steps_per_second": 10.167, + "step": 126 + }, + { + "epoch": 64.0, + "eval_accuracy": 0.953257790368272, + "eval_f1": 0.6059322033898306, + "eval_loss": 0.15638068318367004, + "eval_precision": 0.6682242990654206, + "eval_recall": 0.5542635658914729, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.298, + "eval_steps_per_second": 10.473, + "step": 128 + }, + { + "epoch": 65.0, + "eval_accuracy": 0.9553824362606232, + "eval_f1": 0.6157112526539279, + "eval_loss": 0.1482805609703064, + "eval_precision": 0.6807511737089202, + "eval_recall": 0.562015503875969, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.059, + "eval_steps_per_second": 10.502, + "step": 130 + }, + { + "epoch": 66.0, + "eval_accuracy": 0.9560906515580736, + "eval_f1": 0.6160337552742616, + "eval_loss": 0.13676248490810394, + "eval_precision": 0.6759259259259259, + "eval_recall": 0.5658914728682171, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.879, + "eval_steps_per_second": 10.457, + "step": 132 + }, + { + "epoch": 67.0, + "eval_accuracy": 0.9596317280453258, + "eval_f1": 0.6540084388185653, + "eval_loss": 0.12685953080654144, + "eval_precision": 0.7175925925925926, + "eval_recall": 0.6007751937984496, + "eval_runtime": 0.1899, + "eval_samples_per_second": 273.788, + "eval_steps_per_second": 10.53, + "step": 134 + }, + { + "epoch": 68.0, + "eval_accuracy": 0.9638810198300283, + "eval_f1": 0.676595744680851, + "eval_loss": 0.118584543466568, + "eval_precision": 0.75, + "eval_recall": 0.6162790697674418, + "eval_runtime": 0.1892, + "eval_samples_per_second": 274.857, + "eval_steps_per_second": 10.571, + "step": 136 + }, + { + "epoch": 69.0, + "eval_accuracy": 0.9660056657223796, + "eval_f1": 0.6936170212765957, + "eval_loss": 0.11178788542747498, + "eval_precision": 0.7688679245283019, + "eval_recall": 0.6317829457364341, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.494, + "eval_steps_per_second": 10.519, + "step": 138 + }, + { + "epoch": 70.0, + "eval_accuracy": 0.9674220963172805, + "eval_f1": 0.6991525423728815, + "eval_loss": 0.10284025222063065, + "eval_precision": 0.7710280373831776, + "eval_recall": 0.6395348837209303, + "eval_runtime": 0.1946, + "eval_samples_per_second": 267.194, + "eval_steps_per_second": 10.277, + "step": 140 + }, + { + "epoch": 71.0, + "eval_accuracy": 0.9716713881019831, + "eval_f1": 0.7379454926624739, + "eval_loss": 0.09320546686649323, + "eval_precision": 0.8036529680365296, + "eval_recall": 0.6821705426356589, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.202, + "eval_steps_per_second": 10.508, + "step": 142 + }, + { + "epoch": 72.0, + "eval_accuracy": 0.9745042492917847, + "eval_f1": 0.7640918580375782, + "eval_loss": 0.08570843189954758, + "eval_precision": 0.8280542986425339, + "eval_recall": 0.7093023255813954, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.094, + "eval_steps_per_second": 10.504, + "step": 144 + }, + { + "epoch": 73.0, + "eval_accuracy": 0.9759206798866855, + "eval_f1": 0.7784679089026916, + "eval_loss": 0.07916779816150665, + "eval_precision": 0.8355555555555556, + "eval_recall": 0.7286821705426356, + "eval_runtime": 0.1898, + "eval_samples_per_second": 273.975, + "eval_steps_per_second": 10.537, + "step": 146 + }, + { + "epoch": 74.0, + "eval_accuracy": 0.9794617563739377, + "eval_f1": 0.8057259713701432, + "eval_loss": 0.07321218401193619, + "eval_precision": 0.8528138528138528, + "eval_recall": 0.7635658914728682, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.502, + "eval_steps_per_second": 10.519, + "step": 148 + }, + { + "epoch": 75.0, + "eval_accuracy": 0.9801699716713881, + "eval_f1": 0.8081632653061224, + "eval_loss": 0.06479813903570175, + "eval_precision": 0.853448275862069, + "eval_recall": 0.7674418604651163, + "eval_runtime": 0.1896, + "eval_samples_per_second": 274.24, + "eval_steps_per_second": 10.548, + "step": 150 + }, + { + "epoch": 76.0, + "eval_accuracy": 0.9801699716713881, + "eval_f1": 0.8097165991902834, + "eval_loss": 0.05995577573776245, + "eval_precision": 0.847457627118644, + "eval_recall": 0.7751937984496124, + "eval_runtime": 0.1985, + "eval_samples_per_second": 262.005, + "eval_steps_per_second": 10.077, + "step": 152 + }, + { + "epoch": 77.0, + "eval_accuracy": 0.9851274787535411, + "eval_f1": 0.8571428571428573, + "eval_loss": 0.05317886918783188, + "eval_precision": 0.891213389121339, + "eval_recall": 0.8255813953488372, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.279, + "eval_steps_per_second": 10.434, + "step": 154 + }, + { + "epoch": 78.0, + "eval_accuracy": 0.9872521246458924, + "eval_f1": 0.8714859437751005, + "eval_loss": 0.04899248853325844, + "eval_precision": 0.9041666666666667, + "eval_recall": 0.8410852713178295, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.14, + "eval_steps_per_second": 10.505, + "step": 156 + }, + { + "epoch": 79.0, + "eval_accuracy": 0.9879603399433428, + "eval_f1": 0.88, + "eval_loss": 0.04492037743330002, + "eval_precision": 0.9090909090909091, + "eval_recall": 0.8527131782945736, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.212, + "eval_steps_per_second": 10.508, + "step": 158 + }, + { + "epoch": 80.0, + "eval_accuracy": 0.9907932011331445, + "eval_f1": 0.9021956087824351, + "eval_loss": 0.03977702185511589, + "eval_precision": 0.9300411522633745, + "eval_recall": 0.875968992248062, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.722, + "eval_steps_per_second": 10.489, + "step": 160 + }, + { + "epoch": 81.0, + "eval_accuracy": 0.990084985835694, + "eval_f1": 0.9018036072144289, + "eval_loss": 0.03646460920572281, + "eval_precision": 0.9336099585062241, + "eval_recall": 0.872093023255814, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.606, + "eval_steps_per_second": 10.523, + "step": 162 + }, + { + "epoch": 82.0, + "eval_accuracy": 0.990084985835694, + "eval_f1": 0.9018036072144289, + "eval_loss": 0.03253123536705971, + "eval_precision": 0.9336099585062241, + "eval_recall": 0.872093023255814, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.383, + "eval_steps_per_second": 10.515, + "step": 164 + }, + { + "epoch": 83.0, + "eval_accuracy": 0.9907932011331445, + "eval_f1": 0.9098196392785571, + "eval_loss": 0.028543885797262192, + "eval_precision": 0.941908713692946, + "eval_recall": 0.8798449612403101, + "eval_runtime": 0.199, + "eval_samples_per_second": 261.341, + "eval_steps_per_second": 10.052, + "step": 166 + }, + { + "epoch": 84.0, + "eval_accuracy": 0.990084985835694, + "eval_f1": 0.9018036072144289, + "eval_loss": 0.02411552518606186, + "eval_precision": 0.9336099585062241, + "eval_recall": 0.872093023255814, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.075, + "eval_steps_per_second": 10.503, + "step": 168 + }, + { + "epoch": 85.0, + "eval_accuracy": 0.9929178470254958, + "eval_f1": 0.932806324110672, + "eval_loss": 0.02160893939435482, + "eval_precision": 0.9516129032258065, + "eval_recall": 0.9147286821705426, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.787, + "eval_steps_per_second": 10.453, + "step": 170 + }, + { + "epoch": 86.0, + "eval_accuracy": 0.9957507082152974, + "eval_f1": 0.9549902152641878, + "eval_loss": 0.019445108249783516, + "eval_precision": 0.9644268774703557, + "eval_recall": 0.9457364341085271, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.268, + "eval_steps_per_second": 10.472, + "step": 172 + }, + { + "epoch": 87.0, + "eval_accuracy": 0.9964589235127479, + "eval_f1": 0.962962962962963, + "eval_loss": 0.016319064423441887, + "eval_precision": 0.9686274509803922, + "eval_recall": 0.9573643410852714, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.353, + "eval_steps_per_second": 10.475, + "step": 174 + }, + { + "epoch": 88.0, + "eval_accuracy": 0.9964589235127479, + "eval_f1": 0.962962962962963, + "eval_loss": 0.014255463145673275, + "eval_precision": 0.9686274509803922, + "eval_recall": 0.9573643410852714, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.168, + "eval_steps_per_second": 10.468, + "step": 176 + }, + { + "epoch": 89.0, + "eval_accuracy": 0.9971671388101983, + "eval_f1": 0.9707602339181286, + "eval_loss": 0.013463201001286507, + "eval_precision": 0.9764705882352941, + "eval_recall": 0.9651162790697675, + "eval_runtime": 0.1954, + "eval_samples_per_second": 266.074, + "eval_steps_per_second": 10.234, + "step": 178 + }, + { + "epoch": 90.0, + "eval_accuracy": 0.9971671388101983, + "eval_f1": 0.9708737864077669, + "eval_loss": 0.013294624164700508, + "eval_precision": 0.9727626459143969, + "eval_recall": 0.9689922480620154, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.172, + "eval_steps_per_second": 10.314, + "step": 180 + }, + { + "epoch": 91.0, + "eval_accuracy": 0.9985835694050992, + "eval_f1": 0.9864077669902912, + "eval_loss": 0.010970248840749264, + "eval_precision": 0.9883268482490273, + "eval_recall": 0.9844961240310077, + "eval_runtime": 0.1897, + "eval_samples_per_second": 274.144, + "eval_steps_per_second": 10.544, + "step": 182 + }, + { + "epoch": 92.0, + "eval_accuracy": 0.9985835694050992, + "eval_f1": 0.9864077669902912, + "eval_loss": 0.009612097404897213, + "eval_precision": 0.9883268482490273, + "eval_recall": 0.9844961240310077, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.79, + "eval_steps_per_second": 10.492, + "step": 184 + }, + { + "epoch": 93.0, + "eval_accuracy": 0.9978753541076487, + "eval_f1": 0.978640776699029, + "eval_loss": 0.009413937106728554, + "eval_precision": 0.980544747081712, + "eval_recall": 0.9767441860465116, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.534, + "eval_steps_per_second": 10.521, + "step": 186 + }, + { + "epoch": 94.0, + "eval_accuracy": 0.9971671388101983, + "eval_f1": 0.9707602339181286, + "eval_loss": 0.008508301340043545, + "eval_precision": 0.9764705882352941, + "eval_recall": 0.9651162790697675, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.426, + "eval_steps_per_second": 10.478, + "step": 188 + }, + { + "epoch": 95.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.006476177833974361, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.478, + "eval_steps_per_second": 10.518, + "step": 190 + }, + { + "epoch": 96.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.005191581789404154, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.486, + "eval_steps_per_second": 10.48, + "step": 192 + }, + { + "epoch": 97.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.004574592690914869, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.125, + "eval_steps_per_second": 10.466, + "step": 194 + }, + { + "epoch": 98.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0043844361789524555, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.645, + "eval_steps_per_second": 10.409, + "step": 196 + }, + { + "epoch": 99.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.004784913267940283, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.482, + "eval_steps_per_second": 10.442, + "step": 198 + }, + { + "epoch": 100.0, + "eval_accuracy": 0.9985835694050992, + "eval_f1": 0.9844961240310077, + "eval_loss": 0.004961721133440733, + "eval_precision": 0.9844961240310077, + "eval_recall": 0.9844961240310077, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.948, + "eval_steps_per_second": 10.383, + "step": 200 + }, + { + "epoch": 101.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.004689970053732395, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1947, + "eval_samples_per_second": 267.024, + "eval_steps_per_second": 10.27, + "step": 202 + }, + { + "epoch": 102.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.004511161707341671, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1972, + "eval_samples_per_second": 263.665, + "eval_steps_per_second": 10.141, + "step": 204 + }, + { + "epoch": 103.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.004330621100962162, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1947, + "eval_samples_per_second": 267.045, + "eval_steps_per_second": 10.271, + "step": 206 + }, + { + "epoch": 104.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.003701193956658244, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.832, + "eval_steps_per_second": 10.263, + "step": 208 + }, + { + "epoch": 105.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.002771391998976469, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.793, + "eval_steps_per_second": 10.261, + "step": 210 + }, + { + "epoch": 106.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0020373458974063396, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.199, + "eval_steps_per_second": 10.469, + "step": 212 + }, + { + "epoch": 107.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0016820903401821852, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1942, + "eval_samples_per_second": 267.792, + "eval_steps_per_second": 10.3, + "step": 214 + }, + { + "epoch": 108.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0015996459405869246, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.494, + "eval_steps_per_second": 10.481, + "step": 216 + }, + { + "epoch": 109.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0018962565809488297, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1957, + "eval_samples_per_second": 265.706, + "eval_steps_per_second": 10.219, + "step": 218 + }, + { + "epoch": 110.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922178988326849, + "eval_loss": 0.0030049937777221203, + "eval_precision": 0.99609375, + "eval_recall": 0.9883720930232558, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.24, + "eval_steps_per_second": 10.509, + "step": 220 + }, + { + "epoch": 111.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922178988326849, + "eval_loss": 0.0027573523111641407, + "eval_precision": 0.99609375, + "eval_recall": 0.9883720930232558, + "eval_runtime": 0.196, + "eval_samples_per_second": 265.316, + "eval_steps_per_second": 10.204, + "step": 222 + }, + { + "epoch": 112.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0014663514448329806, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.795, + "eval_steps_per_second": 10.492, + "step": 224 + }, + { + "epoch": 113.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0009652902954258025, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1929, + "eval_samples_per_second": 269.56, + "eval_steps_per_second": 10.368, + "step": 226 + }, + { + "epoch": 114.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000940584228374064, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.637, + "eval_steps_per_second": 10.524, + "step": 228 + }, + { + "epoch": 115.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0009229247807525098, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.073, + "eval_steps_per_second": 10.503, + "step": 230 + }, + { + "epoch": 116.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0009766740258783102, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.092, + "eval_steps_per_second": 10.465, + "step": 232 + }, + { + "epoch": 117.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0008239487651735544, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1899, + "eval_samples_per_second": 273.825, + "eval_steps_per_second": 10.532, + "step": 234 + }, + { + "epoch": 118.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0007718774140812457, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.187, + "eval_steps_per_second": 10.315, + "step": 236 + }, + { + "epoch": 119.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0007432139827869833, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1898, + "eval_samples_per_second": 273.921, + "eval_steps_per_second": 10.535, + "step": 238 + }, + { + "epoch": 120.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0007115314365364611, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.229, + "eval_steps_per_second": 10.47, + "step": 240 + }, + { + "epoch": 121.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000678342767059803, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.268, + "eval_steps_per_second": 10.472, + "step": 242 + }, + { + "epoch": 122.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0006657196790911257, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1927, + "eval_samples_per_second": 269.802, + "eval_steps_per_second": 10.377, + "step": 244 + }, + { + "epoch": 123.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0006468800129368901, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.365, + "eval_steps_per_second": 10.476, + "step": 246 + }, + { + "epoch": 124.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000598097569309175, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.975, + "eval_steps_per_second": 10.461, + "step": 248 + }, + { + "epoch": 125.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000571465352550149, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.439, + "eval_steps_per_second": 10.401, + "step": 250 + }, + { + "epoch": 126.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0005956876557320356, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.456, + "eval_steps_per_second": 10.441, + "step": 252 + }, + { + "epoch": 127.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0005214645061641932, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.648, + "eval_steps_per_second": 10.486, + "step": 254 + }, + { + "epoch": 128.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00044241841533221304, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.68, + "eval_steps_per_second": 10.526, + "step": 256 + }, + { + "epoch": 129.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00041046313708648086, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1942, + "eval_samples_per_second": 267.783, + "eval_steps_per_second": 10.299, + "step": 258 + }, + { + "epoch": 130.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00039329633000306785, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.378, + "eval_steps_per_second": 10.515, + "step": 260 + }, + { + "epoch": 131.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003948420926462859, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.438, + "eval_steps_per_second": 10.44, + "step": 262 + }, + { + "epoch": 132.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00037927410448901355, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.396, + "eval_steps_per_second": 10.515, + "step": 264 + }, + { + "epoch": 133.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003346985613461584, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.226, + "eval_steps_per_second": 10.432, + "step": 266 + }, + { + "epoch": 134.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00032417659531347454, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.079, + "eval_steps_per_second": 10.465, + "step": 268 + }, + { + "epoch": 135.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003305810096208006, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.057, + "eval_steps_per_second": 10.464, + "step": 270 + }, + { + "epoch": 136.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003238403587602079, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.301, + "eval_steps_per_second": 10.473, + "step": 272 + }, + { + "epoch": 137.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00033838118542917073, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.505, + "eval_steps_per_second": 10.443, + "step": 274 + }, + { + "epoch": 138.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003516759898047894, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.201, + "eval_samples_per_second": 258.756, + "eval_steps_per_second": 9.952, + "step": 276 + }, + { + "epoch": 139.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003421700675971806, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.177, + "eval_steps_per_second": 10.43, + "step": 278 + }, + { + "epoch": 140.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00034544046502560377, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.741, + "eval_steps_per_second": 10.452, + "step": 280 + }, + { + "epoch": 141.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000345398933859542, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1942, + "eval_samples_per_second": 267.696, + "eval_steps_per_second": 10.296, + "step": 282 + }, + { + "epoch": 142.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00031844479963183403, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.36, + "eval_steps_per_second": 10.398, + "step": 284 + }, + { + "epoch": 143.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00032226371695287526, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1931, + "eval_samples_per_second": 269.243, + "eval_steps_per_second": 10.355, + "step": 286 + }, + { + "epoch": 144.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003062640316784382, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.378, + "eval_steps_per_second": 10.515, + "step": 288 + }, + { + "epoch": 145.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003345184959471226, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.176, + "eval_steps_per_second": 10.43, + "step": 290 + }, + { + "epoch": 146.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003987839154433459, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.241, + "eval_steps_per_second": 10.432, + "step": 292 + }, + { + "epoch": 147.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0004939653445035219, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.357, + "eval_steps_per_second": 10.475, + "step": 294 + }, + { + "epoch": 148.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00038645107997581363, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.573, + "eval_steps_per_second": 10.407, + "step": 296 + }, + { + "epoch": 149.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00030202866764739156, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.771, + "eval_steps_per_second": 10.491, + "step": 298 + }, + { + "epoch": 150.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00029896365595050156, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.114, + "eval_steps_per_second": 10.351, + "step": 300 + }, + { + "epoch": 151.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00028947534156031907, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.178, + "eval_steps_per_second": 10.468, + "step": 302 + }, + { + "epoch": 152.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00028148043202236295, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1933, + "eval_samples_per_second": 269.046, + "eval_steps_per_second": 10.348, + "step": 304 + }, + { + "epoch": 153.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00030154644628055394, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.517, + "eval_steps_per_second": 10.481, + "step": 306 + }, + { + "epoch": 154.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00028183270478621125, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.559, + "eval_steps_per_second": 10.483, + "step": 308 + }, + { + "epoch": 155.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00026179320411756635, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.505, + "eval_steps_per_second": 10.443, + "step": 310 + }, + { + "epoch": 156.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00025669598835520446, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 270.029, + "eval_steps_per_second": 10.386, + "step": 312 + }, + { + "epoch": 157.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0002637333527673036, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.623, + "eval_steps_per_second": 10.409, + "step": 314 + }, + { + "epoch": 158.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00025175316841341555, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1934, + "eval_samples_per_second": 268.908, + "eval_steps_per_second": 10.343, + "step": 316 + }, + { + "epoch": 159.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00024776585632935166, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.722, + "eval_steps_per_second": 10.412, + "step": 318 + }, + { + "epoch": 160.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00026708838413469493, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.674, + "eval_steps_per_second": 10.411, + "step": 320 + }, + { + "epoch": 161.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00029284742777235806, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.246, + "eval_steps_per_second": 10.433, + "step": 322 + }, + { + "epoch": 162.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00025016561266966164, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.165, + "eval_steps_per_second": 10.468, + "step": 324 + }, + { + "epoch": 163.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000234853447182104, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.652, + "eval_steps_per_second": 10.487, + "step": 326 + }, + { + "epoch": 164.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00023277125728782266, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.641, + "eval_steps_per_second": 10.448, + "step": 328 + }, + { + "epoch": 165.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00023167900508269668, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.086, + "eval_steps_per_second": 10.465, + "step": 330 + }, + { + "epoch": 166.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0002348786365473643, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.365, + "eval_steps_per_second": 10.476, + "step": 332 + }, + { + "epoch": 167.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00024429563200101256, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.477, + "eval_steps_per_second": 10.48, + "step": 334 + }, + { + "epoch": 168.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00022864319907967, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.718, + "eval_steps_per_second": 10.374, + "step": 336 + }, + { + "epoch": 169.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00020606903126463294, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.907, + "eval_steps_per_second": 10.458, + "step": 338 + }, + { + "epoch": 170.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00018062723393086344, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1937, + "eval_samples_per_second": 268.46, + "eval_steps_per_second": 10.325, + "step": 340 + }, + { + "epoch": 171.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017375921015627682, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.492, + "eval_steps_per_second": 10.442, + "step": 342 + }, + { + "epoch": 172.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001682743604760617, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.003, + "eval_steps_per_second": 10.423, + "step": 344 + }, + { + "epoch": 173.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016051206330303103, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.663, + "eval_steps_per_second": 10.449, + "step": 346 + }, + { + "epoch": 174.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001565395068610087, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.951, + "eval_steps_per_second": 10.46, + "step": 348 + }, + { + "epoch": 175.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015261786757037044, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.828, + "eval_steps_per_second": 10.416, + "step": 350 + }, + { + "epoch": 176.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00014788127737119794, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.638, + "eval_steps_per_second": 10.409, + "step": 352 + }, + { + "epoch": 177.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015022205479908735, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1947, + "eval_samples_per_second": 267.132, + "eval_steps_per_second": 10.274, + "step": 354 + }, + { + "epoch": 178.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015139019524212927, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1927, + "eval_samples_per_second": 269.83, + "eval_steps_per_second": 10.378, + "step": 356 + }, + { + "epoch": 179.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015289123984985054, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.772, + "eval_steps_per_second": 10.26, + "step": 358 + }, + { + "epoch": 180.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016072712605819106, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.07, + "eval_steps_per_second": 10.464, + "step": 360 + }, + { + "epoch": 181.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001745976769598201, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.168, + "eval_steps_per_second": 10.468, + "step": 362 + }, + { + "epoch": 182.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001719567080726847, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.782, + "eval_steps_per_second": 10.492, + "step": 364 + }, + { + "epoch": 183.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017195084365084767, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.114, + "eval_steps_per_second": 10.427, + "step": 366 + }, + { + "epoch": 184.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016906547534745187, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.131, + "eval_steps_per_second": 10.467, + "step": 368 + }, + { + "epoch": 185.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017375753668602556, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.271, + "eval_steps_per_second": 10.434, + "step": 370 + }, + { + "epoch": 186.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017936242511495948, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.601, + "eval_steps_per_second": 10.446, + "step": 372 + }, + { + "epoch": 187.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001846987579483539, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.726, + "eval_steps_per_second": 10.489, + "step": 374 + }, + { + "epoch": 188.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0005070104962214828, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1996, + "eval_samples_per_second": 260.461, + "eval_steps_per_second": 10.018, + "step": 376 + }, + { + "epoch": 189.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.000675897637847811, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.573, + "eval_steps_per_second": 10.522, + "step": 378 + }, + { + "epoch": 190.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001741629675962031, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.096, + "eval_steps_per_second": 10.427, + "step": 380 + }, + { + "epoch": 191.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001857963652582839, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.639, + "eval_steps_per_second": 10.448, + "step": 382 + }, + { + "epoch": 192.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0002107126492774114, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.498, + "eval_steps_per_second": 10.481, + "step": 384 + }, + { + "epoch": 193.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00020173982193227857, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.772, + "eval_steps_per_second": 10.491, + "step": 386 + }, + { + "epoch": 194.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017930121975950897, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.78, + "eval_steps_per_second": 10.453, + "step": 388 + }, + { + "epoch": 195.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017655600095167756, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.747, + "eval_steps_per_second": 10.49, + "step": 390 + }, + { + "epoch": 196.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001722782471915707, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.576, + "eval_steps_per_second": 10.484, + "step": 392 + }, + { + "epoch": 197.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016521110956091434, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.993, + "eval_steps_per_second": 10.461, + "step": 394 + }, + { + "epoch": 198.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017568585462868214, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1935, + "eval_samples_per_second": 268.712, + "eval_steps_per_second": 10.335, + "step": 396 + }, + { + "epoch": 199.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016936961037572473, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.979, + "eval_steps_per_second": 10.422, + "step": 398 + }, + { + "epoch": 200.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00014734009164385498, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.891, + "eval_steps_per_second": 10.457, + "step": 400 + }, + { + "epoch": 201.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00014263550110626966, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.413, + "eval_steps_per_second": 10.516, + "step": 402 + }, + { + "epoch": 202.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00014432436728384346, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.55, + "eval_steps_per_second": 10.444, + "step": 404 + }, + { + "epoch": 203.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001547217689221725, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.489, + "eval_steps_per_second": 10.48, + "step": 406 + }, + { + "epoch": 204.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016551432781852782, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.466, + "eval_steps_per_second": 10.441, + "step": 408 + }, + { + "epoch": 205.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00017147496691904962, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.413, + "eval_steps_per_second": 10.439, + "step": 410 + }, + { + "epoch": 206.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00016451763804070652, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.735, + "eval_steps_per_second": 10.451, + "step": 412 + }, + { + "epoch": 207.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001420173211954534, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1938, + "eval_samples_per_second": 268.254, + "eval_steps_per_second": 10.317, + "step": 414 + }, + { + "epoch": 208.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015448310296051204, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.13, + "eval_steps_per_second": 10.351, + "step": 416 + }, + { + "epoch": 209.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00013038184260949492, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.42, + "eval_steps_per_second": 10.478, + "step": 418 + }, + { + "epoch": 210.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00013210569159127772, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 272.031, + "eval_steps_per_second": 10.463, + "step": 420 + }, + { + "epoch": 211.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00013243983266875148, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.908, + "eval_steps_per_second": 10.458, + "step": 422 + }, + { + "epoch": 212.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011647965584415942, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.347, + "eval_steps_per_second": 10.475, + "step": 424 + }, + { + "epoch": 213.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011237960279686376, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.59, + "eval_steps_per_second": 10.446, + "step": 426 + }, + { + "epoch": 214.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010945500253001228, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1924, + "eval_samples_per_second": 270.226, + "eval_steps_per_second": 10.393, + "step": 428 + }, + { + "epoch": 215.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010889133409364149, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.655, + "eval_steps_per_second": 10.41, + "step": 430 + }, + { + "epoch": 216.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011191463272552937, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.181, + "eval_steps_per_second": 10.43, + "step": 432 + }, + { + "epoch": 217.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001194515498355031, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1905, + "eval_samples_per_second": 272.991, + "eval_steps_per_second": 10.5, + "step": 434 + }, + { + "epoch": 218.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001374753046547994, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.969, + "eval_steps_per_second": 10.383, + "step": 436 + }, + { + "epoch": 219.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00014326351811178029, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.156, + "eval_steps_per_second": 10.468, + "step": 438 + }, + { + "epoch": 220.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00013214044156484306, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.994, + "eval_steps_per_second": 10.423, + "step": 440 + }, + { + "epoch": 221.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00012192948634037748, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.956, + "eval_steps_per_second": 10.421, + "step": 442 + }, + { + "epoch": 222.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011187892232555896, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.544, + "eval_steps_per_second": 10.406, + "step": 444 + }, + { + "epoch": 223.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010678944818209857, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.668, + "eval_steps_per_second": 10.449, + "step": 446 + }, + { + "epoch": 224.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010234924411633983, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.854, + "eval_steps_per_second": 10.417, + "step": 448 + }, + { + "epoch": 225.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010161428508581594, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.448, + "eval_steps_per_second": 10.44, + "step": 450 + }, + { + "epoch": 226.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.345171565655619e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.48, + "eval_steps_per_second": 10.48, + "step": 452 + }, + { + "epoch": 227.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.373368811793625e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1945, + "eval_samples_per_second": 267.404, + "eval_steps_per_second": 10.285, + "step": 454 + }, + { + "epoch": 228.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.916733688442037e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.217, + "eval_steps_per_second": 10.47, + "step": 456 + }, + { + "epoch": 229.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.384766988456249e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.779, + "eval_steps_per_second": 10.453, + "step": 458 + }, + { + "epoch": 230.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.175561379175633e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.393, + "eval_steps_per_second": 10.477, + "step": 460 + }, + { + "epoch": 231.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.695087697356939e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.273, + "eval_steps_per_second": 10.472, + "step": 462 + }, + { + "epoch": 232.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.71935738157481e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.764, + "eval_steps_per_second": 10.452, + "step": 464 + }, + { + "epoch": 233.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.80057884589769e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.015, + "eval_steps_per_second": 10.424, + "step": 466 + }, + { + "epoch": 234.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.775362559594214e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.193, + "eval_samples_per_second": 269.425, + "eval_steps_per_second": 10.362, + "step": 468 + }, + { + "epoch": 235.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.662545249331743e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.259, + "eval_steps_per_second": 10.433, + "step": 470 + }, + { + "epoch": 236.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001449029368814081, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.729, + "eval_steps_per_second": 10.413, + "step": 472 + }, + { + "epoch": 237.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.0005231755203567445, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1963, + "eval_samples_per_second": 264.9, + "eval_steps_per_second": 10.188, + "step": 474 + }, + { + "epoch": 238.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.718549699755386e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 272.024, + "eval_steps_per_second": 10.462, + "step": 476 + }, + { + "epoch": 239.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.285966032417491e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.001, + "eval_steps_per_second": 10.423, + "step": 478 + }, + { + "epoch": 240.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.819038728484884e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.983, + "eval_steps_per_second": 10.461, + "step": 480 + }, + { + "epoch": 241.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00012997654266655445, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.127, + "eval_steps_per_second": 10.428, + "step": 482 + }, + { + "epoch": 242.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.022307156352326e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.715, + "eval_steps_per_second": 10.412, + "step": 484 + }, + { + "epoch": 243.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.249302481999621e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.702, + "eval_steps_per_second": 10.45, + "step": 486 + }, + { + "epoch": 244.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.476464765612036e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.054, + "eval_steps_per_second": 10.425, + "step": 488 + }, + { + "epoch": 245.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010226272570434958, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.107, + "eval_steps_per_second": 10.466, + "step": 490 + }, + { + "epoch": 246.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001063941017491743, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.011, + "eval_steps_per_second": 10.424, + "step": 492 + }, + { + "epoch": 247.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010720050340751186, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.45, + "eval_steps_per_second": 10.402, + "step": 494 + }, + { + "epoch": 248.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011007071589119732, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.75, + "eval_steps_per_second": 10.413, + "step": 496 + }, + { + "epoch": 249.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001136000792030245, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.193, + "eval_samples_per_second": 269.423, + "eval_steps_per_second": 10.362, + "step": 498 + }, + { + "epoch": 250.0, + "learning_rate": 3e-05, + "loss": 0.1402, + "step": 500 + }, + { + "epoch": 250.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00013848966045770794, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1996, + "eval_samples_per_second": 260.512, + "eval_steps_per_second": 10.02, + "step": 500 + }, + { + "epoch": 251.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010977823694702238, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.49, + "eval_steps_per_second": 10.442, + "step": 502 + }, + { + "epoch": 252.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.933987894328311e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.922, + "eval_steps_per_second": 10.459, + "step": 504 + }, + { + "epoch": 253.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011568746413104236, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2023, + "eval_samples_per_second": 257.015, + "eval_steps_per_second": 9.885, + "step": 506 + }, + { + "epoch": 254.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00015481284935958683, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.092, + "eval_steps_per_second": 10.427, + "step": 508 + }, + { + "epoch": 255.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011079219257226214, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.153, + "eval_steps_per_second": 10.467, + "step": 510 + }, + { + "epoch": 256.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010259331611450762, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.97, + "eval_steps_per_second": 10.422, + "step": 512 + }, + { + "epoch": 257.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010927036782959476, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.636, + "eval_steps_per_second": 10.448, + "step": 514 + }, + { + "epoch": 258.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00010331905650673434, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.371, + "eval_steps_per_second": 10.437, + "step": 516 + }, + { + "epoch": 259.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0001038439804688096, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.845, + "eval_steps_per_second": 10.417, + "step": 518 + }, + { + "epoch": 260.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011001154052792117, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.758, + "eval_steps_per_second": 10.414, + "step": 520 + }, + { + "epoch": 261.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.0003085101780015975, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.094, + "eval_steps_per_second": 10.427, + "step": 522 + }, + { + "epoch": 262.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922480620155039, + "eval_loss": 0.0011753622675314546, + "eval_precision": 0.9922480620155039, + "eval_recall": 0.9922480620155039, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.611, + "eval_steps_per_second": 10.447, + "step": 524 + }, + { + "epoch": 263.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011800944776041433, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.319, + "eval_steps_per_second": 10.435, + "step": 526 + }, + { + "epoch": 264.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011525224545039237, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.263, + "eval_steps_per_second": 10.433, + "step": 528 + }, + { + "epoch": 265.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 0.00011260627798037603, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.68, + "eval_steps_per_second": 10.488, + "step": 530 + }, + { + "epoch": 266.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.79475919646211e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.986, + "eval_steps_per_second": 10.461, + "step": 532 + }, + { + "epoch": 267.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.132647053571418e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.788, + "eval_steps_per_second": 10.453, + "step": 534 + }, + { + "epoch": 268.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.759691652609035e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.264, + "eval_steps_per_second": 10.472, + "step": 536 + }, + { + "epoch": 269.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.298681157408282e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.832, + "eval_steps_per_second": 10.494, + "step": 538 + }, + { + "epoch": 270.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.018757605692372e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.139, + "eval_steps_per_second": 10.352, + "step": 540 + }, + { + "epoch": 271.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.68438442517072e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.941, + "eval_steps_per_second": 10.459, + "step": 542 + }, + { + "epoch": 272.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.749886910663918e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.865, + "eval_steps_per_second": 10.418, + "step": 544 + }, + { + "epoch": 273.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922779922779923, + "eval_loss": 0.0012262859381735325, + "eval_precision": 0.9884615384615385, + "eval_recall": 0.9961240310077519, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.119, + "eval_steps_per_second": 10.428, + "step": 546 + }, + { + "epoch": 274.0, + "eval_accuracy": 0.9992917847025495, + "eval_f1": 0.9922779922779923, + "eval_loss": 0.0021211248822510242, + "eval_precision": 0.9884615384615385, + "eval_recall": 0.9961240310077519, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.539, + "eval_steps_per_second": 10.482, + "step": 548 + }, + { + "epoch": 275.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.285941294161603e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.835, + "eval_steps_per_second": 10.455, + "step": 550 + }, + { + "epoch": 276.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 9.277593926526606e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1935, + "eval_samples_per_second": 268.707, + "eval_steps_per_second": 10.335, + "step": 552 + }, + { + "epoch": 277.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.468082523904741e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.215, + "eval_steps_per_second": 10.316, + "step": 554 + }, + { + "epoch": 278.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.159714732551947e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.587, + "eval_steps_per_second": 10.446, + "step": 556 + }, + { + "epoch": 279.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.69611181365326e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1966, + "eval_samples_per_second": 264.517, + "eval_steps_per_second": 10.174, + "step": 558 + }, + { + "epoch": 280.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.470361015293747e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1988, + "eval_samples_per_second": 261.577, + "eval_steps_per_second": 10.061, + "step": 560 + }, + { + "epoch": 281.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.783402932342142e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1951, + "eval_samples_per_second": 266.587, + "eval_steps_per_second": 10.253, + "step": 562 + }, + { + "epoch": 282.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.015487062744796e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1944, + "eval_samples_per_second": 267.552, + "eval_steps_per_second": 10.29, + "step": 564 + }, + { + "epoch": 283.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.00842244643718e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1972, + "eval_samples_per_second": 263.698, + "eval_steps_per_second": 10.142, + "step": 566 + }, + { + "epoch": 284.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.267325756605715e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1966, + "eval_samples_per_second": 264.55, + "eval_steps_per_second": 10.175, + "step": 568 + }, + { + "epoch": 285.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.416579657932743e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1973, + "eval_samples_per_second": 263.618, + "eval_steps_per_second": 10.139, + "step": 570 + }, + { + "epoch": 286.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.066305599641055e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1961, + "eval_samples_per_second": 265.18, + "eval_steps_per_second": 10.199, + "step": 572 + }, + { + "epoch": 287.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.50228064134717e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1948, + "eval_samples_per_second": 266.886, + "eval_steps_per_second": 10.265, + "step": 574 + }, + { + "epoch": 288.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 7.022007775958627e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1977, + "eval_samples_per_second": 262.979, + "eval_steps_per_second": 10.115, + "step": 576 + }, + { + "epoch": 289.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.727103027515113e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2042, + "eval_samples_per_second": 254.611, + "eval_steps_per_second": 9.793, + "step": 578 + }, + { + "epoch": 290.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.552635750267655e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.199, + "eval_samples_per_second": 261.256, + "eval_steps_per_second": 10.048, + "step": 580 + }, + { + "epoch": 291.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.397445395123214e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.747, + "eval_steps_per_second": 10.259, + "step": 582 + }, + { + "epoch": 292.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.245623080758378e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2001, + "eval_samples_per_second": 259.861, + "eval_steps_per_second": 9.995, + "step": 584 + }, + { + "epoch": 293.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.104681233409792e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1966, + "eval_samples_per_second": 264.561, + "eval_steps_per_second": 10.175, + "step": 586 + }, + { + "epoch": 294.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.057948121451773e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.196, + "eval_samples_per_second": 265.364, + "eval_steps_per_second": 10.206, + "step": 588 + }, + { + "epoch": 295.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.021445005899295e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1986, + "eval_samples_per_second": 261.772, + "eval_steps_per_second": 10.068, + "step": 590 + }, + { + "epoch": 296.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.6982829846674576e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1993, + "eval_samples_per_second": 260.856, + "eval_steps_per_second": 10.033, + "step": 592 + }, + { + "epoch": 297.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.489697650773451e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1988, + "eval_samples_per_second": 261.611, + "eval_steps_per_second": 10.062, + "step": 594 + }, + { + "epoch": 298.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.506767047336325e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.74, + "eval_steps_per_second": 10.259, + "step": 596 + }, + { + "epoch": 299.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.741238419432193e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1963, + "eval_samples_per_second": 264.949, + "eval_steps_per_second": 10.19, + "step": 598 + }, + { + "epoch": 300.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.9511978179216385e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1973, + "eval_samples_per_second": 263.621, + "eval_steps_per_second": 10.139, + "step": 600 + }, + { + "epoch": 301.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.165297963889316e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2013, + "eval_samples_per_second": 258.378, + "eval_steps_per_second": 9.938, + "step": 602 + }, + { + "epoch": 302.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.433777161873877e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1972, + "eval_samples_per_second": 263.723, + "eval_steps_per_second": 10.143, + "step": 604 + }, + { + "epoch": 303.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.947341171326116e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.013, + "eval_steps_per_second": 10.424, + "step": 606 + }, + { + "epoch": 304.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 8.054797945078462e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.446, + "eval_steps_per_second": 10.44, + "step": 608 + }, + { + "epoch": 305.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 6.788939208490774e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.332, + "eval_steps_per_second": 10.436, + "step": 610 + }, + { + "epoch": 306.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.459954627440311e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1936, + "eval_samples_per_second": 268.534, + "eval_steps_per_second": 10.328, + "step": 612 + }, + { + "epoch": 307.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.251478069112636e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.09, + "eval_steps_per_second": 10.465, + "step": 614 + }, + { + "epoch": 308.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.186112684896216e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.542, + "eval_steps_per_second": 10.444, + "step": 616 + }, + { + "epoch": 309.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.160113505553454e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1927, + "eval_samples_per_second": 269.859, + "eval_steps_per_second": 10.379, + "step": 618 + }, + { + "epoch": 310.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.29017997905612e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.584, + "eval_steps_per_second": 10.446, + "step": 620 + }, + { + "epoch": 311.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.5057505960576236e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.709, + "eval_steps_per_second": 10.373, + "step": 622 + }, + { + "epoch": 312.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.501869600266218e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.691, + "eval_steps_per_second": 10.373, + "step": 624 + }, + { + "epoch": 313.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 5.359837450669147e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.196, + "eval_samples_per_second": 265.245, + "eval_steps_per_second": 10.202, + "step": 626 + }, + { + "epoch": 314.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.898127735941671e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.997, + "eval_steps_per_second": 10.461, + "step": 628 + }, + { + "epoch": 315.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.6336077502928674e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.911, + "eval_steps_per_second": 10.42, + "step": 630 + }, + { + "epoch": 316.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.578220614348538e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.876, + "eval_steps_per_second": 10.418, + "step": 632 + }, + { + "epoch": 317.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.635083314497024e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.852, + "eval_steps_per_second": 10.494, + "step": 634 + }, + { + "epoch": 318.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.717935371445492e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.207, + "eval_steps_per_second": 10.431, + "step": 636 + }, + { + "epoch": 319.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.7964662371668965e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.191, + "eval_samples_per_second": 272.217, + "eval_steps_per_second": 10.47, + "step": 638 + }, + { + "epoch": 320.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.8506914026802406e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.375, + "eval_steps_per_second": 10.476, + "step": 640 + }, + { + "epoch": 321.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.6628272684756666e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.503, + "eval_steps_per_second": 10.481, + "step": 642 + }, + { + "epoch": 322.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.504551543504931e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.381, + "eval_steps_per_second": 10.438, + "step": 644 + }, + { + "epoch": 323.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.162485492997803e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1965, + "eval_samples_per_second": 264.694, + "eval_steps_per_second": 10.181, + "step": 646 + }, + { + "epoch": 324.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.997327439719811e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.341, + "eval_steps_per_second": 10.436, + "step": 648 + }, + { + "epoch": 325.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.148295192862861e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.569, + "eval_steps_per_second": 10.483, + "step": 650 + }, + { + "epoch": 326.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.949719757656567e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.481, + "eval_steps_per_second": 10.48, + "step": 652 + }, + { + "epoch": 327.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.949163146899082e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.982, + "eval_steps_per_second": 10.384, + "step": 654 + }, + { + "epoch": 328.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.067728150403127e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1924, + "eval_samples_per_second": 270.304, + "eval_steps_per_second": 10.396, + "step": 656 + }, + { + "epoch": 329.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.185877332929522e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.59, + "eval_steps_per_second": 10.484, + "step": 658 + }, + { + "epoch": 330.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.2947223846567795e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.736, + "eval_steps_per_second": 10.451, + "step": 660 + }, + { + "epoch": 331.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.386345608509146e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.721, + "eval_steps_per_second": 10.489, + "step": 662 + }, + { + "epoch": 332.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.406541120260954e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.747, + "eval_steps_per_second": 10.452, + "step": 664 + }, + { + "epoch": 333.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.3815198296215385e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.657, + "eval_steps_per_second": 10.448, + "step": 666 + }, + { + "epoch": 334.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.336113124736585e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1925, + "eval_samples_per_second": 270.086, + "eval_steps_per_second": 10.388, + "step": 668 + }, + { + "epoch": 335.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.2898838728433475e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.888, + "eval_steps_per_second": 10.496, + "step": 670 + }, + { + "epoch": 336.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.576912397169508e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 272.002, + "eval_steps_per_second": 10.462, + "step": 672 + }, + { + "epoch": 337.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.7782745241420344e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.42, + "eval_steps_per_second": 10.478, + "step": 674 + }, + { + "epoch": 338.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.69547558168415e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.354, + "eval_steps_per_second": 10.475, + "step": 676 + }, + { + "epoch": 339.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.6122160711092874e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.957, + "eval_steps_per_second": 10.46, + "step": 678 + }, + { + "epoch": 340.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.524645191850141e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1967, + "eval_samples_per_second": 264.369, + "eval_steps_per_second": 10.168, + "step": 680 + }, + { + "epoch": 341.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.430363333085552e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2028, + "eval_samples_per_second": 256.393, + "eval_steps_per_second": 9.861, + "step": 682 + }, + { + "epoch": 342.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.3363099393900484e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1934, + "eval_samples_per_second": 268.805, + "eval_steps_per_second": 10.339, + "step": 684 + }, + { + "epoch": 343.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.241560964146629e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.186, + "eval_steps_per_second": 10.507, + "step": 686 + }, + { + "epoch": 344.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.1283663449576125e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1946, + "eval_samples_per_second": 267.275, + "eval_steps_per_second": 10.28, + "step": 688 + }, + { + "epoch": 345.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.007289680885151e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1905, + "eval_samples_per_second": 273.012, + "eval_steps_per_second": 10.5, + "step": 690 + }, + { + "epoch": 346.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.848155029118061e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.82, + "eval_steps_per_second": 10.455, + "step": 692 + }, + { + "epoch": 347.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.778138488996774e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.98, + "eval_steps_per_second": 10.384, + "step": 694 + }, + { + "epoch": 348.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.73378315998707e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1934, + "eval_samples_per_second": 268.883, + "eval_steps_per_second": 10.342, + "step": 696 + }, + { + "epoch": 349.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.5984983696835116e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 272.019, + "eval_steps_per_second": 10.462, + "step": 698 + }, + { + "epoch": 350.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.4531112760305405e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.745, + "eval_steps_per_second": 10.452, + "step": 700 + }, + { + "epoch": 351.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.439624924794771e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1902, + "eval_samples_per_second": 273.351, + "eval_steps_per_second": 10.513, + "step": 702 + }, + { + "epoch": 352.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.4926921216538176e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.044, + "eval_steps_per_second": 10.463, + "step": 704 + }, + { + "epoch": 353.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.521246981108561e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.075, + "eval_steps_per_second": 10.426, + "step": 706 + }, + { + "epoch": 354.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.54865551344119e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.461, + "eval_steps_per_second": 10.402, + "step": 708 + }, + { + "epoch": 355.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.57405879185535e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.94, + "eval_steps_per_second": 10.459, + "step": 710 + }, + { + "epoch": 356.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.594366353354417e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.717, + "eval_steps_per_second": 10.451, + "step": 712 + }, + { + "epoch": 357.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.6125871702097356e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1935, + "eval_samples_per_second": 268.738, + "eval_steps_per_second": 10.336, + "step": 714 + }, + { + "epoch": 358.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.620458301156759e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1931, + "eval_samples_per_second": 269.313, + "eval_steps_per_second": 10.358, + "step": 716 + }, + { + "epoch": 359.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.470125739113428e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.727, + "eval_steps_per_second": 10.451, + "step": 718 + }, + { + "epoch": 360.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.390650817891583e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.345, + "eval_steps_per_second": 10.398, + "step": 720 + }, + { + "epoch": 361.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.3351963793393224e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.516, + "eval_steps_per_second": 10.52, + "step": 722 + }, + { + "epoch": 362.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.2921554520726204e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.815, + "eval_steps_per_second": 10.493, + "step": 724 + }, + { + "epoch": 363.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.256916534155607e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1903, + "eval_samples_per_second": 273.229, + "eval_steps_per_second": 10.509, + "step": 726 + }, + { + "epoch": 364.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.227618071832694e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1904, + "eval_samples_per_second": 273.043, + "eval_steps_per_second": 10.502, + "step": 728 + }, + { + "epoch": 365.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.285772618255578e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.401, + "eval_steps_per_second": 10.477, + "step": 730 + }, + { + "epoch": 366.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.53492796421051e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.19, + "eval_samples_per_second": 273.686, + "eval_steps_per_second": 10.526, + "step": 732 + }, + { + "epoch": 367.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.8624759326921776e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.048, + "eval_steps_per_second": 10.425, + "step": 734 + }, + { + "epoch": 368.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 4.109403016627766e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.694, + "eval_steps_per_second": 10.373, + "step": 736 + }, + { + "epoch": 369.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.960210960940458e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.483, + "eval_steps_per_second": 10.48, + "step": 738 + }, + { + "epoch": 370.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.5878434573533013e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1905, + "eval_samples_per_second": 272.923, + "eval_steps_per_second": 10.497, + "step": 740 + }, + { + "epoch": 371.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.3986245398409665e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1901, + "eval_samples_per_second": 273.51, + "eval_steps_per_second": 10.52, + "step": 742 + }, + { + "epoch": 372.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.297941293567419e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.961, + "eval_steps_per_second": 10.383, + "step": 744 + }, + { + "epoch": 373.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.277920404798351e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1931, + "eval_samples_per_second": 269.249, + "eval_steps_per_second": 10.356, + "step": 746 + }, + { + "epoch": 374.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.3448646718170494e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.799, + "eval_steps_per_second": 10.492, + "step": 748 + }, + { + "epoch": 375.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.4745906305033714e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.374, + "eval_steps_per_second": 10.437, + "step": 750 + }, + { + "epoch": 376.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.229073990951292e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1937, + "eval_samples_per_second": 268.516, + "eval_steps_per_second": 10.328, + "step": 752 + }, + { + "epoch": 377.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.170399213558994e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.612, + "eval_steps_per_second": 10.447, + "step": 754 + }, + { + "epoch": 378.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.149329131701961e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.098, + "eval_steps_per_second": 10.465, + "step": 756 + }, + { + "epoch": 379.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1424639018950984e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.796, + "eval_steps_per_second": 10.415, + "step": 758 + }, + { + "epoch": 380.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1409865187015384e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1924, + "eval_samples_per_second": 270.234, + "eval_steps_per_second": 10.394, + "step": 760 + }, + { + "epoch": 381.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1399518775288016e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.064, + "eval_steps_per_second": 10.426, + "step": 762 + }, + { + "epoch": 382.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.164066220051609e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2, + "eval_samples_per_second": 259.951, + "eval_steps_per_second": 9.998, + "step": 764 + }, + { + "epoch": 383.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.127932359348051e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.348, + "eval_steps_per_second": 10.475, + "step": 766 + }, + { + "epoch": 384.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.107547672698274e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.106, + "eval_steps_per_second": 10.35, + "step": 768 + }, + { + "epoch": 385.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0961142329033464e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1967, + "eval_samples_per_second": 264.42, + "eval_steps_per_second": 10.17, + "step": 770 + }, + { + "epoch": 386.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.077806468354538e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1972, + "eval_samples_per_second": 263.734, + "eval_steps_per_second": 10.144, + "step": 772 + }, + { + "epoch": 387.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0614490242442116e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.003, + "eval_steps_per_second": 10.423, + "step": 774 + }, + { + "epoch": 388.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0540126317646354e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.198, + "eval_samples_per_second": 262.598, + "eval_steps_per_second": 10.1, + "step": 776 + }, + { + "epoch": 389.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.066670979023911e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.463, + "eval_steps_per_second": 10.402, + "step": 778 + }, + { + "epoch": 390.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0717979825567454e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1925, + "eval_samples_per_second": 270.06, + "eval_steps_per_second": 10.387, + "step": 780 + }, + { + "epoch": 391.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.078346708207391e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.176, + "eval_steps_per_second": 10.353, + "step": 782 + }, + { + "epoch": 392.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.083515548496507e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.82, + "eval_steps_per_second": 10.416, + "step": 784 + }, + { + "epoch": 393.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.090325481025502e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.118, + "eval_steps_per_second": 10.312, + "step": 786 + }, + { + "epoch": 394.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0947507184464484e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.176, + "eval_steps_per_second": 10.43, + "step": 788 + }, + { + "epoch": 395.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.097290391451679e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.943, + "eval_steps_per_second": 10.459, + "step": 790 + }, + { + "epoch": 396.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0978491849964485e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.942, + "eval_steps_per_second": 10.459, + "step": 792 + }, + { + "epoch": 397.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.095619467785582e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.738, + "eval_steps_per_second": 10.451, + "step": 794 + }, + { + "epoch": 398.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.087857840000652e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.787, + "eval_steps_per_second": 10.492, + "step": 796 + }, + { + "epoch": 399.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0782299290876836e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.863, + "eval_steps_per_second": 10.418, + "step": 798 + }, + { + "epoch": 400.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.068123260163702e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1928, + "eval_samples_per_second": 269.708, + "eval_steps_per_second": 10.373, + "step": 800 + }, + { + "epoch": 401.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.058970833080821e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.02, + "eval_steps_per_second": 10.424, + "step": 802 + }, + { + "epoch": 402.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.052263491554186e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1956, + "eval_samples_per_second": 265.883, + "eval_steps_per_second": 10.226, + "step": 804 + }, + { + "epoch": 403.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0454400985036045e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.99, + "eval_steps_per_second": 10.384, + "step": 806 + }, + { + "epoch": 404.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0751052690902725e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1953, + "eval_samples_per_second": 266.323, + "eval_steps_per_second": 10.243, + "step": 808 + }, + { + "epoch": 405.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.103676135651767e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.184, + "eval_steps_per_second": 10.43, + "step": 810 + }, + { + "epoch": 406.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1271814805222675e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1929, + "eval_samples_per_second": 269.54, + "eval_steps_per_second": 10.367, + "step": 812 + }, + { + "epoch": 407.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.145438677165657e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.67, + "eval_steps_per_second": 10.449, + "step": 814 + }, + { + "epoch": 408.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.158483377774246e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.774, + "eval_steps_per_second": 10.261, + "step": 816 + }, + { + "epoch": 409.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1657957151765004e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1945, + "eval_samples_per_second": 267.307, + "eval_steps_per_second": 10.281, + "step": 818 + }, + { + "epoch": 410.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.165179441566579e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1994, + "eval_samples_per_second": 260.802, + "eval_steps_per_second": 10.031, + "step": 820 + }, + { + "epoch": 411.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1612235034117475e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1932, + "eval_samples_per_second": 269.133, + "eval_steps_per_second": 10.351, + "step": 822 + }, + { + "epoch": 412.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.151909550069831e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1931, + "eval_samples_per_second": 269.277, + "eval_steps_per_second": 10.357, + "step": 824 + }, + { + "epoch": 413.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.1393577955896035e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 271.016, + "eval_steps_per_second": 10.424, + "step": 826 + }, + { + "epoch": 414.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.112521153525449e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.069, + "eval_steps_per_second": 10.464, + "step": 828 + }, + { + "epoch": 415.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.087819641223177e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.939, + "eval_steps_per_second": 10.421, + "step": 830 + }, + { + "epoch": 416.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.065093915211037e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1942, + "eval_samples_per_second": 267.751, + "eval_steps_per_second": 10.298, + "step": 832 + }, + { + "epoch": 417.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0428260288317688e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.496, + "eval_steps_per_second": 10.442, + "step": 834 + }, + { + "epoch": 418.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0221630368032493e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.534, + "eval_steps_per_second": 10.405, + "step": 836 + }, + { + "epoch": 419.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0028943001525477e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.838, + "eval_steps_per_second": 10.455, + "step": 838 + }, + { + "epoch": 420.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.984862294397317e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.65, + "eval_steps_per_second": 10.41, + "step": 840 + }, + { + "epoch": 421.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.964744999189861e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 272.026, + "eval_steps_per_second": 10.463, + "step": 842 + }, + { + "epoch": 422.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9449187422869727e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1924, + "eval_samples_per_second": 270.328, + "eval_steps_per_second": 10.397, + "step": 844 + }, + { + "epoch": 423.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9258917493280023e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.952, + "eval_steps_per_second": 10.421, + "step": 846 + }, + { + "epoch": 424.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.904894972743932e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.226, + "eval_steps_per_second": 10.432, + "step": 848 + }, + { + "epoch": 425.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.88442552118795e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2041, + "eval_samples_per_second": 254.783, + "eval_steps_per_second": 9.799, + "step": 850 + }, + { + "epoch": 426.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.911575575126335e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1984, + "eval_samples_per_second": 262.074, + "eval_steps_per_second": 10.08, + "step": 852 + }, + { + "epoch": 427.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.936324199254159e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1949, + "eval_samples_per_second": 266.758, + "eval_steps_per_second": 10.26, + "step": 854 + }, + { + "epoch": 428.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9586068194475956e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.498, + "eval_steps_per_second": 10.442, + "step": 856 + }, + { + "epoch": 429.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9791270208079368e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.33, + "eval_steps_per_second": 10.474, + "step": 858 + }, + { + "epoch": 430.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9990545954206027e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.215, + "eval_steps_per_second": 10.431, + "step": 860 + }, + { + "epoch": 431.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 3.0018487450433895e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1941, + "eval_samples_per_second": 267.845, + "eval_steps_per_second": 10.302, + "step": 862 + }, + { + "epoch": 432.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.9611455829581246e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.478, + "eval_steps_per_second": 10.441, + "step": 864 + }, + { + "epoch": 433.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.8550246497616172e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.567, + "eval_steps_per_second": 10.483, + "step": 866 + }, + { + "epoch": 434.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.7831518309540115e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.267, + "eval_steps_per_second": 10.433, + "step": 868 + }, + { + "epoch": 435.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.740779564192053e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.367, + "eval_steps_per_second": 10.437, + "step": 870 + }, + { + "epoch": 436.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.7122618121211417e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.575, + "eval_steps_per_second": 10.484, + "step": 872 + }, + { + "epoch": 437.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.679020144569222e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1964, + "eval_samples_per_second": 264.762, + "eval_steps_per_second": 10.183, + "step": 874 + }, + { + "epoch": 438.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.6459496439201757e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1906, + "eval_samples_per_second": 272.761, + "eval_steps_per_second": 10.491, + "step": 876 + }, + { + "epoch": 439.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.622292231535539e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.492, + "eval_steps_per_second": 10.48, + "step": 878 + }, + { + "epoch": 440.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.6056086426251568e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.495, + "eval_steps_per_second": 10.442, + "step": 880 + }, + { + "epoch": 441.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.592454620753415e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.76, + "eval_steps_per_second": 10.414, + "step": 882 + }, + { + "epoch": 442.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5815697881625965e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1939, + "eval_samples_per_second": 268.222, + "eval_steps_per_second": 10.316, + "step": 884 + }, + { + "epoch": 443.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5724011720740236e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1945, + "eval_samples_per_second": 267.33, + "eval_steps_per_second": 10.282, + "step": 886 + }, + { + "epoch": 444.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5625886337365955e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.602, + "eval_steps_per_second": 10.446, + "step": 888 + }, + { + "epoch": 445.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.554379534558393e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1926, + "eval_samples_per_second": 269.987, + "eval_steps_per_second": 10.384, + "step": 890 + }, + { + "epoch": 446.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5473098503425717e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.681, + "eval_steps_per_second": 10.488, + "step": 892 + }, + { + "epoch": 447.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5407531211385503e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.714, + "eval_steps_per_second": 10.451, + "step": 894 + }, + { + "epoch": 448.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5346264010295272e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.142, + "eval_steps_per_second": 10.467, + "step": 896 + }, + { + "epoch": 449.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.528832555981353e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.359, + "eval_steps_per_second": 10.398, + "step": 898 + }, + { + "epoch": 450.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.523170223867055e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.25, + "eval_steps_per_second": 10.433, + "step": 900 + }, + { + "epoch": 451.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.517813481972553e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.571, + "eval_steps_per_second": 10.484, + "step": 902 + }, + { + "epoch": 452.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5129967980319634e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.994, + "eval_steps_per_second": 10.461, + "step": 904 + }, + { + "epoch": 453.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5080849809455685e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1919, + "eval_samples_per_second": 270.948, + "eval_steps_per_second": 10.421, + "step": 906 + }, + { + "epoch": 454.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5028577510965988e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1905, + "eval_samples_per_second": 272.904, + "eval_steps_per_second": 10.496, + "step": 908 + }, + { + "epoch": 455.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4976090571726672e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1938, + "eval_samples_per_second": 268.378, + "eval_steps_per_second": 10.322, + "step": 910 + }, + { + "epoch": 456.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4926561309257522e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1936, + "eval_samples_per_second": 268.618, + "eval_steps_per_second": 10.331, + "step": 912 + }, + { + "epoch": 457.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.487782694515772e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.927, + "eval_steps_per_second": 10.459, + "step": 914 + }, + { + "epoch": 458.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4832583221723326e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.861, + "eval_steps_per_second": 10.456, + "step": 916 + }, + { + "epoch": 459.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4795017452561297e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.364, + "eval_steps_per_second": 10.399, + "step": 918 + }, + { + "epoch": 460.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4835548174451105e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1925, + "eval_samples_per_second": 270.063, + "eval_steps_per_second": 10.387, + "step": 920 + }, + { + "epoch": 461.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4869001208571717e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.57, + "eval_steps_per_second": 10.407, + "step": 922 + }, + { + "epoch": 462.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.48901797021972e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.482, + "eval_steps_per_second": 10.48, + "step": 924 + }, + { + "epoch": 463.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4896455215639435e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1907, + "eval_samples_per_second": 272.671, + "eval_steps_per_second": 10.487, + "step": 926 + }, + { + "epoch": 464.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.48953092523152e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.803, + "eval_steps_per_second": 10.454, + "step": 928 + }, + { + "epoch": 465.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4889059204724617e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1908, + "eval_samples_per_second": 272.549, + "eval_steps_per_second": 10.483, + "step": 930 + }, + { + "epoch": 466.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4877050236682408e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1921, + "eval_samples_per_second": 270.711, + "eval_steps_per_second": 10.412, + "step": 932 + }, + { + "epoch": 467.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4862207283149473e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.876, + "eval_steps_per_second": 10.457, + "step": 934 + }, + { + "epoch": 468.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4875280359992757e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.646, + "eval_steps_per_second": 10.448, + "step": 936 + }, + { + "epoch": 469.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4879076590877958e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.344, + "eval_steps_per_second": 10.398, + "step": 938 + }, + { + "epoch": 470.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4881072022253647e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.184, + "eval_steps_per_second": 10.43, + "step": 940 + }, + { + "epoch": 471.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4878598196664825e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2012, + "eval_samples_per_second": 258.474, + "eval_steps_per_second": 9.941, + "step": 942 + }, + { + "epoch": 472.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4873226720956154e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1972, + "eval_samples_per_second": 263.746, + "eval_steps_per_second": 10.144, + "step": 944 + }, + { + "epoch": 473.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4866645617294125e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.394, + "eval_steps_per_second": 10.438, + "step": 946 + }, + { + "epoch": 474.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4854529328877106e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.81, + "eval_steps_per_second": 10.416, + "step": 948 + }, + { + "epoch": 475.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.483880234649405e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.536, + "eval_steps_per_second": 10.444, + "step": 950 + }, + { + "epoch": 476.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.48231317527825e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1923, + "eval_samples_per_second": 270.406, + "eval_steps_per_second": 10.4, + "step": 952 + }, + { + "epoch": 477.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4803790438454598e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1915, + "eval_samples_per_second": 271.562, + "eval_steps_per_second": 10.445, + "step": 954 + }, + { + "epoch": 478.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4856966774677858e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.193, + "eval_samples_per_second": 269.368, + "eval_steps_per_second": 10.36, + "step": 956 + }, + { + "epoch": 479.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4963625037344173e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1913, + "eval_samples_per_second": 271.779, + "eval_steps_per_second": 10.453, + "step": 958 + }, + { + "epoch": 480.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5042354536708444e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1952, + "eval_samples_per_second": 266.399, + "eval_steps_per_second": 10.246, + "step": 960 + }, + { + "epoch": 481.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.510105332476087e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1933, + "eval_samples_per_second": 269.014, + "eval_steps_per_second": 10.347, + "step": 962 + }, + { + "epoch": 482.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5137354896287434e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.192, + "eval_samples_per_second": 270.771, + "eval_steps_per_second": 10.414, + "step": 964 + }, + { + "epoch": 483.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.516252970963251e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1954, + "eval_samples_per_second": 266.139, + "eval_steps_per_second": 10.236, + "step": 966 + }, + { + "epoch": 484.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.517920802347362e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1922, + "eval_samples_per_second": 270.59, + "eval_steps_per_second": 10.407, + "step": 968 + }, + { + "epoch": 485.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.518829751352314e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2031, + "eval_samples_per_second": 256.082, + "eval_steps_per_second": 9.849, + "step": 970 + }, + { + "epoch": 486.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5192481189151295e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1927, + "eval_samples_per_second": 269.844, + "eval_steps_per_second": 10.379, + "step": 972 + }, + { + "epoch": 487.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5190471205860376e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.2094, + "eval_samples_per_second": 248.284, + "eval_steps_per_second": 9.549, + "step": 974 + }, + { + "epoch": 488.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5186602215399034e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.06, + "eval_steps_per_second": 10.425, + "step": 976 + }, + { + "epoch": 489.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.518102883186657e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.155, + "eval_steps_per_second": 10.467, + "step": 978 + }, + { + "epoch": 490.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.517297070880886e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1916, + "eval_samples_per_second": 271.356, + "eval_steps_per_second": 10.437, + "step": 980 + }, + { + "epoch": 491.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5119625206571072e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.228, + "eval_steps_per_second": 10.432, + "step": 982 + }, + { + "epoch": 492.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5080700652324595e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1911, + "eval_samples_per_second": 272.064, + "eval_steps_per_second": 10.464, + "step": 984 + }, + { + "epoch": 493.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.5049925170606002e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1918, + "eval_samples_per_second": 271.107, + "eval_steps_per_second": 10.427, + "step": 986 + }, + { + "epoch": 494.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.502693678252399e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1909, + "eval_samples_per_second": 272.457, + "eval_steps_per_second": 10.479, + "step": 988 + }, + { + "epoch": 495.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.501013659639284e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1917, + "eval_samples_per_second": 271.308, + "eval_steps_per_second": 10.435, + "step": 990 + }, + { + "epoch": 496.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4996967113111168e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1912, + "eval_samples_per_second": 271.978, + "eval_steps_per_second": 10.461, + "step": 992 + }, + { + "epoch": 497.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4988315999507904e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1934, + "eval_samples_per_second": 268.875, + "eval_steps_per_second": 10.341, + "step": 994 + }, + { + "epoch": 498.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.4982580725918524e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.748, + "eval_steps_per_second": 10.452, + "step": 996 + }, + { + "epoch": 499.0, + "eval_accuracy": 1.0, + "eval_f1": 1.0, + "eval_loss": 2.497786954336334e-05, + "eval_precision": 1.0, + "eval_recall": 1.0, + "eval_runtime": 0.1914, + "eval_samples_per_second": 271.662, + "eval_steps_per_second": 10.449, + "step": 998 + }, + { + "epoch": 500.0, + "learning_rate": 0.0, + "loss": 0.0006, + "step": 1000 + } + ], + "max_steps": 1000, + "num_train_epochs": 500, + "total_flos": 1655456435592960.0, + "trial_name": null, + "trial_params": null +}