{"current_steps": 5, "total_steps": 7776, "loss": 0.6637, "learning_rate": 2.9999969395283144e-06, "epoch": 0.020512820512820513, "percentage": 0.06, "elapsed_time": "0:00:45", "remaining_time": "19:50:52", "throughput": 1641.28, "total_tokens": 75456} {"current_steps": 10, "total_steps": 7776, "loss": 0.6963, "learning_rate": 2.9999877581257458e-06, "epoch": 0.041025641025641026, "percentage": 0.13, "elapsed_time": "0:01:40", "remaining_time": "21:45:22", "throughput": 1596.3, "total_tokens": 160992} {"current_steps": 15, "total_steps": 7776, "loss": 0.6919, "learning_rate": 2.9999724558297605e-06, "epoch": 0.06153846153846154, "percentage": 0.19, "elapsed_time": "0:02:47", "remaining_time": "1 day, 0:01:26", "throughput": 1518.68, "total_tokens": 253856} {"current_steps": 20, "total_steps": 7776, "loss": 0.6605, "learning_rate": 2.999951032702801e-06, "epoch": 0.08205128205128205, "percentage": 0.26, "elapsed_time": "0:03:36", "remaining_time": "23:16:08", "throughput": 1521.41, "total_tokens": 328640} {"current_steps": 25, "total_steps": 7776, "loss": 0.5888, "learning_rate": 2.9999234888322877e-06, "epoch": 0.10256410256410256, "percentage": 0.32, "elapsed_time": "0:04:16", "remaining_time": "22:07:35", "throughput": 1562.76, "total_tokens": 401504} {"current_steps": 30, "total_steps": 7776, "loss": 0.6087, "learning_rate": 2.9998898243306162e-06, "epoch": 0.12307692307692308, "percentage": 0.39, "elapsed_time": "0:04:57", "remaining_time": "21:19:41", "throughput": 1597.9, "total_tokens": 475168} {"current_steps": 35, "total_steps": 7776, "loss": 0.6405, "learning_rate": 2.99985003933516e-06, "epoch": 0.14358974358974358, "percentage": 0.45, "elapsed_time": "0:05:37", "remaining_time": "20:43:51", "throughput": 1621.54, "total_tokens": 547168} {"current_steps": 40, "total_steps": 7776, "loss": 0.6443, "learning_rate": 2.999804134008266e-06, "epoch": 0.1641025641025641, "percentage": 0.51, "elapsed_time": "0:06:15", "remaining_time": "20:09:02", "throughput": 1648.07, "total_tokens": 618176} {"current_steps": 45, "total_steps": 7776, "loss": 0.6554, "learning_rate": 2.9997521085372565e-06, "epoch": 0.18461538461538463, "percentage": 0.58, "elapsed_time": "0:07:06", "remaining_time": "20:22:01", "throughput": 1642.94, "total_tokens": 701184} {"current_steps": 50, "total_steps": 7776, "loss": 0.6903, "learning_rate": 2.999693963134429e-06, "epoch": 0.20512820512820512, "percentage": 0.64, "elapsed_time": "0:07:54", "remaining_time": "20:21:45", "throughput": 1649.76, "total_tokens": 782656} {"current_steps": 55, "total_steps": 7776, "loss": 0.6915, "learning_rate": 2.9996296980370526e-06, "epoch": 0.22564102564102564, "percentage": 0.71, "elapsed_time": "0:08:42", "remaining_time": "20:23:22", "throughput": 1662.49, "total_tokens": 869280} {"current_steps": 60, "total_steps": 7776, "loss": 0.584, "learning_rate": 2.99955931350737e-06, "epoch": 0.24615384615384617, "percentage": 0.77, "elapsed_time": "0:09:21", "remaining_time": "20:03:54", "throughput": 1680.67, "total_tokens": 944032} {"current_steps": 65, "total_steps": 7776, "loss": 0.5908, "learning_rate": 2.999482809832594e-06, "epoch": 0.26666666666666666, "percentage": 0.84, "elapsed_time": "0:10:14", "remaining_time": "20:15:27", "throughput": 1668.28, "total_tokens": 1025568} {"current_steps": 70, "total_steps": 7776, "loss": 0.5811, "learning_rate": 2.9994001873249074e-06, "epoch": 0.28717948717948716, "percentage": 0.9, "elapsed_time": "0:10:56", "remaining_time": "20:03:46", "throughput": 1684.75, "total_tokens": 1105344} {"current_steps": 75, "total_steps": 7776, "loss": 0.5792, "learning_rate": 2.999311446321462e-06, "epoch": 0.3076923076923077, "percentage": 0.96, "elapsed_time": "0:11:34", "remaining_time": "19:47:45", "throughput": 1703.07, "total_tokens": 1182016} {"current_steps": 80, "total_steps": 7776, "loss": 0.5923, "learning_rate": 2.999216587184378e-06, "epoch": 0.3282051282051282, "percentage": 1.03, "elapsed_time": "0:12:16", "remaining_time": "19:40:40", "throughput": 1718.45, "total_tokens": 1265440} {"current_steps": 85, "total_steps": 7776, "loss": 0.5896, "learning_rate": 2.9991156103007394e-06, "epoch": 0.3487179487179487, "percentage": 1.09, "elapsed_time": "0:12:56", "remaining_time": "19:30:52", "throughput": 1735.26, "total_tokens": 1347296} {"current_steps": 90, "total_steps": 7776, "loss": 0.6283, "learning_rate": 2.9990085160825954e-06, "epoch": 0.36923076923076925, "percentage": 1.16, "elapsed_time": "0:13:32", "remaining_time": "19:16:46", "throughput": 1752.22, "total_tokens": 1424064} {"current_steps": 95, "total_steps": 7776, "loss": 0.5329, "learning_rate": 2.9988953049669577e-06, "epoch": 0.38974358974358975, "percentage": 1.22, "elapsed_time": "0:14:02", "remaining_time": "18:55:32", "throughput": 1771.04, "total_tokens": 1492416} {"current_steps": 100, "total_steps": 7776, "loss": 0.5582, "learning_rate": 2.998775977415799e-06, "epoch": 0.41025641025641024, "percentage": 1.29, "elapsed_time": "0:14:39", "remaining_time": "18:45:30", "throughput": 1787.06, "total_tokens": 1572192} {"current_steps": 105, "total_steps": 7776, "loss": 0.6529, "learning_rate": 2.998650533916051e-06, "epoch": 0.4307692307692308, "percentage": 1.35, "elapsed_time": "0:15:16", "remaining_time": "18:35:46", "throughput": 1801.25, "total_tokens": 1650592} {"current_steps": 110, "total_steps": 7776, "loss": 0.5449, "learning_rate": 2.998518974979602e-06, "epoch": 0.4512820512820513, "percentage": 1.41, "elapsed_time": "0:15:51", "remaining_time": "18:24:56", "throughput": 1816.61, "total_tokens": 1728128} {"current_steps": 115, "total_steps": 7776, "loss": 0.573, "learning_rate": 2.998381301143295e-06, "epoch": 0.4717948717948718, "percentage": 1.48, "elapsed_time": "0:16:24", "remaining_time": "18:13:17", "throughput": 1834.17, "total_tokens": 1806080} {"current_steps": 120, "total_steps": 7776, "loss": 0.6065, "learning_rate": 2.9982375129689253e-06, "epoch": 0.49230769230769234, "percentage": 1.54, "elapsed_time": "0:17:05", "remaining_time": "18:10:02", "throughput": 1838.37, "total_tokens": 1884544} {"current_steps": 125, "total_steps": 7776, "loss": 0.6232, "learning_rate": 2.9980876110432404e-06, "epoch": 0.5128205128205128, "percentage": 1.61, "elapsed_time": "0:17:41", "remaining_time": "18:02:33", "throughput": 1848.28, "total_tokens": 1961376} {"current_steps": 130, "total_steps": 7776, "loss": 0.5061, "learning_rate": 2.9979315959779335e-06, "epoch": 0.5333333333333333, "percentage": 1.67, "elapsed_time": "0:18:09", "remaining_time": "17:47:49", "throughput": 1869.08, "total_tokens": 2036064} {"current_steps": 135, "total_steps": 7776, "loss": 0.5657, "learning_rate": 2.9977694684096447e-06, "epoch": 0.5538461538461539, "percentage": 1.74, "elapsed_time": "0:18:38", "remaining_time": "17:35:05", "throughput": 1885.95, "total_tokens": 2109376} {"current_steps": 140, "total_steps": 7776, "loss": 0.5597, "learning_rate": 2.997601228999956e-06, "epoch": 0.5743589743589743, "percentage": 1.8, "elapsed_time": "0:19:04", "remaining_time": "17:20:28", "throughput": 1905.82, "total_tokens": 2181344} {"current_steps": 145, "total_steps": 7776, "loss": 0.5514, "learning_rate": 2.99742687843539e-06, "epoch": 0.5948717948717949, "percentage": 1.86, "elapsed_time": "0:19:35", "remaining_time": "17:11:05", "throughput": 1919.78, "total_tokens": 2256768} {"current_steps": 150, "total_steps": 7776, "loss": 0.53, "learning_rate": 2.997246417427407e-06, "epoch": 0.6153846153846154, "percentage": 1.93, "elapsed_time": "0:20:00", "remaining_time": "16:57:21", "throughput": 1940.71, "total_tokens": 2330144} {"current_steps": 155, "total_steps": 7776, "loss": 0.5365, "learning_rate": 2.9970598467124008e-06, "epoch": 0.6358974358974359, "percentage": 1.99, "elapsed_time": "0:20:25", "remaining_time": "16:44:05", "throughput": 1960.88, "total_tokens": 2402688} {"current_steps": 160, "total_steps": 7776, "loss": 0.5578, "learning_rate": 2.9968671670516983e-06, "epoch": 0.6564102564102564, "percentage": 2.06, "elapsed_time": "0:20:50", "remaining_time": "16:31:43", "throughput": 1981.32, "total_tokens": 2476800} {"current_steps": 165, "total_steps": 7776, "loss": 0.5492, "learning_rate": 2.9966683792315528e-06, "epoch": 0.676923076923077, "percentage": 2.12, "elapsed_time": "0:21:21", "remaining_time": "16:24:49", "throughput": 2002.93, "total_tokens": 2565792} {"current_steps": 170, "total_steps": 7776, "loss": 0.5144, "learning_rate": 2.9964634840631435e-06, "epoch": 0.6974358974358974, "percentage": 2.19, "elapsed_time": "0:21:42", "remaining_time": "16:11:28", "throughput": 2024.73, "total_tokens": 2637792} {"current_steps": 175, "total_steps": 7776, "loss": 0.5741, "learning_rate": 2.9962524823825724e-06, "epoch": 0.717948717948718, "percentage": 2.25, "elapsed_time": "0:22:10", "remaining_time": "16:03:16", "throughput": 2043.3, "total_tokens": 2718944} {"current_steps": 180, "total_steps": 7776, "loss": 0.5846, "learning_rate": 2.9960353750508583e-06, "epoch": 0.7384615384615385, "percentage": 2.31, "elapsed_time": "0:22:39", "remaining_time": "15:56:03", "throughput": 2061.48, "total_tokens": 2802240} {"current_steps": 185, "total_steps": 7776, "loss": 0.5834, "learning_rate": 2.995812162953936e-06, "epoch": 0.7589743589743589, "percentage": 2.38, "elapsed_time": "0:23:06", "remaining_time": "15:48:07", "throughput": 2080.68, "total_tokens": 2884672} {"current_steps": 190, "total_steps": 7776, "loss": 0.5493, "learning_rate": 2.9955828470026515e-06, "epoch": 0.7794871794871795, "percentage": 2.44, "elapsed_time": "0:23:24", "remaining_time": "15:34:41", "throughput": 2102.73, "total_tokens": 2953536} {"current_steps": 195, "total_steps": 7776, "loss": 0.5503, "learning_rate": 2.9953474281327576e-06, "epoch": 0.8, "percentage": 2.51, "elapsed_time": "0:23:43", "remaining_time": "15:22:39", "throughput": 2125.4, "total_tokens": 3026496} {"current_steps": 200, "total_steps": 7776, "loss": 0.5835, "learning_rate": 2.995105907304912e-06, "epoch": 0.8205128205128205, "percentage": 2.57, "elapsed_time": "0:24:04", "remaining_time": "15:12:13", "throughput": 2149.18, "total_tokens": 3105376} {"current_steps": 205, "total_steps": 7776, "loss": 0.5583, "learning_rate": 2.9948582855046704e-06, "epoch": 0.841025641025641, "percentage": 2.64, "elapsed_time": "0:24:25", "remaining_time": "15:01:58", "throughput": 2169.94, "total_tokens": 3179776} {"current_steps": 210, "total_steps": 7776, "loss": 0.6392, "learning_rate": 2.9946045637424864e-06, "epoch": 0.8615384615384616, "percentage": 2.7, "elapsed_time": "0:24:46", "remaining_time": "14:52:41", "throughput": 2194.43, "total_tokens": 3262336} {"current_steps": 215, "total_steps": 7776, "loss": 0.5658, "learning_rate": 2.994344743053704e-06, "epoch": 0.882051282051282, "percentage": 2.76, "elapsed_time": "0:25:07", "remaining_time": "14:43:32", "throughput": 2218.26, "total_tokens": 3343904} {"current_steps": 220, "total_steps": 7776, "loss": 0.5609, "learning_rate": 2.9940788244985557e-06, "epoch": 0.9025641025641026, "percentage": 2.83, "elapsed_time": "0:25:24", "remaining_time": "14:32:24", "throughput": 2243.5, "total_tokens": 3419264} {"current_steps": 225, "total_steps": 7776, "loss": 0.5305, "learning_rate": 2.9938068091621556e-06, "epoch": 0.9230769230769231, "percentage": 2.89, "elapsed_time": "0:25:51", "remaining_time": "14:27:57", "throughput": 2252.94, "total_tokens": 3496032} {"current_steps": 230, "total_steps": 7776, "loss": 0.5652, "learning_rate": 2.9935286981544975e-06, "epoch": 0.9435897435897436, "percentage": 2.96, "elapsed_time": "0:26:38", "remaining_time": "14:33:54", "throughput": 2234.35, "total_tokens": 3570880} {"current_steps": 235, "total_steps": 7776, "loss": 0.5348, "learning_rate": 2.9932444926104495e-06, "epoch": 0.9641025641025641, "percentage": 3.02, "elapsed_time": "0:27:21", "remaining_time": "14:37:54", "throughput": 2220.0, "total_tokens": 3644096} {"current_steps": 240, "total_steps": 7776, "loss": 0.5344, "learning_rate": 2.992954193689749e-06, "epoch": 0.9846153846153847, "percentage": 3.09, "elapsed_time": "0:28:04", "remaining_time": "14:41:32", "throughput": 2206.69, "total_tokens": 3717088} {"current_steps": 245, "total_steps": 7776, "loss": 0.5977, "learning_rate": 2.9926578025769978e-06, "epoch": 1.005128205128205, "percentage": 3.15, "elapsed_time": "0:28:41", "remaining_time": "14:42:00", "throughput": 2197.73, "total_tokens": 3783648} {"current_steps": 250, "total_steps": 7776, "loss": 0.5304, "learning_rate": 2.992355320481658e-06, "epoch": 1.0256410256410255, "percentage": 3.22, "elapsed_time": "0:29:19", "remaining_time": "14:42:56", "throughput": 2189.01, "total_tokens": 3852160} {"current_steps": 255, "total_steps": 7776, "loss": 0.5617, "learning_rate": 2.9920467486380475e-06, "epoch": 1.0461538461538462, "percentage": 3.28, "elapsed_time": "0:30:01", "remaining_time": "14:45:20", "throughput": 2178.98, "total_tokens": 3924416} {"current_steps": 260, "total_steps": 7776, "loss": 0.5367, "learning_rate": 2.991732088305333e-06, "epoch": 1.0666666666666667, "percentage": 3.34, "elapsed_time": "0:31:05", "remaining_time": "14:58:48", "throughput": 2147.59, "total_tokens": 4006432} {"current_steps": 265, "total_steps": 7776, "loss": 0.5207, "learning_rate": 2.991411340767526e-06, "epoch": 1.087179487179487, "percentage": 3.41, "elapsed_time": "0:31:50", "remaining_time": "15:02:30", "throughput": 2136.53, "total_tokens": 4081888} {"current_steps": 270, "total_steps": 7776, "loss": 0.556, "learning_rate": 2.9910845073334793e-06, "epoch": 1.1076923076923078, "percentage": 3.47, "elapsed_time": "0:32:31", "remaining_time": "15:04:08", "throughput": 2129.74, "total_tokens": 4155968} {"current_steps": 275, "total_steps": 7776, "loss": 0.537, "learning_rate": 2.9907515893368784e-06, "epoch": 1.1282051282051282, "percentage": 3.54, "elapsed_time": "0:33:17", "remaining_time": "15:08:09", "throughput": 2119.57, "total_tokens": 4234272} {"current_steps": 280, "total_steps": 7776, "loss": 0.5305, "learning_rate": 2.9904125881362378e-06, "epoch": 1.1487179487179486, "percentage": 3.6, "elapsed_time": "0:33:52", "remaining_time": "15:06:57", "throughput": 2116.61, "total_tokens": 4302368} {"current_steps": 285, "total_steps": 7776, "loss": 0.5337, "learning_rate": 2.990067505114896e-06, "epoch": 1.1692307692307693, "percentage": 3.67, "elapsed_time": "0:34:30", "remaining_time": "15:07:03", "throughput": 2113.73, "total_tokens": 4376640} {"current_steps": 290, "total_steps": 7776, "loss": 0.592, "learning_rate": 2.9897163416810084e-06, "epoch": 1.1897435897435897, "percentage": 3.73, "elapsed_time": "0:36:16", "remaining_time": "15:36:26", "throughput": 2048.25, "total_tokens": 4458208} {"current_steps": 295, "total_steps": 7776, "loss": 0.5808, "learning_rate": 2.9893590992675427e-06, "epoch": 1.2102564102564102, "percentage": 3.79, "elapsed_time": "0:37:01", "remaining_time": "15:38:51", "throughput": 2042.88, "total_tokens": 4537920} {"current_steps": 300, "total_steps": 7776, "loss": 0.5569, "learning_rate": 2.988995779332273e-06, "epoch": 1.2307692307692308, "percentage": 3.86, "elapsed_time": "0:37:33", "remaining_time": "15:36:06", "throughput": 2044.0, "total_tokens": 4606880} {"current_steps": 305, "total_steps": 7776, "loss": 0.5422, "learning_rate": 2.9886263833577725e-06, "epoch": 1.2512820512820513, "percentage": 3.92, "elapsed_time": "0:38:09", "remaining_time": "15:34:50", "throughput": 2045.0, "total_tokens": 4682816} {"current_steps": 310, "total_steps": 7776, "loss": 0.5296, "learning_rate": 2.98825091285141e-06, "epoch": 1.2717948717948717, "percentage": 3.99, "elapsed_time": "0:38:43", "remaining_time": "15:32:46", "throughput": 2046.65, "total_tokens": 4756032} {"current_steps": 315, "total_steps": 7776, "loss": 0.5012, "learning_rate": 2.987869369345341e-06, "epoch": 1.2923076923076924, "percentage": 4.05, "elapsed_time": "0:39:15", "remaining_time": "15:30:00", "throughput": 2049.04, "total_tokens": 4827232} {"current_steps": 320, "total_steps": 7776, "loss": 0.5289, "learning_rate": 2.987481754396502e-06, "epoch": 1.3128205128205128, "percentage": 4.12, "elapsed_time": "0:39:49", "remaining_time": "15:27:55", "throughput": 2051.63, "total_tokens": 4902368} {"current_steps": 325, "total_steps": 7776, "loss": 0.5245, "learning_rate": 2.9870880695866067e-06, "epoch": 1.3333333333333333, "percentage": 4.18, "elapsed_time": "0:40:26", "remaining_time": "15:27:07", "throughput": 2051.65, "total_tokens": 4978080} {"current_steps": 330, "total_steps": 7776, "loss": 0.5325, "learning_rate": 2.986688316522136e-06, "epoch": 1.353846153846154, "percentage": 4.24, "elapsed_time": "0:40:56", "remaining_time": "15:23:47", "throughput": 2054.75, "total_tokens": 5047456} {"current_steps": 335, "total_steps": 7776, "loss": 0.5068, "learning_rate": 2.9862824968343352e-06, "epoch": 1.3743589743589744, "percentage": 4.31, "elapsed_time": "0:41:25", "remaining_time": "15:20:18", "throughput": 2059.04, "total_tokens": 5118720} {"current_steps": 340, "total_steps": 7776, "loss": 0.5165, "learning_rate": 2.9858706121792036e-06, "epoch": 1.3948717948717948, "percentage": 4.37, "elapsed_time": "0:41:59", "remaining_time": "15:18:14", "throughput": 2062.75, "total_tokens": 5196288} {"current_steps": 345, "total_steps": 7776, "loss": 0.5025, "learning_rate": 2.985452664237488e-06, "epoch": 1.4153846153846155, "percentage": 4.44, "elapsed_time": "0:42:30", "remaining_time": "15:15:36", "throughput": 2067.21, "total_tokens": 5272480} {"current_steps": 350, "total_steps": 7776, "loss": 0.5285, "learning_rate": 2.98502865471468e-06, "epoch": 1.435897435897436, "percentage": 4.5, "elapsed_time": "0:42:59", "remaining_time": "15:12:02", "throughput": 2071.72, "total_tokens": 5343296} {"current_steps": 355, "total_steps": 7776, "loss": 0.4983, "learning_rate": 2.9845985853410053e-06, "epoch": 1.4564102564102563, "percentage": 4.57, "elapsed_time": "0:43:26", "remaining_time": "15:08:01", "throughput": 2078.06, "total_tokens": 5415904} {"current_steps": 360, "total_steps": 7776, "loss": 0.5789, "learning_rate": 2.9841624578714167e-06, "epoch": 1.476923076923077, "percentage": 4.63, "elapsed_time": "0:44:10", "remaining_time": "15:09:56", "throughput": 2076.05, "total_tokens": 5502176} {"current_steps": 365, "total_steps": 7776, "loss": 0.5394, "learning_rate": 2.9837202740855897e-06, "epoch": 1.4974358974358974, "percentage": 4.69, "elapsed_time": "0:44:40", "remaining_time": "15:07:14", "throughput": 2081.47, "total_tokens": 5580352} {"current_steps": 370, "total_steps": 7776, "loss": 0.5664, "learning_rate": 2.9832720357879107e-06, "epoch": 1.5179487179487179, "percentage": 4.76, "elapsed_time": "0:45:26", "remaining_time": "15:09:27", "throughput": 2077.24, "total_tokens": 5662912} {"current_steps": 375, "total_steps": 7776, "loss": 0.5546, "learning_rate": 2.9828177448074753e-06, "epoch": 1.5384615384615383, "percentage": 4.82, "elapsed_time": "0:45:59", "remaining_time": "15:07:34", "throughput": 2081.73, "total_tokens": 5743776} {"current_steps": 380, "total_steps": 7776, "loss": 0.5412, "learning_rate": 2.9823574029980757e-06, "epoch": 1.558974358974359, "percentage": 4.89, "elapsed_time": "0:46:22", "remaining_time": "15:02:35", "throughput": 2088.94, "total_tokens": 5812384} {"current_steps": 385, "total_steps": 7776, "loss": 0.5587, "learning_rate": 2.981891012238196e-06, "epoch": 1.5794871794871796, "percentage": 4.95, "elapsed_time": "0:46:51", "remaining_time": "14:59:26", "throughput": 2096.23, "total_tokens": 5892768} {"current_steps": 390, "total_steps": 7776, "loss": 0.535, "learning_rate": 2.9814185744310036e-06, "epoch": 1.6, "percentage": 5.02, "elapsed_time": "0:47:22", "remaining_time": "14:57:09", "throughput": 2102.01, "total_tokens": 5974592} {"current_steps": 395, "total_steps": 7776, "loss": 0.512, "learning_rate": 2.9809400915043424e-06, "epoch": 1.6205128205128205, "percentage": 5.08, "elapsed_time": "0:47:46", "remaining_time": "14:52:50", "throughput": 2110.33, "total_tokens": 6050080} {"current_steps": 400, "total_steps": 7776, "loss": 0.5392, "learning_rate": 2.9804555654107243e-06, "epoch": 1.641025641025641, "percentage": 5.14, "elapsed_time": "0:48:25", "remaining_time": "14:52:50", "throughput": 2112.55, "total_tokens": 6137248} {"current_steps": 405, "total_steps": 7776, "loss": 0.6444, "learning_rate": 2.9799649981273185e-06, "epoch": 1.6615384615384614, "percentage": 5.21, "elapsed_time": "0:48:57", "remaining_time": "14:50:59", "throughput": 2121.87, "total_tokens": 6232704} {"current_steps": 410, "total_steps": 7776, "loss": 0.5202, "learning_rate": 2.9794683916559493e-06, "epoch": 1.682051282051282, "percentage": 5.27, "elapsed_time": "0:49:17", "remaining_time": "14:45:39", "throughput": 2131.33, "total_tokens": 6304064} {"current_steps": 415, "total_steps": 7776, "loss": 0.5344, "learning_rate": 2.9789657480230842e-06, "epoch": 1.7025641025641025, "percentage": 5.34, "elapsed_time": "0:49:50", "remaining_time": "14:44:03", "throughput": 2137.75, "total_tokens": 6392928} {"current_steps": 420, "total_steps": 7776, "loss": 0.4614, "learning_rate": 2.9784570692798236e-06, "epoch": 1.7230769230769232, "percentage": 5.4, "elapsed_time": "0:50:14", "remaining_time": "14:40:03", "throughput": 2147.05, "total_tokens": 6473120} {"current_steps": 425, "total_steps": 7776, "loss": 0.5036, "learning_rate": 2.977942357501898e-06, "epoch": 1.7435897435897436, "percentage": 5.47, "elapsed_time": "0:50:32", "remaining_time": "14:34:18", "throughput": 2158.1, "total_tokens": 6545312} {"current_steps": 430, "total_steps": 7776, "loss": 0.5308, "learning_rate": 2.977421614789655e-06, "epoch": 1.764102564102564, "percentage": 5.53, "elapsed_time": "0:50:57", "remaining_time": "14:30:33", "throughput": 2168.43, "total_tokens": 6629984} {"current_steps": 435, "total_steps": 7776, "loss": 0.5475, "learning_rate": 2.976894843268051e-06, "epoch": 1.7846153846153845, "percentage": 5.59, "elapsed_time": "0:51:19", "remaining_time": "14:26:16", "throughput": 2180.56, "total_tokens": 6715936} {"current_steps": 440, "total_steps": 7776, "loss": 0.5704, "learning_rate": 2.976362045086647e-06, "epoch": 1.8051282051282052, "percentage": 5.66, "elapsed_time": "0:51:40", "remaining_time": "14:21:35", "throughput": 2192.32, "total_tokens": 6797472} {"current_steps": 445, "total_steps": 7776, "loss": 0.4781, "learning_rate": 2.975823222419594e-06, "epoch": 1.8256410256410256, "percentage": 5.72, "elapsed_time": "0:51:55", "remaining_time": "14:15:26", "throughput": 2204.34, "total_tokens": 6867808} {"current_steps": 450, "total_steps": 7776, "loss": 0.5247, "learning_rate": 2.9752783774656267e-06, "epoch": 1.8461538461538463, "percentage": 5.79, "elapsed_time": "0:52:47", "remaining_time": "14:19:32", "throughput": 2192.17, "total_tokens": 6944480} {"current_steps": 455, "total_steps": 7776, "loss": 0.5161, "learning_rate": 2.974727512448056e-06, "epoch": 1.8666666666666667, "percentage": 5.85, "elapsed_time": "0:53:38", "remaining_time": "14:23:09", "throughput": 2182.27, "total_tokens": 7024064} {"current_steps": 460, "total_steps": 7776, "loss": 0.5049, "learning_rate": 2.974170629614757e-06, "epoch": 1.8871794871794871, "percentage": 5.92, "elapsed_time": "0:54:31", "remaining_time": "14:27:04", "throughput": 2171.59, "total_tokens": 7103488} {"current_steps": 465, "total_steps": 7776, "loss": 0.5712, "learning_rate": 2.9736077312381624e-06, "epoch": 1.9076923076923076, "percentage": 5.98, "elapsed_time": "0:55:32", "remaining_time": "14:33:22", "throughput": 2157.35, "total_tokens": 7190304} {"current_steps": 470, "total_steps": 7776, "loss": 0.5222, "learning_rate": 2.9730388196152513e-06, "epoch": 1.9282051282051282, "percentage": 6.04, "elapsed_time": "0:56:16", "remaining_time": "14:34:49", "throughput": 2151.55, "total_tokens": 7265056} {"current_steps": 475, "total_steps": 7776, "loss": 0.4829, "learning_rate": 2.972463897067541e-06, "epoch": 1.9487179487179487, "percentage": 6.11, "elapsed_time": "0:56:57", "remaining_time": "14:35:27", "throughput": 2146.93, "total_tokens": 7336992} {"current_steps": 480, "total_steps": 7776, "loss": 0.5218, "learning_rate": 2.971882965941077e-06, "epoch": 1.9692307692307693, "percentage": 6.17, "elapsed_time": "0:57:42", "remaining_time": "14:37:06", "throughput": 2141.36, "total_tokens": 7413984} {"current_steps": 485, "total_steps": 7776, "loss": 0.5543, "learning_rate": 2.9712960286064237e-06, "epoch": 1.9897435897435898, "percentage": 6.24, "elapsed_time": "0:58:30", "remaining_time": "14:39:40", "throughput": 2134.09, "total_tokens": 7492768} {"current_steps": 490, "total_steps": 7776, "loss": 0.5036, "learning_rate": 2.970703087458655e-06, "epoch": 2.01025641025641, "percentage": 6.3, "elapsed_time": "0:59:09", "remaining_time": "14:39:32", "throughput": 2131.24, "total_tokens": 7563904} {"current_steps": 495, "total_steps": 7776, "loss": 0.556, "learning_rate": 2.9701041449173426e-06, "epoch": 2.0307692307692307, "percentage": 6.37, "elapsed_time": "0:59:45", "remaining_time": "14:39:05", "throughput": 2129.0, "total_tokens": 7634464} {"current_steps": 500, "total_steps": 7776, "loss": 0.5742, "learning_rate": 2.96949920342655e-06, "epoch": 2.051282051282051, "percentage": 6.43, "elapsed_time": "1:00:40", "remaining_time": "14:42:54", "throughput": 2118.24, "total_tokens": 7711168} {"current_steps": 505, "total_steps": 7776, "loss": 0.4905, "learning_rate": 2.968888265454818e-06, "epoch": 2.071794871794872, "percentage": 6.49, "elapsed_time": "1:01:20", "remaining_time": "14:43:06", "throughput": 2115.87, "total_tokens": 7786656} {"current_steps": 510, "total_steps": 7776, "loss": 0.5134, "learning_rate": 2.968271333495158e-06, "epoch": 2.0923076923076924, "percentage": 6.56, "elapsed_time": "1:01:56", "remaining_time": "14:42:23", "throughput": 2114.66, "total_tokens": 7858240} {"current_steps": 515, "total_steps": 7776, "loss": 0.6211, "learning_rate": 2.967648410065041e-06, "epoch": 2.112820512820513, "percentage": 6.62, "elapsed_time": "1:02:48", "remaining_time": "14:45:25", "throughput": 2110.4, "total_tokens": 7952064} {"current_steps": 520, "total_steps": 7776, "loss": 0.515, "learning_rate": 2.9670194977063857e-06, "epoch": 2.1333333333333333, "percentage": 6.69, "elapsed_time": "1:03:25", "remaining_time": "14:45:05", "throughput": 2109.07, "total_tokens": 8026688} {"current_steps": 525, "total_steps": 7776, "loss": 0.5464, "learning_rate": 2.96638459898555e-06, "epoch": 2.1538461538461537, "percentage": 6.75, "elapsed_time": "1:04:05", "remaining_time": "14:45:14", "throughput": 2107.32, "total_tokens": 8104064} {"current_steps": 530, "total_steps": 7776, "loss": 0.5331, "learning_rate": 2.9657437164933205e-06, "epoch": 2.174358974358974, "percentage": 6.82, "elapsed_time": "1:04:59", "remaining_time": "14:48:27", "throughput": 2099.98, "total_tokens": 8187968} {"current_steps": 535, "total_steps": 7776, "loss": 0.5236, "learning_rate": 2.9650968528449e-06, "epoch": 2.194871794871795, "percentage": 6.88, "elapsed_time": "1:05:34", "remaining_time": "14:47:30", "throughput": 2099.77, "total_tokens": 8261312} {"current_steps": 540, "total_steps": 7776, "loss": 0.4345, "learning_rate": 2.9644440106799e-06, "epoch": 2.2153846153846155, "percentage": 6.94, "elapsed_time": "1:06:09", "remaining_time": "14:46:29", "throughput": 2100.1, "total_tokens": 8336032} {"current_steps": 545, "total_steps": 7776, "loss": 0.4853, "learning_rate": 2.963785192662327e-06, "epoch": 2.235897435897436, "percentage": 7.01, "elapsed_time": "1:06:39", "remaining_time": "14:44:22", "throughput": 2101.63, "total_tokens": 8405024} {"current_steps": 550, "total_steps": 7776, "loss": 0.5, "learning_rate": 2.9631204014805716e-06, "epoch": 2.2564102564102564, "percentage": 7.07, "elapsed_time": "1:07:15", "remaining_time": "14:43:44", "throughput": 2101.99, "total_tokens": 8483456} {"current_steps": 555, "total_steps": 7776, "loss": 0.4863, "learning_rate": 2.9624496398474014e-06, "epoch": 2.276923076923077, "percentage": 7.14, "elapsed_time": "1:07:49", "remaining_time": "14:42:29", "throughput": 2103.55, "total_tokens": 8560768} {"current_steps": 560, "total_steps": 7776, "loss": 0.48, "learning_rate": 2.961772910499945e-06, "epoch": 2.2974358974358973, "percentage": 7.2, "elapsed_time": "1:08:22", "remaining_time": "14:41:03", "throughput": 2105.52, "total_tokens": 8637888} {"current_steps": 565, "total_steps": 7776, "loss": 0.5768, "learning_rate": 2.9610902161996838e-06, "epoch": 2.3179487179487177, "percentage": 7.27, "elapsed_time": "1:08:55", "remaining_time": "14:39:35", "throughput": 2107.64, "total_tokens": 8715360} {"current_steps": 570, "total_steps": 7776, "loss": 0.4751, "learning_rate": 2.96040155973244e-06, "epoch": 2.3384615384615386, "percentage": 7.33, "elapsed_time": "1:09:34", "remaining_time": "14:39:34", "throughput": 2106.89, "total_tokens": 8795200} {"current_steps": 575, "total_steps": 7776, "loss": 0.5161, "learning_rate": 2.959706943908365e-06, "epoch": 2.358974358974359, "percentage": 7.39, "elapsed_time": "1:10:14", "remaining_time": "14:39:45", "throughput": 2107.55, "total_tokens": 8883136} {"current_steps": 580, "total_steps": 7776, "loss": 0.5588, "learning_rate": 2.9590063715619287e-06, "epoch": 2.3794871794871795, "percentage": 7.46, "elapsed_time": "1:10:49", "remaining_time": "14:38:43", "throughput": 2108.83, "total_tokens": 8961568} {"current_steps": 585, "total_steps": 7776, "loss": 0.5527, "learning_rate": 2.9582998455519062e-06, "epoch": 2.4, "percentage": 7.52, "elapsed_time": "1:11:21", "remaining_time": "14:37:07", "throughput": 2112.27, "total_tokens": 9043360} {"current_steps": 590, "total_steps": 7776, "loss": 0.4897, "learning_rate": 2.9575873687613676e-06, "epoch": 2.4205128205128204, "percentage": 7.59, "elapsed_time": "1:11:47", "remaining_time": "14:34:25", "throughput": 2116.34, "total_tokens": 9116448} {"current_steps": 595, "total_steps": 7776, "loss": 0.5359, "learning_rate": 2.9568689440976676e-06, "epoch": 2.4410256410256412, "percentage": 7.65, "elapsed_time": "1:12:17", "remaining_time": "14:32:29", "throughput": 2119.42, "total_tokens": 9193120} {"current_steps": 600, "total_steps": 7776, "loss": 0.5763, "learning_rate": 2.95614457449243e-06, "epoch": 2.4615384615384617, "percentage": 7.72, "elapsed_time": "1:12:44", "remaining_time": "14:30:04", "throughput": 2123.74, "total_tokens": 9269920} {"current_steps": 605, "total_steps": 7776, "loss": 0.4631, "learning_rate": 2.9554142629015382e-06, "epoch": 2.482051282051282, "percentage": 7.78, "elapsed_time": "1:13:08", "remaining_time": "14:27:01", "throughput": 2128.06, "total_tokens": 9339968} {"current_steps": 610, "total_steps": 7776, "loss": 0.5349, "learning_rate": 2.954678012305123e-06, "epoch": 2.5025641025641026, "percentage": 7.84, "elapsed_time": "1:13:46", "remaining_time": "14:26:36", "throughput": 2129.83, "total_tokens": 9426976} {"current_steps": 615, "total_steps": 7776, "loss": 0.5532, "learning_rate": 2.9539358257075495e-06, "epoch": 2.523076923076923, "percentage": 7.91, "elapsed_time": "1:14:13", "remaining_time": "14:24:20", "throughput": 2134.99, "total_tokens": 9509056} {"current_steps": 620, "total_steps": 7776, "loss": 0.4748, "learning_rate": 2.9531877061374066e-06, "epoch": 2.5435897435897434, "percentage": 7.97, "elapsed_time": "1:14:41", "remaining_time": "14:22:00", "throughput": 2140.25, "total_tokens": 9590720} {"current_steps": 625, "total_steps": 7776, "loss": 0.5022, "learning_rate": 2.9524336566474915e-06, "epoch": 2.564102564102564, "percentage": 8.04, "elapsed_time": "1:15:10", "remaining_time": "14:20:03", "throughput": 2143.52, "total_tokens": 9667648} {"current_steps": 630, "total_steps": 7776, "loss": 0.5005, "learning_rate": 2.9516736803148014e-06, "epoch": 2.5846153846153848, "percentage": 8.1, "elapsed_time": "1:15:31", "remaining_time": "14:16:36", "throughput": 2149.13, "total_tokens": 9738016} {"current_steps": 635, "total_steps": 7776, "loss": 0.5297, "learning_rate": 2.9509077802405174e-06, "epoch": 2.605128205128205, "percentage": 8.17, "elapsed_time": "1:15:54", "remaining_time": "14:13:41", "throughput": 2155.13, "total_tokens": 9816224} {"current_steps": 640, "total_steps": 7776, "loss": 0.5399, "learning_rate": 2.9501359595499933e-06, "epoch": 2.6256410256410256, "percentage": 8.23, "elapsed_time": "1:16:17", "remaining_time": "14:10:35", "throughput": 2160.94, "total_tokens": 9891104} {"current_steps": 645, "total_steps": 7776, "loss": 0.4901, "learning_rate": 2.9493582213927425e-06, "epoch": 2.646153846153846, "percentage": 8.29, "elapsed_time": "1:16:42", "remaining_time": "14:08:08", "throughput": 2166.01, "total_tokens": 9969792} {"current_steps": 650, "total_steps": 7776, "loss": 0.4591, "learning_rate": 2.9485745689424267e-06, "epoch": 2.6666666666666665, "percentage": 8.36, "elapsed_time": "1:17:02", "remaining_time": "14:04:31", "throughput": 2173.2, "total_tokens": 10044608} {"current_steps": 655, "total_steps": 7776, "loss": 0.5729, "learning_rate": 2.9477850053968405e-06, "epoch": 2.6871794871794874, "percentage": 8.42, "elapsed_time": "1:17:27", "remaining_time": "14:02:06", "throughput": 2180.23, "total_tokens": 10132640} {"current_steps": 660, "total_steps": 7776, "loss": 0.5405, "learning_rate": 2.9469895339778995e-06, "epoch": 2.707692307692308, "percentage": 8.49, "elapsed_time": "1:17:45", "remaining_time": "13:58:27", "throughput": 2187.74, "total_tokens": 10207968} {"current_steps": 665, "total_steps": 7776, "loss": 0.4786, "learning_rate": 2.946188157931627e-06, "epoch": 2.7282051282051283, "percentage": 8.55, "elapsed_time": "1:18:01", "remaining_time": "13:54:19", "throughput": 2195.37, "total_tokens": 10277408} {"current_steps": 670, "total_steps": 7776, "loss": 0.5035, "learning_rate": 2.9453808805281423e-06, "epoch": 2.7487179487179487, "percentage": 8.62, "elapsed_time": "1:18:16", "remaining_time": "13:50:14", "throughput": 2203.42, "total_tokens": 10349184} {"current_steps": 675, "total_steps": 7776, "loss": 0.4719, "learning_rate": 2.944567705061644e-06, "epoch": 2.769230769230769, "percentage": 8.68, "elapsed_time": "1:19:19", "remaining_time": "13:54:27", "throughput": 2192.39, "total_tokens": 10434112} {"current_steps": 680, "total_steps": 7776, "loss": 0.5118, "learning_rate": 2.9437486348504e-06, "epoch": 2.7897435897435896, "percentage": 8.74, "elapsed_time": "1:20:03", "remaining_time": "13:55:21", "throughput": 2187.38, "total_tokens": 10506208} {"current_steps": 685, "total_steps": 7776, "loss": 0.5014, "learning_rate": 2.9429236732367318e-06, "epoch": 2.81025641025641, "percentage": 8.81, "elapsed_time": "1:20:44", "remaining_time": "13:55:53", "throughput": 2183.28, "total_tokens": 10577696} {"current_steps": 690, "total_steps": 7776, "loss": 0.4827, "learning_rate": 2.942092823587001e-06, "epoch": 2.830769230769231, "percentage": 8.87, "elapsed_time": "1:21:35", "remaining_time": "13:57:58", "throughput": 2176.93, "total_tokens": 10657984} {"current_steps": 695, "total_steps": 7776, "loss": 0.5177, "learning_rate": 2.941256089291597e-06, "epoch": 2.8512820512820514, "percentage": 8.94, "elapsed_time": "1:22:22", "remaining_time": "13:59:12", "throughput": 2172.08, "total_tokens": 10734688} {"current_steps": 700, "total_steps": 7776, "loss": 0.4517, "learning_rate": 2.940413473764923e-06, "epoch": 2.871794871794872, "percentage": 9.0, "elapsed_time": "1:23:09", "remaining_time": "14:00:40", "throughput": 2166.93, "total_tokens": 10812640} {"current_steps": 705, "total_steps": 7776, "loss": 0.4574, "learning_rate": 2.9395649804453786e-06, "epoch": 2.8923076923076922, "percentage": 9.07, "elapsed_time": "1:23:49", "remaining_time": "14:00:45", "throughput": 2164.14, "total_tokens": 10884800} {"current_steps": 710, "total_steps": 7776, "loss": 0.5092, "learning_rate": 2.9387106127953515e-06, "epoch": 2.9128205128205127, "percentage": 9.13, "elapsed_time": "1:24:46", "remaining_time": "14:03:37", "throughput": 2155.27, "total_tokens": 10962016} {"current_steps": 715, "total_steps": 7776, "loss": 0.4888, "learning_rate": 2.937850374301198e-06, "epoch": 2.9333333333333336, "percentage": 9.19, "elapsed_time": "1:25:24", "remaining_time": "14:03:29", "throughput": 2152.92, "total_tokens": 11033280} {"current_steps": 720, "total_steps": 7776, "loss": 0.5447, "learning_rate": 2.9369842684732336e-06, "epoch": 2.953846153846154, "percentage": 9.26, "elapsed_time": "1:26:09", "remaining_time": "14:04:18", "throughput": 2149.99, "total_tokens": 11113696} {"current_steps": 725, "total_steps": 7776, "loss": 0.5438, "learning_rate": 2.936112298845713e-06, "epoch": 2.9743589743589745, "percentage": 9.32, "elapsed_time": "1:26:54", "remaining_time": "14:05:18", "throughput": 2146.73, "total_tokens": 11195104} {"current_steps": 730, "total_steps": 7776, "loss": 0.46, "learning_rate": 2.935234468976822e-06, "epoch": 2.994871794871795, "percentage": 9.39, "elapsed_time": "1:27:38", "remaining_time": "14:05:58", "throughput": 2143.14, "total_tokens": 11270304} {"current_steps": 735, "total_steps": 7776, "loss": 0.569, "learning_rate": 2.934350782448658e-06, "epoch": 3.0153846153846153, "percentage": 9.45, "elapsed_time": "1:28:22", "remaining_time": "14:06:31", "throughput": 2140.82, "total_tokens": 11350784} {"current_steps": 740, "total_steps": 7776, "loss": 0.5246, "learning_rate": 2.9334612428672175e-06, "epoch": 3.0358974358974358, "percentage": 9.52, "elapsed_time": "1:29:02", "remaining_time": "14:06:39", "throughput": 2139.27, "total_tokens": 11429568} {"current_steps": 745, "total_steps": 7776, "loss": 0.4587, "learning_rate": 2.9325658538623822e-06, "epoch": 3.056410256410256, "percentage": 9.58, "elapsed_time": "1:29:38", "remaining_time": "14:06:04", "throughput": 2138.46, "total_tokens": 11502784} {"current_steps": 750, "total_steps": 7776, "loss": 0.5095, "learning_rate": 2.931664619087902e-06, "epoch": 3.076923076923077, "percentage": 9.65, "elapsed_time": "1:30:15", "remaining_time": "14:05:28", "throughput": 2137.68, "total_tokens": 11575680} {"current_steps": 755, "total_steps": 7776, "loss": 0.4916, "learning_rate": 2.9307575422213813e-06, "epoch": 3.0974358974358975, "percentage": 9.71, "elapsed_time": "1:30:49", "remaining_time": "14:04:39", "throughput": 2137.65, "total_tokens": 11649856} {"current_steps": 760, "total_steps": 7776, "loss": 0.5647, "learning_rate": 2.929844626964265e-06, "epoch": 3.117948717948718, "percentage": 9.77, "elapsed_time": "1:31:27", "remaining_time": "14:04:16", "throughput": 2137.24, "total_tokens": 11727616} {"current_steps": 765, "total_steps": 7776, "loss": 0.4448, "learning_rate": 2.9289258770418208e-06, "epoch": 3.1384615384615384, "percentage": 9.84, "elapsed_time": "1:32:04", "remaining_time": "14:03:52", "throughput": 2136.99, "total_tokens": 11806208} {"current_steps": 770, "total_steps": 7776, "loss": 0.5086, "learning_rate": 2.9280012962031263e-06, "epoch": 3.158974358974359, "percentage": 9.9, "elapsed_time": "1:32:47", "remaining_time": "14:04:21", "throughput": 2134.36, "total_tokens": 11884096} {"current_steps": 775, "total_steps": 7776, "loss": 0.4796, "learning_rate": 2.9270708882210525e-06, "epoch": 3.1794871794871793, "percentage": 9.97, "elapsed_time": "1:33:20", "remaining_time": "14:03:10", "throughput": 2134.96, "total_tokens": 11956416} {"current_steps": 780, "total_steps": 7776, "loss": 0.4797, "learning_rate": 2.92613465689225e-06, "epoch": 3.2, "percentage": 10.03, "elapsed_time": "1:33:56", "remaining_time": "14:02:30", "throughput": 2134.9, "total_tokens": 12032384} {"current_steps": 785, "total_steps": 7776, "loss": 0.4523, "learning_rate": 2.92519260603713e-06, "epoch": 3.2205128205128206, "percentage": 10.1, "elapsed_time": "1:34:28", "remaining_time": "14:01:18", "throughput": 2136.04, "total_tokens": 12107328} {"current_steps": 790, "total_steps": 7776, "loss": 0.4795, "learning_rate": 2.9242447394998545e-06, "epoch": 3.241025641025641, "percentage": 10.16, "elapsed_time": "1:34:56", "remaining_time": "13:59:36", "throughput": 2137.87, "total_tokens": 12178848} {"current_steps": 795, "total_steps": 7776, "loss": 0.5164, "learning_rate": 2.923291061148314e-06, "epoch": 3.2615384615384615, "percentage": 10.22, "elapsed_time": "1:35:27", "remaining_time": "13:58:11", "throughput": 2139.28, "total_tokens": 12252160} {"current_steps": 800, "total_steps": 7776, "loss": 0.4949, "learning_rate": 2.9223315748741146e-06, "epoch": 3.282051282051282, "percentage": 10.29, "elapsed_time": "1:35:56", "remaining_time": "13:56:36", "throughput": 2141.09, "total_tokens": 12325120} {"current_steps": 805, "total_steps": 7776, "loss": 0.4848, "learning_rate": 2.9213662845925662e-06, "epoch": 3.3025641025641024, "percentage": 10.35, "elapsed_time": "1:36:25", "remaining_time": "13:54:57", "throughput": 2143.1, "total_tokens": 12398144} {"current_steps": 810, "total_steps": 7776, "loss": 0.5114, "learning_rate": 2.9203951942426586e-06, "epoch": 3.3230769230769233, "percentage": 10.42, "elapsed_time": "1:36:54", "remaining_time": "13:53:27", "throughput": 2145.38, "total_tokens": 12475008} {"current_steps": 815, "total_steps": 7776, "loss": 0.6022, "learning_rate": 2.9194183077870516e-06, "epoch": 3.3435897435897437, "percentage": 10.48, "elapsed_time": "1:37:31", "remaining_time": "13:52:57", "throughput": 2146.88, "total_tokens": 12562336} {"current_steps": 820, "total_steps": 7776, "loss": 0.4922, "learning_rate": 2.9184356292120562e-06, "epoch": 3.364102564102564, "percentage": 10.55, "elapsed_time": "1:38:06", "remaining_time": "13:52:15", "throughput": 2148.36, "total_tokens": 12646560} {"current_steps": 825, "total_steps": 7776, "loss": 0.5707, "learning_rate": 2.9174471625276198e-06, "epoch": 3.3846153846153846, "percentage": 10.61, "elapsed_time": "1:38:31", "remaining_time": "13:50:07", "throughput": 2151.55, "total_tokens": 12718848} {"current_steps": 830, "total_steps": 7776, "loss": 0.4784, "learning_rate": 2.916452911767307e-06, "epoch": 3.405128205128205, "percentage": 10.67, "elapsed_time": "1:38:59", "remaining_time": "13:48:28", "throughput": 2154.65, "total_tokens": 12798240} {"current_steps": 835, "total_steps": 7776, "loss": 0.4423, "learning_rate": 2.915452880988287e-06, "epoch": 3.4256410256410255, "percentage": 10.74, "elapsed_time": "1:39:23", "remaining_time": "13:46:13", "throughput": 2158.48, "total_tokens": 12872608} {"current_steps": 840, "total_steps": 7776, "loss": 0.4809, "learning_rate": 2.914447074271314e-06, "epoch": 3.4461538461538463, "percentage": 10.8, "elapsed_time": "1:39:56", "remaining_time": "13:45:10", "throughput": 2160.22, "total_tokens": 12952896} {"current_steps": 845, "total_steps": 7776, "loss": 0.5316, "learning_rate": 2.913435495720712e-06, "epoch": 3.466666666666667, "percentage": 10.87, "elapsed_time": "1:40:28", "remaining_time": "13:44:12", "throughput": 2162.34, "total_tokens": 13036768} {"current_steps": 850, "total_steps": 7776, "loss": 0.4592, "learning_rate": 2.9124181494643574e-06, "epoch": 3.4871794871794872, "percentage": 10.93, "elapsed_time": "1:40:53", "remaining_time": "13:42:07", "throughput": 2166.37, "total_tokens": 13114784} {"current_steps": 855, "total_steps": 7776, "loss": 0.4878, "learning_rate": 2.911395039653663e-06, "epoch": 3.5076923076923077, "percentage": 11.0, "elapsed_time": "1:41:15", "remaining_time": "13:39:43", "throughput": 2170.59, "total_tokens": 13188448} {"current_steps": 860, "total_steps": 7776, "loss": 0.5066, "learning_rate": 2.9103661704635604e-06, "epoch": 3.528205128205128, "percentage": 11.06, "elapsed_time": "1:41:37", "remaining_time": "13:37:12", "throughput": 2175.22, "total_tokens": 13262592} {"current_steps": 865, "total_steps": 7776, "loss": 0.4649, "learning_rate": 2.909331546092483e-06, "epoch": 3.5487179487179485, "percentage": 11.12, "elapsed_time": "1:41:59", "remaining_time": "13:34:50", "throughput": 2179.97, "total_tokens": 13339936} {"current_steps": 870, "total_steps": 7776, "loss": 0.5233, "learning_rate": 2.908291170762349e-06, "epoch": 3.569230769230769, "percentage": 11.19, "elapsed_time": "1:42:23", "remaining_time": "13:32:49", "throughput": 2183.68, "total_tokens": 13416256} {"current_steps": 875, "total_steps": 7776, "loss": 0.5018, "learning_rate": 2.9072450487185434e-06, "epoch": 3.58974358974359, "percentage": 11.25, "elapsed_time": "1:42:42", "remaining_time": "13:30:01", "throughput": 2188.69, "total_tokens": 13487392} {"current_steps": 880, "total_steps": 7776, "loss": 0.4602, "learning_rate": 2.9061931842299026e-06, "epoch": 3.6102564102564103, "percentage": 11.32, "elapsed_time": "1:43:06", "remaining_time": "13:27:59", "throughput": 2193.48, "total_tokens": 13569984} {"current_steps": 885, "total_steps": 7776, "loss": 0.5309, "learning_rate": 2.9051355815886952e-06, "epoch": 3.6307692307692307, "percentage": 11.38, "elapsed_time": "1:43:27", "remaining_time": "13:25:35", "throughput": 2199.06, "total_tokens": 13650944} {"current_steps": 890, "total_steps": 7776, "loss": 0.5186, "learning_rate": 2.904072245110605e-06, "epoch": 3.651282051282051, "percentage": 11.45, "elapsed_time": "1:43:44", "remaining_time": "13:22:35", "throughput": 2204.48, "total_tokens": 13720736} {"current_steps": 895, "total_steps": 7776, "loss": 0.4839, "learning_rate": 2.9030031791347136e-06, "epoch": 3.6717948717948716, "percentage": 11.51, "elapsed_time": "1:43:59", "remaining_time": "13:19:29", "throughput": 2210.42, "total_tokens": 13791616} {"current_steps": 900, "total_steps": 7776, "loss": 0.5199, "learning_rate": 2.901928388023483e-06, "epoch": 3.6923076923076925, "percentage": 11.57, "elapsed_time": "1:44:47", "remaining_time": "13:20:34", "throughput": 2205.65, "total_tokens": 13867488} {"current_steps": 905, "total_steps": 7776, "loss": 0.5414, "learning_rate": 2.900847876162736e-06, "epoch": 3.712820512820513, "percentage": 11.64, "elapsed_time": "1:45:47", "remaining_time": "13:23:08", "throughput": 2198.62, "total_tokens": 13954848} {"current_steps": 910, "total_steps": 7776, "loss": 0.5451, "learning_rate": 2.899761647961641e-06, "epoch": 3.7333333333333334, "percentage": 11.7, "elapsed_time": "1:46:53", "remaining_time": "13:26:26", "throughput": 2188.94, "total_tokens": 14037792} {"current_steps": 915, "total_steps": 7776, "loss": 0.4448, "learning_rate": 2.898669707852692e-06, "epoch": 3.753846153846154, "percentage": 11.77, "elapsed_time": "1:47:32", "remaining_time": "13:26:20", "throughput": 2186.49, "total_tokens": 14107520} {"current_steps": 920, "total_steps": 7776, "loss": 0.5213, "learning_rate": 2.897572060291692e-06, "epoch": 3.7743589743589743, "percentage": 11.83, "elapsed_time": "1:48:37", "remaining_time": "13:29:32", "throughput": 2177.69, "total_tokens": 14193888} {"current_steps": 925, "total_steps": 7776, "loss": 0.4968, "learning_rate": 2.896468709757733e-06, "epoch": 3.7948717948717947, "percentage": 11.9, "elapsed_time": "1:49:23", "remaining_time": "13:30:14", "throughput": 2174.2, "total_tokens": 14270976} {"current_steps": 930, "total_steps": 7776, "loss": 0.5769, "learning_rate": 2.8953596607531788e-06, "epoch": 3.815384615384615, "percentage": 11.96, "elapsed_time": "1:50:14", "remaining_time": "13:31:29", "throughput": 2169.74, "total_tokens": 14351232} {"current_steps": 935, "total_steps": 7776, "loss": 0.4925, "learning_rate": 2.894244917803647e-06, "epoch": 3.835897435897436, "percentage": 12.02, "elapsed_time": "1:50:58", "remaining_time": "13:31:58", "throughput": 2166.64, "total_tokens": 14426912} {"current_steps": 940, "total_steps": 7776, "loss": 0.481, "learning_rate": 2.8931244854579904e-06, "epoch": 3.8564102564102565, "percentage": 12.09, "elapsed_time": "1:52:03", "remaining_time": "13:34:54", "throughput": 2159.02, "total_tokens": 14515776} {"current_steps": 945, "total_steps": 7776, "loss": 0.4699, "learning_rate": 2.891998368288277e-06, "epoch": 3.876923076923077, "percentage": 12.15, "elapsed_time": "1:52:41", "remaining_time": "13:34:34", "throughput": 2157.43, "total_tokens": 14587104} {"current_steps": 950, "total_steps": 7776, "loss": 0.5206, "learning_rate": 2.890866570889773e-06, "epoch": 3.8974358974358974, "percentage": 12.22, "elapsed_time": "1:53:22", "remaining_time": "13:34:35", "throughput": 2155.75, "total_tokens": 14663680} {"current_steps": 955, "total_steps": 7776, "loss": 0.5117, "learning_rate": 2.8897290978809245e-06, "epoch": 3.917948717948718, "percentage": 12.28, "elapsed_time": "1:54:18", "remaining_time": "13:36:29", "throughput": 2150.09, "total_tokens": 14747360} {"current_steps": 960, "total_steps": 7776, "loss": 0.4891, "learning_rate": 2.888585953903336e-06, "epoch": 3.9384615384615387, "percentage": 12.35, "elapsed_time": "1:55:07", "remaining_time": "13:37:20", "throughput": 2146.56, "total_tokens": 14826464} {"current_steps": 965, "total_steps": 7776, "loss": 0.4943, "learning_rate": 2.8874371436217534e-06, "epoch": 3.958974358974359, "percentage": 12.41, "elapsed_time": "1:56:08", "remaining_time": "13:39:41", "throughput": 2140.64, "total_tokens": 14916416} {"current_steps": 970, "total_steps": 7776, "loss": 0.5222, "learning_rate": 2.8862826717240464e-06, "epoch": 3.9794871794871796, "percentage": 12.47, "elapsed_time": "1:56:52", "remaining_time": "13:40:00", "throughput": 2138.44, "total_tokens": 14995072} {"current_steps": 975, "total_steps": 7776, "loss": 0.5197, "learning_rate": 2.8851225429211855e-06, "epoch": 4.0, "percentage": 12.54, "elapsed_time": "1:57:28", "remaining_time": "13:39:27", "throughput": 2138.01, "total_tokens": 15070304} {"current_steps": 980, "total_steps": 7776, "loss": 0.501, "learning_rate": 2.883956761947226e-06, "epoch": 4.02051282051282, "percentage": 12.6, "elapsed_time": "1:58:12", "remaining_time": "13:39:44", "throughput": 2136.42, "total_tokens": 15152480} {"current_steps": 985, "total_steps": 7776, "loss": 0.5142, "learning_rate": 2.8827853335592876e-06, "epoch": 4.041025641025641, "percentage": 12.67, "elapsed_time": "1:58:54", "remaining_time": "13:39:46", "throughput": 2134.65, "total_tokens": 15229184} {"current_steps": 990, "total_steps": 7776, "loss": 0.5239, "learning_rate": 2.8816082625375353e-06, "epoch": 4.061538461538461, "percentage": 12.73, "elapsed_time": "1:59:43", "remaining_time": "13:40:37", "throughput": 2131.51, "total_tokens": 15311072} {"current_steps": 995, "total_steps": 7776, "loss": 0.4823, "learning_rate": 2.8804255536851584e-06, "epoch": 4.082051282051282, "percentage": 12.8, "elapsed_time": "2:00:15", "remaining_time": "13:39:34", "throughput": 2131.96, "total_tokens": 15383232} {"current_steps": 1000, "total_steps": 7776, "loss": 0.5416, "learning_rate": 2.8792372118283528e-06, "epoch": 4.102564102564102, "percentage": 12.86, "elapsed_time": "2:01:55", "remaining_time": "13:46:09", "throughput": 2113.91, "total_tokens": 15464064} {"current_steps": 1005, "total_steps": 7776, "loss": 0.4889, "learning_rate": 2.878043241816301e-06, "epoch": 4.123076923076923, "percentage": 12.92, "elapsed_time": "2:02:26", "remaining_time": "13:44:53", "throughput": 2114.9, "total_tokens": 15536480} {"current_steps": 1010, "total_steps": 7776, "loss": 0.5338, "learning_rate": 2.876843648521152e-06, "epoch": 4.143589743589744, "percentage": 12.99, "elapsed_time": "2:03:03", "remaining_time": "13:44:21", "throughput": 2115.41, "total_tokens": 15618816} {"current_steps": 1015, "total_steps": 7776, "loss": 0.5101, "learning_rate": 2.8756384368380003e-06, "epoch": 4.164102564102564, "percentage": 13.05, "elapsed_time": "2:03:39", "remaining_time": "13:43:41", "throughput": 2115.28, "total_tokens": 15694304} {"current_steps": 1020, "total_steps": 7776, "loss": 0.4792, "learning_rate": 2.874427611684867e-06, "epoch": 4.184615384615385, "percentage": 13.12, "elapsed_time": "2:04:10", "remaining_time": "13:42:28", "throughput": 2116.74, "total_tokens": 15770784} {"current_steps": 1025, "total_steps": 7776, "loss": 0.4959, "learning_rate": 2.8732111780026813e-06, "epoch": 4.205128205128205, "percentage": 13.18, "elapsed_time": "2:04:36", "remaining_time": "13:40:39", "throughput": 2118.41, "total_tokens": 15837312} {"current_steps": 1030, "total_steps": 7776, "loss": 0.5227, "learning_rate": 2.871989140755257e-06, "epoch": 4.225641025641026, "percentage": 13.25, "elapsed_time": "2:05:02", "remaining_time": "13:39:00", "throughput": 2120.27, "total_tokens": 15908096} {"current_steps": 1035, "total_steps": 7776, "loss": 0.473, "learning_rate": 2.870761504929275e-06, "epoch": 4.246153846153846, "percentage": 13.31, "elapsed_time": "2:05:38", "remaining_time": "13:38:16", "throughput": 2120.23, "total_tokens": 15982720} {"current_steps": 1040, "total_steps": 7776, "loss": 0.4911, "learning_rate": 2.869528275534261e-06, "epoch": 4.266666666666667, "percentage": 13.37, "elapsed_time": "2:06:05", "remaining_time": "13:36:38", "throughput": 2122.41, "total_tokens": 16056256} {"current_steps": 1045, "total_steps": 7776, "loss": 0.4678, "learning_rate": 2.8682894576025677e-06, "epoch": 4.287179487179487, "percentage": 13.44, "elapsed_time": "2:06:31", "remaining_time": "13:34:56", "throughput": 2124.58, "total_tokens": 16128256} {"current_steps": 1050, "total_steps": 7776, "loss": 0.4534, "learning_rate": 2.8670450561893498e-06, "epoch": 4.3076923076923075, "percentage": 13.5, "elapsed_time": "2:07:04", "remaining_time": "13:34:01", "throughput": 2125.18, "total_tokens": 16203808} {"current_steps": 1055, "total_steps": 7776, "loss": 0.5788, "learning_rate": 2.865795076372549e-06, "epoch": 4.328205128205128, "percentage": 13.57, "elapsed_time": "2:07:36", "remaining_time": "13:32:59", "throughput": 2127.53, "total_tokens": 16290464} {"current_steps": 1060, "total_steps": 7776, "loss": 0.4744, "learning_rate": 2.8645395232528683e-06, "epoch": 4.348717948717948, "percentage": 13.63, "elapsed_time": "2:08:00", "remaining_time": "13:31:03", "throughput": 2130.36, "total_tokens": 16362688} {"current_steps": 1065, "total_steps": 7776, "loss": 0.4801, "learning_rate": 2.863278401953754e-06, "epoch": 4.36923076923077, "percentage": 13.7, "elapsed_time": "2:08:24", "remaining_time": "13:29:06", "throughput": 2133.3, "total_tokens": 16434976} {"current_steps": 1070, "total_steps": 7776, "loss": 0.5035, "learning_rate": 2.862011717621375e-06, "epoch": 4.38974358974359, "percentage": 13.76, "elapsed_time": "2:08:50", "remaining_time": "13:27:31", "throughput": 2136.23, "total_tokens": 16514880} {"current_steps": 1075, "total_steps": 7776, "loss": 0.5456, "learning_rate": 2.860739475424599e-06, "epoch": 4.410256410256411, "percentage": 13.82, "elapsed_time": "2:09:15", "remaining_time": "13:25:45", "throughput": 2139.37, "total_tokens": 16592544} {"current_steps": 1080, "total_steps": 7776, "loss": 0.4773, "learning_rate": 2.859461680554975e-06, "epoch": 4.430769230769231, "percentage": 13.89, "elapsed_time": "2:09:41", "remaining_time": "13:24:06", "throughput": 2142.88, "total_tokens": 16675360} {"current_steps": 1085, "total_steps": 7776, "loss": 0.4793, "learning_rate": 2.858178338226709e-06, "epoch": 4.4512820512820515, "percentage": 13.95, "elapsed_time": "2:10:15", "remaining_time": "13:23:15", "throughput": 2143.7, "total_tokens": 16753728} {"current_steps": 1090, "total_steps": 7776, "loss": 0.4698, "learning_rate": 2.8568894536766462e-06, "epoch": 4.471794871794872, "percentage": 14.02, "elapsed_time": "2:10:35", "remaining_time": "13:21:04", "throughput": 2147.81, "total_tokens": 16829696} {"current_steps": 1095, "total_steps": 7776, "loss": 0.4648, "learning_rate": 2.8555950321642444e-06, "epoch": 4.492307692307692, "percentage": 14.08, "elapsed_time": "2:10:59", "remaining_time": "13:19:16", "throughput": 2151.19, "total_tokens": 16908128} {"current_steps": 1100, "total_steps": 7776, "loss": 0.4473, "learning_rate": 2.8542950789715587e-06, "epoch": 4.512820512820513, "percentage": 14.15, "elapsed_time": "2:11:18", "remaining_time": "13:16:54", "throughput": 2155.15, "total_tokens": 16979136} {"current_steps": 1105, "total_steps": 7776, "loss": 0.5128, "learning_rate": 2.8529895994032153e-06, "epoch": 4.533333333333333, "percentage": 14.21, "elapsed_time": "2:11:40", "remaining_time": "13:14:56", "throughput": 2159.78, "total_tokens": 17063296} {"current_steps": 1110, "total_steps": 7776, "loss": 0.4834, "learning_rate": 2.851678598786392e-06, "epoch": 4.553846153846154, "percentage": 14.27, "elapsed_time": "2:12:01", "remaining_time": "13:12:54", "throughput": 2164.39, "total_tokens": 17145984} {"current_steps": 1115, "total_steps": 7776, "loss": 0.4581, "learning_rate": 2.8503620824707946e-06, "epoch": 4.574358974358974, "percentage": 14.34, "elapsed_time": "2:12:19", "remaining_time": "13:10:31", "throughput": 2169.02, "total_tokens": 17221152} {"current_steps": 1120, "total_steps": 7776, "loss": 0.5189, "learning_rate": 2.8490400558286395e-06, "epoch": 4.5948717948717945, "percentage": 14.4, "elapsed_time": "2:12:42", "remaining_time": "13:08:41", "throughput": 2172.46, "total_tokens": 17298688} {"current_steps": 1125, "total_steps": 7776, "loss": 0.4739, "learning_rate": 2.847712524254626e-06, "epoch": 4.615384615384615, "percentage": 14.47, "elapsed_time": "2:13:34", "remaining_time": "13:09:39", "throughput": 2167.95, "total_tokens": 17374240} {"current_steps": 1130, "total_steps": 7776, "loss": 0.5376, "learning_rate": 2.846379493165918e-06, "epoch": 4.635897435897435, "percentage": 14.53, "elapsed_time": "2:14:22", "remaining_time": "13:10:21", "throughput": 2164.39, "total_tokens": 17451360} {"current_steps": 1135, "total_steps": 7776, "loss": 0.5152, "learning_rate": 2.8450409680021204e-06, "epoch": 4.656410256410257, "percentage": 14.6, "elapsed_time": "2:15:16", "remaining_time": "13:11:30", "throughput": 2160.52, "total_tokens": 17535776} {"current_steps": 1140, "total_steps": 7776, "loss": 0.4957, "learning_rate": 2.8436969542252576e-06, "epoch": 4.676923076923077, "percentage": 14.66, "elapsed_time": "2:16:05", "remaining_time": "13:12:12", "throughput": 2157.35, "total_tokens": 17616256} {"current_steps": 1145, "total_steps": 7776, "loss": 0.4963, "learning_rate": 2.842347457319752e-06, "epoch": 4.697435897435898, "percentage": 14.72, "elapsed_time": "2:16:49", "remaining_time": "13:12:25", "throughput": 2154.9, "total_tokens": 17691616} {"current_steps": 1150, "total_steps": 7776, "loss": 0.4868, "learning_rate": 2.8409924827923985e-06, "epoch": 4.717948717948718, "percentage": 14.79, "elapsed_time": "2:17:33", "remaining_time": "13:12:34", "throughput": 2152.69, "total_tokens": 17767264} {"current_steps": 1155, "total_steps": 7776, "loss": 0.5595, "learning_rate": 2.839632036172346e-06, "epoch": 4.7384615384615385, "percentage": 14.85, "elapsed_time": "2:19:06", "remaining_time": "13:17:27", "throughput": 2138.27, "total_tokens": 17847648} {"current_steps": 1160, "total_steps": 7776, "loss": 0.6248, "learning_rate": 2.8382661230110716e-06, "epoch": 4.758974358974359, "percentage": 14.92, "elapsed_time": "2:19:57", "remaining_time": "13:18:12", "throughput": 2135.63, "total_tokens": 17932992} {"current_steps": 1165, "total_steps": 7776, "loss": 0.4935, "learning_rate": 2.8368947488823613e-06, "epoch": 4.779487179487179, "percentage": 14.98, "elapsed_time": "2:20:39", "remaining_time": "13:18:13", "throughput": 2133.77, "total_tokens": 18008544} {"current_steps": 1170, "total_steps": 7776, "loss": 0.472, "learning_rate": 2.8355179193822834e-06, "epoch": 4.8, "percentage": 15.05, "elapsed_time": "2:21:31", "remaining_time": "13:19:05", "throughput": 2130.54, "total_tokens": 18091904} {"current_steps": 1175, "total_steps": 7776, "loss": 0.4618, "learning_rate": 2.834135640129168e-06, "epoch": 4.82051282051282, "percentage": 15.11, "elapsed_time": "2:22:12", "remaining_time": "13:18:55", "throughput": 2129.45, "total_tokens": 18169760} {"current_steps": 1180, "total_steps": 7776, "loss": 0.4375, "learning_rate": 2.8327479167635834e-06, "epoch": 4.841025641025641, "percentage": 15.17, "elapsed_time": "2:22:49", "remaining_time": "13:18:22", "throughput": 2128.71, "total_tokens": 18242016} {"current_steps": 1185, "total_steps": 7776, "loss": 0.4954, "learning_rate": 2.831354754948315e-06, "epoch": 4.861538461538462, "percentage": 15.24, "elapsed_time": "2:23:28", "remaining_time": "13:18:01", "throughput": 2127.64, "total_tokens": 18316192} {"current_steps": 1190, "total_steps": 7776, "loss": 0.4885, "learning_rate": 2.829956160368338e-06, "epoch": 4.8820512820512825, "percentage": 15.3, "elapsed_time": "2:24:16", "remaining_time": "13:18:30", "throughput": 2125.83, "total_tokens": 18402720} {"current_steps": 1195, "total_steps": 7776, "loss": 0.4452, "learning_rate": 2.828552138730798e-06, "epoch": 4.902564102564103, "percentage": 15.37, "elapsed_time": "2:24:49", "remaining_time": "13:17:34", "throughput": 2125.87, "total_tokens": 18472768} {"current_steps": 1200, "total_steps": 7776, "loss": 0.4602, "learning_rate": 2.8271426957649868e-06, "epoch": 4.923076923076923, "percentage": 15.43, "elapsed_time": "2:25:26", "remaining_time": "13:17:03", "throughput": 2125.4, "total_tokens": 18548128} {"current_steps": 1205, "total_steps": 7776, "loss": 0.4391, "learning_rate": 2.8257278372223177e-06, "epoch": 4.943589743589744, "percentage": 15.5, "elapsed_time": "2:26:02", "remaining_time": "13:16:24", "throughput": 2125.14, "total_tokens": 18622112} {"current_steps": 1210, "total_steps": 7776, "loss": 0.4614, "learning_rate": 2.824307568876304e-06, "epoch": 4.964102564102564, "percentage": 15.56, "elapsed_time": "2:26:42", "remaining_time": "13:16:05", "throughput": 2124.9, "total_tokens": 18704288} {"current_steps": 1215, "total_steps": 7776, "loss": 0.5284, "learning_rate": 2.8228818965225326e-06, "epoch": 4.984615384615385, "percentage": 15.62, "elapsed_time": "2:27:18", "remaining_time": "13:15:26", "throughput": 2124.86, "total_tokens": 18780128} {"current_steps": 1220, "total_steps": 7776, "loss": 0.5213, "learning_rate": 2.8214508259786443e-06, "epoch": 5.005128205128205, "percentage": 15.69, "elapsed_time": "2:27:49", "remaining_time": "13:14:22", "throughput": 2125.31, "total_tokens": 18850496} {"current_steps": 1225, "total_steps": 7776, "loss": 0.5071, "learning_rate": 2.820014363084307e-06, "epoch": 5.0256410256410255, "percentage": 15.75, "elapsed_time": "2:28:24", "remaining_time": "13:13:38", "throughput": 2125.56, "total_tokens": 18926816} {"current_steps": 1230, "total_steps": 7776, "loss": 0.4964, "learning_rate": 2.8185725137011922e-06, "epoch": 5.046153846153846, "percentage": 15.82, "elapsed_time": "2:28:56", "remaining_time": "13:12:40", "throughput": 2126.36, "total_tokens": 19002624} {"current_steps": 1235, "total_steps": 7776, "loss": 0.5196, "learning_rate": 2.8171252837129523e-06, "epoch": 5.066666666666666, "percentage": 15.88, "elapsed_time": "2:29:37", "remaining_time": "13:12:29", "throughput": 2125.6, "total_tokens": 19083296} {"current_steps": 1240, "total_steps": 7776, "loss": 0.5272, "learning_rate": 2.815672679025196e-06, "epoch": 5.087179487179487, "percentage": 15.95, "elapsed_time": "2:30:09", "remaining_time": "13:11:28", "throughput": 2126.44, "total_tokens": 19158048} {"current_steps": 1245, "total_steps": 7776, "loss": 0.5034, "learning_rate": 2.814214705565464e-06, "epoch": 5.107692307692307, "percentage": 16.01, "elapsed_time": "2:30:40", "remaining_time": "13:10:23", "throughput": 2127.57, "total_tokens": 19233888} {"current_steps": 1250, "total_steps": 7776, "loss": 0.5069, "learning_rate": 2.8127513692832047e-06, "epoch": 5.128205128205128, "percentage": 16.08, "elapsed_time": "2:31:37", "remaining_time": "13:11:35", "throughput": 2123.41, "total_tokens": 19317472} {"current_steps": 1255, "total_steps": 7776, "loss": 0.5116, "learning_rate": 2.8112826761497507e-06, "epoch": 5.148717948717949, "percentage": 16.14, "elapsed_time": "2:32:16", "remaining_time": "13:11:13", "throughput": 2123.17, "total_tokens": 19398496} {"current_steps": 1260, "total_steps": 7776, "loss": 0.4286, "learning_rate": 2.8098086321582937e-06, "epoch": 5.1692307692307695, "percentage": 16.2, "elapsed_time": "2:32:41", "remaining_time": "13:09:37", "throughput": 2124.84, "total_tokens": 19466400} {"current_steps": 1265, "total_steps": 7776, "loss": 0.5058, "learning_rate": 2.8083292433238602e-06, "epoch": 5.18974358974359, "percentage": 16.27, "elapsed_time": "2:33:13", "remaining_time": "13:08:38", "throughput": 2126.57, "total_tokens": 19550336} {"current_steps": 1270, "total_steps": 7776, "loss": 0.4587, "learning_rate": 2.8068445156832864e-06, "epoch": 5.21025641025641, "percentage": 16.33, "elapsed_time": "2:33:40", "remaining_time": "13:07:16", "throughput": 2128.45, "total_tokens": 19625792} {"current_steps": 1275, "total_steps": 7776, "loss": 0.4901, "learning_rate": 2.805354455295196e-06, "epoch": 5.230769230769231, "percentage": 16.4, "elapsed_time": "2:34:20", "remaining_time": "13:06:58", "throughput": 2128.56, "total_tokens": 19711776} {"current_steps": 1280, "total_steps": 7776, "loss": 0.5474, "learning_rate": 2.8038590682399718e-06, "epoch": 5.251282051282051, "percentage": 16.46, "elapsed_time": "2:34:56", "remaining_time": "13:06:18", "throughput": 2129.27, "total_tokens": 19794208} {"current_steps": 1285, "total_steps": 7776, "loss": 0.4452, "learning_rate": 2.8023583606197336e-06, "epoch": 5.271794871794872, "percentage": 16.53, "elapsed_time": "2:35:22", "remaining_time": "13:04:53", "throughput": 2131.54, "total_tokens": 19872128} {"current_steps": 1290, "total_steps": 7776, "loss": 0.5081, "learning_rate": 2.800852338558312e-06, "epoch": 5.292307692307692, "percentage": 16.59, "elapsed_time": "2:35:53", "remaining_time": "13:03:46", "throughput": 2133.42, "total_tokens": 19953856} {"current_steps": 1295, "total_steps": 7776, "loss": 0.4863, "learning_rate": 2.7993410082012247e-06, "epoch": 5.312820512820513, "percentage": 16.65, "elapsed_time": "2:36:15", "remaining_time": "13:02:03", "throughput": 2135.97, "total_tokens": 20026848} {"current_steps": 1300, "total_steps": 7776, "loss": 0.4979, "learning_rate": 2.79782437571565e-06, "epoch": 5.333333333333333, "percentage": 16.72, "elapsed_time": "2:36:38", "remaining_time": "13:00:17", "throughput": 2138.78, "total_tokens": 20100928} {"current_steps": 1305, "total_steps": 7776, "loss": 0.4676, "learning_rate": 2.7963024472904013e-06, "epoch": 5.3538461538461535, "percentage": 16.78, "elapsed_time": "2:36:59", "remaining_time": "12:58:28", "throughput": 2141.63, "total_tokens": 20173504} {"current_steps": 1310, "total_steps": 7776, "loss": 0.4256, "learning_rate": 2.7947752291359053e-06, "epoch": 5.374358974358975, "percentage": 16.85, "elapsed_time": "2:37:19", "remaining_time": "12:56:34", "throughput": 2144.58, "total_tokens": 20244608} {"current_steps": 1315, "total_steps": 7776, "loss": 0.4576, "learning_rate": 2.7932427274841715e-06, "epoch": 5.394871794871795, "percentage": 16.91, "elapsed_time": "2:37:42", "remaining_time": "12:54:52", "throughput": 2147.95, "total_tokens": 20324992} {"current_steps": 1320, "total_steps": 7776, "loss": 0.5155, "learning_rate": 2.7917049485887705e-06, "epoch": 5.415384615384616, "percentage": 16.98, "elapsed_time": "2:38:03", "remaining_time": "12:53:04", "throughput": 2151.28, "total_tokens": 20402304} {"current_steps": 1325, "total_steps": 7776, "loss": 0.4304, "learning_rate": 2.790161898724808e-06, "epoch": 5.435897435897436, "percentage": 17.04, "elapsed_time": "2:38:25", "remaining_time": "12:51:17", "throughput": 2154.72, "total_tokens": 20480800} {"current_steps": 1330, "total_steps": 7776, "loss": 0.4759, "learning_rate": 2.7886135841888973e-06, "epoch": 5.456410256410257, "percentage": 17.1, "elapsed_time": "2:38:46", "remaining_time": "12:49:29", "throughput": 2158.31, "total_tokens": 20560096} {"current_steps": 1335, "total_steps": 7776, "loss": 0.4974, "learning_rate": 2.787060011299135e-06, "epoch": 5.476923076923077, "percentage": 17.17, "elapsed_time": "2:39:07", "remaining_time": "12:47:44", "throughput": 2162.37, "total_tokens": 20645216} {"current_steps": 1340, "total_steps": 7776, "loss": 0.5174, "learning_rate": 2.785501186395077e-06, "epoch": 5.4974358974358974, "percentage": 17.23, "elapsed_time": "2:39:36", "remaining_time": "12:46:37", "throughput": 2165.5, "total_tokens": 20738688} {"current_steps": 1345, "total_steps": 7776, "loss": 0.5272, "learning_rate": 2.7839371158377077e-06, "epoch": 5.517948717948718, "percentage": 17.3, "elapsed_time": "2:40:08", "remaining_time": "12:45:42", "throughput": 2166.07, "total_tokens": 20812928} {"current_steps": 1350, "total_steps": 7776, "loss": 0.5129, "learning_rate": 2.78236780600942e-06, "epoch": 5.538461538461538, "percentage": 17.36, "elapsed_time": "2:41:07", "remaining_time": "12:46:56", "throughput": 2160.94, "total_tokens": 20890592} {"current_steps": 1355, "total_steps": 7776, "loss": 0.484, "learning_rate": 2.780793263313984e-06, "epoch": 5.558974358974359, "percentage": 17.43, "elapsed_time": "2:41:50", "remaining_time": "12:46:54", "throughput": 2158.76, "total_tokens": 20961984} {"current_steps": 1360, "total_steps": 7776, "loss": 0.4793, "learning_rate": 2.7792134941765247e-06, "epoch": 5.579487179487179, "percentage": 17.49, "elapsed_time": "2:42:30", "remaining_time": "12:46:39", "throughput": 2156.88, "total_tokens": 21030784} {"current_steps": 1365, "total_steps": 7776, "loss": 0.4521, "learning_rate": 2.7776285050434937e-06, "epoch": 5.6, "percentage": 17.55, "elapsed_time": "2:43:18", "remaining_time": "12:46:59", "throughput": 2154.38, "total_tokens": 21108960} {"current_steps": 1370, "total_steps": 7776, "loss": 0.4192, "learning_rate": 2.7760383023826425e-06, "epoch": 5.62051282051282, "percentage": 17.62, "elapsed_time": "2:43:59", "remaining_time": "12:46:46", "throughput": 2152.82, "total_tokens": 21181728} {"current_steps": 1375, "total_steps": 7776, "loss": 0.5131, "learning_rate": 2.7744428926829993e-06, "epoch": 5.641025641025641, "percentage": 17.68, "elapsed_time": "2:44:42", "remaining_time": "12:46:47", "throughput": 2150.71, "total_tokens": 21255328} {"current_steps": 1380, "total_steps": 7776, "loss": 0.483, "learning_rate": 2.7728422824548387e-06, "epoch": 5.661538461538462, "percentage": 17.75, "elapsed_time": "2:45:21", "remaining_time": "12:46:22", "throughput": 2149.35, "total_tokens": 21324064} {"current_steps": 1385, "total_steps": 7776, "loss": 0.4858, "learning_rate": 2.7712364782296567e-06, "epoch": 5.682051282051282, "percentage": 17.81, "elapsed_time": "2:46:03", "remaining_time": "12:46:14", "throughput": 2147.8, "total_tokens": 21399040} {"current_steps": 1390, "total_steps": 7776, "loss": 0.4629, "learning_rate": 2.769625486560145e-06, "epoch": 5.702564102564103, "percentage": 17.88, "elapsed_time": "2:46:43", "remaining_time": "12:45:56", "throughput": 2146.59, "total_tokens": 21472640} {"current_steps": 1395, "total_steps": 7776, "loss": 0.5023, "learning_rate": 2.7680093140201625e-06, "epoch": 5.723076923076923, "percentage": 17.94, "elapsed_time": "2:47:21", "remaining_time": "12:45:32", "throughput": 2145.49, "total_tokens": 21544448} {"current_steps": 1400, "total_steps": 7776, "loss": 0.4903, "learning_rate": 2.766387967204709e-06, "epoch": 5.743589743589744, "percentage": 18.0, "elapsed_time": "2:47:55", "remaining_time": "12:44:48", "throughput": 2144.84, "total_tokens": 21611136} {"current_steps": 1405, "total_steps": 7776, "loss": 0.5558, "learning_rate": 2.7647614527299007e-06, "epoch": 5.764102564102564, "percentage": 18.07, "elapsed_time": "2:49:04", "remaining_time": "12:46:39", "throughput": 2139.45, "total_tokens": 21703040} {"current_steps": 1410, "total_steps": 7776, "loss": 0.5612, "learning_rate": 2.763129777232938e-06, "epoch": 5.7846153846153845, "percentage": 18.13, "elapsed_time": "2:49:47", "remaining_time": "12:46:36", "throughput": 2138.28, "total_tokens": 21784096} {"current_steps": 1415, "total_steps": 7776, "loss": 0.4683, "learning_rate": 2.7614929473720847e-06, "epoch": 5.805128205128205, "percentage": 18.2, "elapsed_time": "2:50:22", "remaining_time": "12:45:55", "throughput": 2137.86, "total_tokens": 21855072} {"current_steps": 1420, "total_steps": 7776, "loss": 0.5171, "learning_rate": 2.7598509698266346e-06, "epoch": 5.825641025641025, "percentage": 18.26, "elapsed_time": "2:51:09", "remaining_time": "12:46:08", "throughput": 2135.71, "total_tokens": 21933312} {"current_steps": 1425, "total_steps": 7776, "loss": 0.5214, "learning_rate": 2.758203851296889e-06, "epoch": 5.846153846153846, "percentage": 18.33, "elapsed_time": "2:51:54", "remaining_time": "12:46:07", "throughput": 2134.86, "total_tokens": 22019008} {"current_steps": 1430, "total_steps": 7776, "loss": 0.4975, "learning_rate": 2.756551598504128e-06, "epoch": 5.866666666666667, "percentage": 18.39, "elapsed_time": "2:52:29", "remaining_time": "12:45:28", "throughput": 2134.67, "total_tokens": 22092864} {"current_steps": 1435, "total_steps": 7776, "loss": 0.4853, "learning_rate": 2.7548942181905816e-06, "epoch": 5.887179487179488, "percentage": 18.45, "elapsed_time": "2:53:07", "remaining_time": "12:45:00", "throughput": 2134.45, "total_tokens": 22171584} {"current_steps": 1440, "total_steps": 7776, "loss": 0.483, "learning_rate": 2.753231717119405e-06, "epoch": 5.907692307692308, "percentage": 18.52, "elapsed_time": "2:53:37", "remaining_time": "12:43:56", "throughput": 2135.02, "total_tokens": 22241376} {"current_steps": 1445, "total_steps": 7776, "loss": 0.4965, "learning_rate": 2.751564102074646e-06, "epoch": 5.9282051282051285, "percentage": 18.58, "elapsed_time": "2:54:09", "remaining_time": "12:43:00", "throughput": 2135.46, "total_tokens": 22313664} {"current_steps": 1450, "total_steps": 7776, "loss": 0.5342, "learning_rate": 2.749891379861225e-06, "epoch": 5.948717948717949, "percentage": 18.65, "elapsed_time": "2:54:54", "remaining_time": "12:43:07", "throughput": 2134.11, "total_tokens": 22397408} {"current_steps": 1455, "total_steps": 7776, "loss": 0.4233, "learning_rate": 2.748213557304899e-06, "epoch": 5.969230769230769, "percentage": 18.71, "elapsed_time": "2:55:28", "remaining_time": "12:42:20", "throughput": 2134.48, "total_tokens": 22473664} {"current_steps": 1460, "total_steps": 7776, "loss": 0.5244, "learning_rate": 2.74653064125224e-06, "epoch": 5.98974358974359, "percentage": 18.78, "elapsed_time": "2:56:07", "remaining_time": "12:41:54", "throughput": 2134.32, "total_tokens": 22553760} {"current_steps": 1465, "total_steps": 7776, "loss": 0.5211, "learning_rate": 2.7448426385706036e-06, "epoch": 6.01025641025641, "percentage": 18.84, "elapsed_time": "2:56:36", "remaining_time": "12:40:46", "throughput": 2135.17, "total_tokens": 22624608} {"current_steps": 1470, "total_steps": 7776, "loss": 0.5618, "learning_rate": 2.7431495561481027e-06, "epoch": 6.030769230769231, "percentage": 18.9, "elapsed_time": "2:57:14", "remaining_time": "12:40:20", "throughput": 2135.48, "total_tokens": 22710048} {"current_steps": 1475, "total_steps": 7776, "loss": 0.5172, "learning_rate": 2.741451400893578e-06, "epoch": 6.051282051282051, "percentage": 18.97, "elapsed_time": "2:57:47", "remaining_time": "12:39:31", "throughput": 2136.1, "total_tokens": 22787392} {"current_steps": 1480, "total_steps": 7776, "loss": 0.5035, "learning_rate": 2.739748179736571e-06, "epoch": 6.0717948717948715, "percentage": 19.03, "elapsed_time": "2:58:18", "remaining_time": "12:38:33", "throughput": 2137.14, "total_tokens": 22865120} {"current_steps": 1485, "total_steps": 7776, "loss": 0.519, "learning_rate": 2.7380398996272955e-06, "epoch": 6.092307692307692, "percentage": 19.1, "elapsed_time": "2:58:56", "remaining_time": "12:38:04", "throughput": 2137.79, "total_tokens": 22952832} {"current_steps": 1490, "total_steps": 7776, "loss": 0.4438, "learning_rate": 2.736326567536609e-06, "epoch": 6.112820512820512, "percentage": 19.16, "elapsed_time": "2:59:24", "remaining_time": "12:36:54", "throughput": 2139.24, "total_tokens": 23028544} {"current_steps": 1495, "total_steps": 7776, "loss": 0.4669, "learning_rate": 2.7346081904559827e-06, "epoch": 6.133333333333334, "percentage": 19.23, "elapsed_time": "2:59:49", "remaining_time": "12:35:31", "throughput": 2140.91, "total_tokens": 23100096} {"current_steps": 1500, "total_steps": 7776, "loss": 0.4702, "learning_rate": 2.732884775397477e-06, "epoch": 6.153846153846154, "percentage": 19.29, "elapsed_time": "3:00:25", "remaining_time": "12:34:55", "throughput": 2141.47, "total_tokens": 23183392} {"current_steps": 1505, "total_steps": 7776, "loss": 0.5031, "learning_rate": 2.731156329393709e-06, "epoch": 6.174358974358975, "percentage": 19.35, "elapsed_time": "3:00:57", "remaining_time": "12:34:02", "throughput": 2142.8, "total_tokens": 23266208} {"current_steps": 1510, "total_steps": 7776, "loss": 0.5005, "learning_rate": 2.729422859497825e-06, "epoch": 6.194871794871795, "percentage": 19.42, "elapsed_time": "3:01:25", "remaining_time": "12:32:52", "throughput": 2144.83, "total_tokens": 23348064} {"current_steps": 1515, "total_steps": 7776, "loss": 0.4798, "learning_rate": 2.7276843727834727e-06, "epoch": 6.2153846153846155, "percentage": 19.48, "elapsed_time": "3:01:48", "remaining_time": "12:31:22", "throughput": 2146.89, "total_tokens": 23420128} {"current_steps": 1520, "total_steps": 7776, "loss": 0.5059, "learning_rate": 2.725940876344771e-06, "epoch": 6.235897435897436, "percentage": 19.55, "elapsed_time": "3:02:13", "remaining_time": "12:29:59", "throughput": 2149.09, "total_tokens": 23497056} {"current_steps": 1525, "total_steps": 7776, "loss": 0.4582, "learning_rate": 2.7241923772962823e-06, "epoch": 6.256410256410256, "percentage": 19.61, "elapsed_time": "3:02:32", "remaining_time": "12:28:16", "throughput": 2151.47, "total_tokens": 23564928} {"current_steps": 1530, "total_steps": 7776, "loss": 0.4295, "learning_rate": 2.722438882772982e-06, "epoch": 6.276923076923077, "percentage": 19.68, "elapsed_time": "3:02:59", "remaining_time": "12:27:04", "throughput": 2153.61, "total_tokens": 23646624} {"current_steps": 1535, "total_steps": 7776, "loss": 0.4682, "learning_rate": 2.720680399930231e-06, "epoch": 6.297435897435897, "percentage": 19.74, "elapsed_time": "3:03:19", "remaining_time": "12:25:22", "throughput": 2156.13, "total_tokens": 23716960} {"current_steps": 1540, "total_steps": 7776, "loss": 0.4944, "learning_rate": 2.7189169359437443e-06, "epoch": 6.317948717948718, "percentage": 19.8, "elapsed_time": "3:03:44", "remaining_time": "12:24:01", "throughput": 2158.48, "total_tokens": 23796032} {"current_steps": 1545, "total_steps": 7776, "loss": 0.4405, "learning_rate": 2.7171484980095653e-06, "epoch": 6.338461538461538, "percentage": 19.87, "elapsed_time": "3:04:02", "remaining_time": "12:22:14", "throughput": 2161.51, "total_tokens": 23868768} {"current_steps": 1550, "total_steps": 7776, "loss": 0.4742, "learning_rate": 2.715375093344032e-06, "epoch": 6.358974358974359, "percentage": 19.93, "elapsed_time": "3:04:20", "remaining_time": "12:20:25", "throughput": 2164.35, "total_tokens": 23937824} {"current_steps": 1555, "total_steps": 7776, "loss": 0.4654, "learning_rate": 2.713596729183751e-06, "epoch": 6.37948717948718, "percentage": 20.0, "elapsed_time": "3:04:37", "remaining_time": "12:18:38", "throughput": 2167.34, "total_tokens": 24009472} {"current_steps": 1560, "total_steps": 7776, "loss": 0.4686, "learning_rate": 2.7118134127855667e-06, "epoch": 6.4, "percentage": 20.06, "elapsed_time": "3:05:12", "remaining_time": "12:17:58", "throughput": 2168.43, "total_tokens": 24096256} {"current_steps": 1565, "total_steps": 7776, "loss": 0.5152, "learning_rate": 2.7100251514265317e-06, "epoch": 6.420512820512821, "percentage": 20.13, "elapsed_time": "3:05:34", "remaining_time": "12:16:28", "throughput": 2171.73, "total_tokens": 24180640} {"current_steps": 1570, "total_steps": 7776, "loss": 0.4762, "learning_rate": 2.7082319524038764e-06, "epoch": 6.441025641025641, "percentage": 20.19, "elapsed_time": "3:06:06", "remaining_time": "12:15:41", "throughput": 2171.71, "total_tokens": 24251296} {"current_steps": 1575, "total_steps": 7776, "loss": 0.5113, "learning_rate": 2.706433823034981e-06, "epoch": 6.461538461538462, "percentage": 20.25, "elapsed_time": "3:07:00", "remaining_time": "12:16:15", "throughput": 2168.4, "total_tokens": 24329760} {"current_steps": 1580, "total_steps": 7776, "loss": 0.4942, "learning_rate": 2.7046307706573445e-06, "epoch": 6.482051282051282, "percentage": 20.32, "elapsed_time": "3:08:14", "remaining_time": "12:18:11", "throughput": 2162.21, "total_tokens": 24420896} {"current_steps": 1585, "total_steps": 7776, "loss": 0.475, "learning_rate": 2.702822802628554e-06, "epoch": 6.5025641025641026, "percentage": 20.38, "elapsed_time": "3:08:58", "remaining_time": "12:18:06", "throughput": 2160.43, "total_tokens": 24495360} {"current_steps": 1590, "total_steps": 7776, "loss": 0.4801, "learning_rate": 2.701009926326256e-06, "epoch": 6.523076923076923, "percentage": 20.45, "elapsed_time": "3:09:45", "remaining_time": "12:18:17", "throughput": 2158.11, "total_tokens": 24572192} {"current_steps": 1595, "total_steps": 7776, "loss": 0.4776, "learning_rate": 2.6991921491481267e-06, "epoch": 6.543589743589743, "percentage": 20.51, "elapsed_time": "3:10:28", "remaining_time": "12:18:09", "throughput": 2156.6, "total_tokens": 24647552} {"current_steps": 1600, "total_steps": 7776, "loss": 0.4878, "learning_rate": 2.6973694785118394e-06, "epoch": 6.564102564102564, "percentage": 20.58, "elapsed_time": "3:11:08", "remaining_time": "12:17:47", "throughput": 2155.42, "total_tokens": 24719136} {"current_steps": 1605, "total_steps": 7776, "loss": 0.5138, "learning_rate": 2.695541921855037e-06, "epoch": 6.584615384615384, "percentage": 20.64, "elapsed_time": "3:11:56", "remaining_time": "12:17:59", "throughput": 2153.44, "total_tokens": 24800320} {"current_steps": 1610, "total_steps": 7776, "loss": 0.4782, "learning_rate": 2.6937094866353006e-06, "epoch": 6.605128205128205, "percentage": 20.7, "elapsed_time": "3:12:42", "remaining_time": "12:18:00", "throughput": 2151.62, "total_tokens": 24877088} {"current_steps": 1615, "total_steps": 7776, "loss": 0.5043, "learning_rate": 2.6918721803301174e-06, "epoch": 6.625641025641025, "percentage": 20.77, "elapsed_time": "3:13:24", "remaining_time": "12:17:50", "throughput": 2150.33, "total_tokens": 24954272} {"current_steps": 1620, "total_steps": 7776, "loss": 0.4237, "learning_rate": 2.690030010436853e-06, "epoch": 6.6461538461538465, "percentage": 20.83, "elapsed_time": "3:14:01", "remaining_time": "12:17:17", "throughput": 2149.55, "total_tokens": 25023744} {"current_steps": 1625, "total_steps": 7776, "loss": 0.5302, "learning_rate": 2.688182984472719e-06, "epoch": 6.666666666666667, "percentage": 20.9, "elapsed_time": "3:14:46", "remaining_time": "12:17:17", "throughput": 2148.18, "total_tokens": 25105664} {"current_steps": 1630, "total_steps": 7776, "loss": 0.4991, "learning_rate": 2.686331109974743e-06, "epoch": 6.687179487179487, "percentage": 20.96, "elapsed_time": "3:15:32", "remaining_time": "12:17:16", "throughput": 2146.58, "total_tokens": 25183680} {"current_steps": 1635, "total_steps": 7776, "loss": 0.5142, "learning_rate": 2.684474394499738e-06, "epoch": 6.707692307692308, "percentage": 21.03, "elapsed_time": "3:17:08", "remaining_time": "12:20:29", "throughput": 2135.94, "total_tokens": 25265920} {"current_steps": 1640, "total_steps": 7776, "loss": 0.4651, "learning_rate": 2.6826128456242708e-06, "epoch": 6.728205128205128, "percentage": 21.09, "elapsed_time": "3:17:48", "remaining_time": "12:20:06", "throughput": 2135.33, "total_tokens": 25343648} {"current_steps": 1645, "total_steps": 7776, "loss": 0.5633, "learning_rate": 2.680746470944631e-06, "epoch": 6.748717948717949, "percentage": 21.15, "elapsed_time": "3:18:25", "remaining_time": "12:19:34", "throughput": 2134.91, "total_tokens": 25418176} {"current_steps": 1650, "total_steps": 7776, "loss": 0.5124, "learning_rate": 2.6788752780768007e-06, "epoch": 6.769230769230769, "percentage": 21.22, "elapsed_time": "3:19:11", "remaining_time": "12:19:32", "throughput": 2134.05, "total_tokens": 25504832} {"current_steps": 1655, "total_steps": 7776, "loss": 0.5046, "learning_rate": 2.6769992746564256e-06, "epoch": 6.78974358974359, "percentage": 21.28, "elapsed_time": "3:19:49", "remaining_time": "12:19:03", "throughput": 2133.7, "total_tokens": 25582112} {"current_steps": 1660, "total_steps": 7776, "loss": 0.484, "learning_rate": 2.6751184683387777e-06, "epoch": 6.81025641025641, "percentage": 21.35, "elapsed_time": "3:20:25", "remaining_time": "12:18:24", "throughput": 2133.63, "total_tokens": 25656992} {"current_steps": 1665, "total_steps": 7776, "loss": 0.4526, "learning_rate": 2.67323286679873e-06, "epoch": 6.8307692307692305, "percentage": 21.41, "elapsed_time": "3:20:56", "remaining_time": "12:17:31", "throughput": 2134.05, "total_tokens": 25729600} {"current_steps": 1670, "total_steps": 7776, "loss": 0.4563, "learning_rate": 2.671342477730723e-06, "epoch": 6.851282051282051, "percentage": 21.48, "elapsed_time": "3:21:28", "remaining_time": "12:16:38", "throughput": 2134.43, "total_tokens": 25801536} {"current_steps": 1675, "total_steps": 7776, "loss": 0.4951, "learning_rate": 2.6694473088487324e-06, "epoch": 6.871794871794872, "percentage": 21.54, "elapsed_time": "3:22:06", "remaining_time": "12:16:07", "throughput": 2134.49, "total_tokens": 25882912} {"current_steps": 1680, "total_steps": 7776, "loss": 0.5223, "learning_rate": 2.6675473678862403e-06, "epoch": 6.892307692307693, "percentage": 21.6, "elapsed_time": "3:22:38", "remaining_time": "12:15:19", "throughput": 2134.88, "total_tokens": 25957952} {"current_steps": 1685, "total_steps": 7776, "loss": 0.5471, "learning_rate": 2.6656426625961993e-06, "epoch": 6.912820512820513, "percentage": 21.67, "elapsed_time": "3:23:11", "remaining_time": "12:14:31", "throughput": 2135.39, "total_tokens": 26034432} {"current_steps": 1690, "total_steps": 7776, "loss": 0.4252, "learning_rate": 2.6637332007510063e-06, "epoch": 6.933333333333334, "percentage": 21.73, "elapsed_time": "3:23:41", "remaining_time": "12:13:30", "throughput": 2136.2, "total_tokens": 26106656} {"current_steps": 1695, "total_steps": 7776, "loss": 0.5269, "learning_rate": 2.661818990142465e-06, "epoch": 6.953846153846154, "percentage": 21.8, "elapsed_time": "3:24:14", "remaining_time": "12:12:45", "throughput": 2136.89, "total_tokens": 26186976} {"current_steps": 1700, "total_steps": 7776, "loss": 0.4487, "learning_rate": 2.65990003858176e-06, "epoch": 6.9743589743589745, "percentage": 21.86, "elapsed_time": "3:24:41", "remaining_time": "12:11:37", "throughput": 2138.04, "total_tokens": 26259264} {"current_steps": 1705, "total_steps": 7776, "loss": 0.4705, "learning_rate": 2.6579763538994197e-06, "epoch": 6.994871794871795, "percentage": 21.93, "elapsed_time": "3:25:10", "remaining_time": "12:10:32", "throughput": 2139.16, "total_tokens": 26333248} {"current_steps": 1710, "total_steps": 7776, "loss": 0.4443, "learning_rate": 2.656047943945287e-06, "epoch": 7.015384615384615, "percentage": 21.99, "elapsed_time": "3:25:36", "remaining_time": "12:09:21", "throughput": 2140.39, "total_tokens": 26404832} {"current_steps": 1715, "total_steps": 7776, "loss": 0.4615, "learning_rate": 2.6541148165884885e-06, "epoch": 7.035897435897436, "percentage": 22.06, "elapsed_time": "3:26:07", "remaining_time": "12:08:28", "throughput": 2141.45, "total_tokens": 26484608} {"current_steps": 1720, "total_steps": 7776, "loss": 0.5042, "learning_rate": 2.652176979717399e-06, "epoch": 7.056410256410256, "percentage": 22.12, "elapsed_time": "3:26:31", "remaining_time": "12:07:10", "throughput": 2143.07, "total_tokens": 26556224} {"current_steps": 1725, "total_steps": 7776, "loss": 0.4601, "learning_rate": 2.6502344412396116e-06, "epoch": 7.076923076923077, "percentage": 22.18, "elapsed_time": "3:26:57", "remaining_time": "12:05:57", "throughput": 2144.58, "total_tokens": 26629632} {"current_steps": 1730, "total_steps": 7776, "loss": 0.534, "learning_rate": 2.6482872090819053e-06, "epoch": 7.097435897435897, "percentage": 22.25, "elapsed_time": "3:27:25", "remaining_time": "12:04:53", "throughput": 2146.15, "total_tokens": 26709568} {"current_steps": 1735, "total_steps": 7776, "loss": 0.4875, "learning_rate": 2.646335291190211e-06, "epoch": 7.1179487179487175, "percentage": 22.31, "elapsed_time": "3:27:51", "remaining_time": "12:03:43", "throughput": 2147.78, "total_tokens": 26785728} {"current_steps": 1740, "total_steps": 7776, "loss": 0.5223, "learning_rate": 2.6443786955295827e-06, "epoch": 7.138461538461539, "percentage": 22.38, "elapsed_time": "3:28:17", "remaining_time": "12:02:34", "throughput": 2149.57, "total_tokens": 26865024} {"current_steps": 1745, "total_steps": 7776, "loss": 0.4365, "learning_rate": 2.6424174300841606e-06, "epoch": 7.158974358974359, "percentage": 22.44, "elapsed_time": "3:28:39", "remaining_time": "12:01:09", "throughput": 2151.42, "total_tokens": 26934720} {"current_steps": 1750, "total_steps": 7776, "loss": 0.4951, "learning_rate": 2.6404515028571406e-06, "epoch": 7.17948717948718, "percentage": 22.51, "elapsed_time": "3:29:01", "remaining_time": "11:59:45", "throughput": 2153.54, "total_tokens": 27008192} {"current_steps": 1755, "total_steps": 7776, "loss": 0.5132, "learning_rate": 2.638480921870743e-06, "epoch": 7.2, "percentage": 22.57, "elapsed_time": "3:29:26", "remaining_time": "11:58:33", "throughput": 2155.87, "total_tokens": 27092000} {"current_steps": 1760, "total_steps": 7776, "loss": 0.4713, "learning_rate": 2.636505695166177e-06, "epoch": 7.220512820512821, "percentage": 22.63, "elapsed_time": "3:29:50", "remaining_time": "11:57:17", "throughput": 2158.11, "total_tokens": 27172160} {"current_steps": 1765, "total_steps": 7776, "loss": 0.479, "learning_rate": 2.63452583080361e-06, "epoch": 7.241025641025641, "percentage": 22.7, "elapsed_time": "3:30:15", "remaining_time": "11:56:03", "throughput": 2160.51, "total_tokens": 27255712} {"current_steps": 1770, "total_steps": 7776, "loss": 0.4967, "learning_rate": 2.6325413368621337e-06, "epoch": 7.2615384615384615, "percentage": 22.76, "elapsed_time": "3:30:55", "remaining_time": "11:55:41", "throughput": 2160.64, "total_tokens": 27343136} {"current_steps": 1775, "total_steps": 7776, "loss": 0.4843, "learning_rate": 2.630552221439732e-06, "epoch": 7.282051282051282, "percentage": 22.83, "elapsed_time": "3:31:14", "remaining_time": "11:54:08", "throughput": 2163.27, "total_tokens": 27417312} {"current_steps": 1780, "total_steps": 7776, "loss": 0.4738, "learning_rate": 2.6285584926532465e-06, "epoch": 7.302564102564102, "percentage": 22.89, "elapsed_time": "3:31:52", "remaining_time": "11:53:41", "throughput": 2163.73, "total_tokens": 27505824} {"current_steps": 1785, "total_steps": 7776, "loss": 0.5716, "learning_rate": 2.626560158638344e-06, "epoch": 7.323076923076923, "percentage": 22.96, "elapsed_time": "3:32:14", "remaining_time": "11:52:21", "throughput": 2166.05, "total_tokens": 27583776} {"current_steps": 1790, "total_steps": 7776, "loss": 0.515, "learning_rate": 2.6245572275494845e-06, "epoch": 7.343589743589743, "percentage": 23.02, "elapsed_time": "3:32:30", "remaining_time": "11:50:40", "throughput": 2169.17, "total_tokens": 27658912} {"current_steps": 1795, "total_steps": 7776, "loss": 0.47, "learning_rate": 2.6225497075598865e-06, "epoch": 7.364102564102564, "percentage": 23.08, "elapsed_time": "3:33:11", "remaining_time": "11:50:20", "throughput": 2168.18, "total_tokens": 27733472} {"current_steps": 1800, "total_steps": 7776, "loss": 0.4749, "learning_rate": 2.6205376068614943e-06, "epoch": 7.384615384615385, "percentage": 23.15, "elapsed_time": "3:34:01", "remaining_time": "11:50:32", "throughput": 2165.86, "total_tokens": 27812160} {"current_steps": 1805, "total_steps": 7776, "loss": 0.4727, "learning_rate": 2.6185209336649438e-06, "epoch": 7.4051282051282055, "percentage": 23.21, "elapsed_time": "3:34:43", "remaining_time": "11:50:20", "throughput": 2164.32, "total_tokens": 27885024} {"current_steps": 1810, "total_steps": 7776, "loss": 0.478, "learning_rate": 2.61649969619953e-06, "epoch": 7.425641025641026, "percentage": 23.28, "elapsed_time": "3:35:26", "remaining_time": "11:50:07", "throughput": 2162.73, "total_tokens": 27956480} {"current_steps": 1815, "total_steps": 7776, "loss": 0.4778, "learning_rate": 2.614473902713173e-06, "epoch": 7.446153846153846, "percentage": 23.34, "elapsed_time": "3:36:07", "remaining_time": "11:49:50", "throughput": 2161.35, "total_tokens": 28028032} {"current_steps": 1820, "total_steps": 7776, "loss": 0.4443, "learning_rate": 2.612443561472385e-06, "epoch": 7.466666666666667, "percentage": 23.41, "elapsed_time": "3:37:00", "remaining_time": "11:50:10", "throughput": 2159.1, "total_tokens": 28112992} {"current_steps": 1825, "total_steps": 7776, "loss": 0.5186, "learning_rate": 2.610408680762234e-06, "epoch": 7.487179487179487, "percentage": 23.47, "elapsed_time": "3:37:48", "remaining_time": "11:50:14", "throughput": 2157.17, "total_tokens": 28191520} {"current_steps": 1830, "total_steps": 7776, "loss": 0.5152, "learning_rate": 2.6083692688863135e-06, "epoch": 7.507692307692308, "percentage": 23.53, "elapsed_time": "3:38:45", "remaining_time": "11:50:46", "throughput": 2154.44, "total_tokens": 28277440} {"current_steps": 1835, "total_steps": 7776, "loss": 0.5173, "learning_rate": 2.6063253341667064e-06, "epoch": 7.528205128205128, "percentage": 23.6, "elapsed_time": "3:39:36", "remaining_time": "11:51:01", "throughput": 2152.05, "total_tokens": 28357440} {"current_steps": 1840, "total_steps": 7776, "loss": 0.4585, "learning_rate": 2.604276884943953e-06, "epoch": 7.5487179487179485, "percentage": 23.66, "elapsed_time": "3:40:12", "remaining_time": "11:50:25", "throughput": 2151.47, "total_tokens": 28426656} {"current_steps": 1845, "total_steps": 7776, "loss": 0.4611, "learning_rate": 2.602223929577013e-06, "epoch": 7.569230769230769, "percentage": 23.73, "elapsed_time": "3:40:51", "remaining_time": "11:49:58", "throughput": 2150.72, "total_tokens": 28499968} {"current_steps": 1850, "total_steps": 7776, "loss": 0.4929, "learning_rate": 2.6001664764432363e-06, "epoch": 7.589743589743589, "percentage": 23.79, "elapsed_time": "3:41:29", "remaining_time": "11:49:30", "throughput": 2150.06, "total_tokens": 28573664} {"current_steps": 1855, "total_steps": 7776, "loss": 0.5018, "learning_rate": 2.5981045339383244e-06, "epoch": 7.61025641025641, "percentage": 23.86, "elapsed_time": "3:42:45", "remaining_time": "11:51:01", "throughput": 2144.18, "total_tokens": 28658144} {"current_steps": 1860, "total_steps": 7776, "loss": 0.483, "learning_rate": 2.596038110476301e-06, "epoch": 7.63076923076923, "percentage": 23.92, "elapsed_time": "3:43:22", "remaining_time": "11:50:29", "throughput": 2143.66, "total_tokens": 28730944} {"current_steps": 1865, "total_steps": 7776, "loss": 0.5111, "learning_rate": 2.593967214489473e-06, "epoch": 7.651282051282052, "percentage": 23.98, "elapsed_time": "3:44:55", "remaining_time": "11:52:51", "throughput": 2135.33, "total_tokens": 28816384} {"current_steps": 1870, "total_steps": 7776, "loss": 0.4689, "learning_rate": 2.591891854428398e-06, "epoch": 7.671794871794872, "percentage": 24.05, "elapsed_time": "3:45:32", "remaining_time": "11:52:19", "throughput": 2134.98, "total_tokens": 28891616} {"current_steps": 1875, "total_steps": 7776, "loss": 0.4917, "learning_rate": 2.5898120387618507e-06, "epoch": 7.6923076923076925, "percentage": 24.11, "elapsed_time": "3:46:19", "remaining_time": "11:52:16", "throughput": 2133.42, "total_tokens": 28970400} {"current_steps": 1880, "total_steps": 7776, "loss": 0.4956, "learning_rate": 2.587727775976787e-06, "epoch": 7.712820512820513, "percentage": 24.18, "elapsed_time": "3:47:00", "remaining_time": "11:51:57", "throughput": 2132.87, "total_tokens": 29051520} {"current_steps": 1885, "total_steps": 7776, "loss": 0.438, "learning_rate": 2.585639074578309e-06, "epoch": 7.733333333333333, "percentage": 24.24, "elapsed_time": "3:47:37", "remaining_time": "11:51:23", "throughput": 2132.76, "total_tokens": 29128544} {"current_steps": 1890, "total_steps": 7776, "loss": 0.4644, "learning_rate": 2.5835459430896333e-06, "epoch": 7.753846153846154, "percentage": 24.31, "elapsed_time": "3:48:16", "remaining_time": "11:50:55", "throughput": 2132.64, "total_tokens": 29210496} {"current_steps": 1895, "total_steps": 7776, "loss": 0.4901, "learning_rate": 2.5814483900520522e-06, "epoch": 7.774358974358974, "percentage": 24.37, "elapsed_time": "3:48:47", "remaining_time": "11:50:00", "throughput": 2133.19, "total_tokens": 29282400} {"current_steps": 1900, "total_steps": 7776, "loss": 0.4879, "learning_rate": 2.5793464240249014e-06, "epoch": 7.794871794871795, "percentage": 24.43, "elapsed_time": "3:49:16", "remaining_time": "11:49:04", "throughput": 2133.67, "total_tokens": 29352256} {"current_steps": 1905, "total_steps": 7776, "loss": 0.4552, "learning_rate": 2.5772400535855242e-06, "epoch": 7.815384615384615, "percentage": 24.5, "elapsed_time": "3:49:48", "remaining_time": "11:48:14", "throughput": 2134.13, "total_tokens": 29426336} {"current_steps": 1910, "total_steps": 7776, "loss": 0.5417, "learning_rate": 2.575129287329237e-06, "epoch": 7.835897435897436, "percentage": 24.56, "elapsed_time": "3:50:32", "remaining_time": "11:48:02", "throughput": 2133.55, "total_tokens": 29512224} {"current_steps": 1915, "total_steps": 7776, "loss": 0.4637, "learning_rate": 2.5730141338692926e-06, "epoch": 7.856410256410256, "percentage": 24.63, "elapsed_time": "3:51:04", "remaining_time": "11:47:13", "throughput": 2134.22, "total_tokens": 29590112} {"current_steps": 1920, "total_steps": 7776, "loss": 0.4486, "learning_rate": 2.5708946018368487e-06, "epoch": 7.876923076923077, "percentage": 24.69, "elapsed_time": "3:51:39", "remaining_time": "11:46:34", "throughput": 2134.76, "total_tokens": 29672608} {"current_steps": 1925, "total_steps": 7776, "loss": 0.5094, "learning_rate": 2.568770699880928e-06, "epoch": 7.897435897435898, "percentage": 24.76, "elapsed_time": "3:52:19", "remaining_time": "11:46:09", "throughput": 2134.59, "total_tokens": 29755520} {"current_steps": 1930, "total_steps": 7776, "loss": 0.5111, "learning_rate": 2.566642436668387e-06, "epoch": 7.917948717948718, "percentage": 24.82, "elapsed_time": "3:52:49", "remaining_time": "11:45:12", "throughput": 2135.67, "total_tokens": 29833344} {"current_steps": 1935, "total_steps": 7776, "loss": 0.4737, "learning_rate": 2.5645098208838774e-06, "epoch": 7.938461538461539, "percentage": 24.88, "elapsed_time": "3:53:15", "remaining_time": "11:44:06", "throughput": 2136.77, "total_tokens": 29904800} {"current_steps": 1940, "total_steps": 7776, "loss": 0.4384, "learning_rate": 2.562372861229813e-06, "epoch": 7.958974358974359, "percentage": 24.95, "elapsed_time": "3:53:40", "remaining_time": "11:42:57", "throughput": 2137.96, "total_tokens": 29975488} {"current_steps": 1945, "total_steps": 7776, "loss": 0.4383, "learning_rate": 2.5602315664263337e-06, "epoch": 7.97948717948718, "percentage": 25.01, "elapsed_time": "3:54:04", "remaining_time": "11:41:44", "throughput": 2139.37, "total_tokens": 30046496} {"current_steps": 1950, "total_steps": 7776, "loss": 0.4782, "learning_rate": 2.5580859452112685e-06, "epoch": 8.0, "percentage": 25.08, "elapsed_time": "3:54:29", "remaining_time": "11:40:35", "throughput": 2140.76, "total_tokens": 30119840} {"current_steps": 1955, "total_steps": 7776, "loss": 0.5371, "learning_rate": 2.555936006340101e-06, "epoch": 8.02051282051282, "percentage": 25.14, "elapsed_time": "3:55:01", "remaining_time": "11:39:47", "throughput": 2142.1, "total_tokens": 30207040} {"current_steps": 1960, "total_steps": 7776, "loss": 0.4867, "learning_rate": 2.553781758585935e-06, "epoch": 8.04102564102564, "percentage": 25.21, "elapsed_time": "3:55:27", "remaining_time": "11:38:40", "throughput": 2143.63, "total_tokens": 30283968} {"current_steps": 1965, "total_steps": 7776, "loss": 0.4309, "learning_rate": 2.551623210739455e-06, "epoch": 8.061538461538461, "percentage": 25.27, "elapsed_time": "3:55:48", "remaining_time": "11:37:22", "throughput": 2145.43, "total_tokens": 30355552} {"current_steps": 1970, "total_steps": 7776, "loss": 0.5087, "learning_rate": 2.549460371608895e-06, "epoch": 8.082051282051282, "percentage": 25.33, "elapsed_time": "3:56:17", "remaining_time": "11:36:24", "throughput": 2146.76, "total_tokens": 30435776} {"current_steps": 1975, "total_steps": 7776, "loss": 0.4746, "learning_rate": 2.5472932500199976e-06, "epoch": 8.102564102564102, "percentage": 25.4, "elapsed_time": "3:56:39", "remaining_time": "11:35:08", "throughput": 2148.44, "total_tokens": 30507616} {"current_steps": 1980, "total_steps": 7776, "loss": 0.4833, "learning_rate": 2.5451218548159823e-06, "epoch": 8.123076923076923, "percentage": 25.46, "elapsed_time": "3:57:01", "remaining_time": "11:33:50", "throughput": 2150.5, "total_tokens": 30583456} {"current_steps": 1985, "total_steps": 7776, "loss": 0.4849, "learning_rate": 2.5429461948575077e-06, "epoch": 8.143589743589743, "percentage": 25.53, "elapsed_time": "3:57:20", "remaining_time": "11:32:26", "throughput": 2152.54, "total_tokens": 30654176} {"current_steps": 1990, "total_steps": 7776, "loss": 0.4812, "learning_rate": 2.540766279022634e-06, "epoch": 8.164102564102564, "percentage": 25.59, "elapsed_time": "3:57:39", "remaining_time": "11:30:58", "throughput": 2154.56, "total_tokens": 30721920} {"current_steps": 1995, "total_steps": 7776, "loss": 0.4976, "learning_rate": 2.53858211620679e-06, "epoch": 8.184615384615384, "percentage": 25.66, "elapsed_time": "3:57:57", "remaining_time": "11:29:31", "throughput": 2156.7, "total_tokens": 30791264} {"current_steps": 2000, "total_steps": 7776, "loss": 0.4556, "learning_rate": 2.536393715322732e-06, "epoch": 8.205128205128204, "percentage": 25.72, "elapsed_time": "3:58:13", "remaining_time": "11:28:00", "throughput": 2159.15, "total_tokens": 30862336} {"current_steps": 2005, "total_steps": 7776, "loss": 0.4496, "learning_rate": 2.5342010853005127e-06, "epoch": 8.225641025641025, "percentage": 25.78, "elapsed_time": "3:58:53", "remaining_time": "11:27:35", "throughput": 2158.63, "total_tokens": 30940064} {"current_steps": 2010, "total_steps": 7776, "loss": 0.4722, "learning_rate": 2.532004235087441e-06, "epoch": 8.246153846153845, "percentage": 25.85, "elapsed_time": "3:59:10", "remaining_time": "11:26:06", "throughput": 2161.14, "total_tokens": 31013248} {"current_steps": 2015, "total_steps": 7776, "loss": 0.4875, "learning_rate": 2.529803173648049e-06, "epoch": 8.266666666666667, "percentage": 25.91, "elapsed_time": "3:59:30", "remaining_time": "11:24:45", "throughput": 2163.78, "total_tokens": 31094496} {"current_steps": 2020, "total_steps": 7776, "loss": 0.4598, "learning_rate": 2.52759790996405e-06, "epoch": 8.287179487179488, "percentage": 25.98, "elapsed_time": "4:00:31", "remaining_time": "11:25:22", "throughput": 2159.99, "total_tokens": 31171680} {"current_steps": 2025, "total_steps": 7776, "loss": 0.5069, "learning_rate": 2.525388453034307e-06, "epoch": 8.307692307692308, "percentage": 26.04, "elapsed_time": "4:01:30", "remaining_time": "11:25:51", "throughput": 2156.8, "total_tokens": 31252064} {"current_steps": 2030, "total_steps": 7776, "loss": 0.5155, "learning_rate": 2.5231748118747945e-06, "epoch": 8.328205128205129, "percentage": 26.11, "elapsed_time": "4:02:17", "remaining_time": "11:25:49", "throughput": 2155.05, "total_tokens": 31329696} {"current_steps": 2035, "total_steps": 7776, "loss": 0.5436, "learning_rate": 2.5209569955185604e-06, "epoch": 8.34871794871795, "percentage": 26.17, "elapsed_time": "4:03:20", "remaining_time": "11:26:29", "throughput": 2151.17, "total_tokens": 31407648} {"current_steps": 2040, "total_steps": 7776, "loss": 0.4953, "learning_rate": 2.51873501301569e-06, "epoch": 8.36923076923077, "percentage": 26.23, "elapsed_time": "4:03:58", "remaining_time": "11:26:00", "throughput": 2150.15, "total_tokens": 31475200} {"current_steps": 2045, "total_steps": 7776, "loss": 0.4804, "learning_rate": 2.5165088734332695e-06, "epoch": 8.38974358974359, "percentage": 26.3, "elapsed_time": "4:04:40", "remaining_time": "11:25:42", "throughput": 2148.86, "total_tokens": 31547104} {"current_steps": 2050, "total_steps": 7776, "loss": 0.5533, "learning_rate": 2.5142785858553486e-06, "epoch": 8.41025641025641, "percentage": 26.36, "elapsed_time": "4:05:40", "remaining_time": "11:26:12", "throughput": 2145.74, "total_tokens": 31629440} {"current_steps": 2055, "total_steps": 7776, "loss": 0.541, "learning_rate": 2.512044159382903e-06, "epoch": 8.430769230769231, "percentage": 26.43, "elapsed_time": "4:06:47", "remaining_time": "11:27:03", "throughput": 2141.68, "total_tokens": 31713024} {"current_steps": 2060, "total_steps": 7776, "loss": 0.4444, "learning_rate": 2.5098056031337975e-06, "epoch": 8.451282051282051, "percentage": 26.49, "elapsed_time": "4:07:31", "remaining_time": "11:26:49", "throughput": 2140.54, "total_tokens": 31790432} {"current_steps": 2065, "total_steps": 7776, "loss": 0.4869, "learning_rate": 2.5075629262427507e-06, "epoch": 8.471794871794872, "percentage": 26.56, "elapsed_time": "4:08:19", "remaining_time": "11:26:45", "throughput": 2139.09, "total_tokens": 31870592} {"current_steps": 2070, "total_steps": 7776, "loss": 0.4855, "learning_rate": 2.505316137861294e-06, "epoch": 8.492307692307692, "percentage": 26.62, "elapsed_time": "4:09:10", "remaining_time": "11:26:52", "throughput": 2136.67, "total_tokens": 31945344} {"current_steps": 2075, "total_steps": 7776, "loss": 0.5027, "learning_rate": 2.503065247157737e-06, "epoch": 8.512820512820513, "percentage": 26.68, "elapsed_time": "4:10:44", "remaining_time": "11:28:54", "throughput": 2129.0, "total_tokens": 32030016} {"current_steps": 2080, "total_steps": 7776, "loss": 0.4885, "learning_rate": 2.500810263317129e-06, "epoch": 8.533333333333333, "percentage": 26.75, "elapsed_time": "4:11:25", "remaining_time": "11:28:32", "throughput": 2128.36, "total_tokens": 32108160} {"current_steps": 2085, "total_steps": 7776, "loss": 0.4451, "learning_rate": 2.4985511955412238e-06, "epoch": 8.553846153846154, "percentage": 26.81, "elapsed_time": "4:12:14", "remaining_time": "11:28:30", "throughput": 2126.76, "total_tokens": 32188288} {"current_steps": 2090, "total_steps": 7776, "loss": 0.4899, "learning_rate": 2.4962880530484375e-06, "epoch": 8.574358974358974, "percentage": 26.88, "elapsed_time": "4:12:55", "remaining_time": "11:28:05", "throughput": 2126.25, "total_tokens": 32266656} {"current_steps": 2095, "total_steps": 7776, "loss": 0.5083, "learning_rate": 2.4940208450738146e-06, "epoch": 8.594871794871795, "percentage": 26.94, "elapsed_time": "4:13:44", "remaining_time": "11:28:04", "throughput": 2125.25, "total_tokens": 32356544} {"current_steps": 2100, "total_steps": 7776, "loss": 0.4839, "learning_rate": 2.49174958086899e-06, "epoch": 8.615384615384615, "percentage": 27.01, "elapsed_time": "4:14:23", "remaining_time": "11:27:35", "throughput": 2124.96, "total_tokens": 32434720} {"current_steps": 2105, "total_steps": 7776, "loss": 0.437, "learning_rate": 2.48947426970215e-06, "epoch": 8.635897435897435, "percentage": 27.07, "elapsed_time": "4:14:56", "remaining_time": "11:26:50", "throughput": 2125.13, "total_tokens": 32507712} {"current_steps": 2110, "total_steps": 7776, "loss": 0.435, "learning_rate": 2.487194920857995e-06, "epoch": 8.656410256410256, "percentage": 27.13, "elapsed_time": "4:15:27", "remaining_time": "11:25:59", "throughput": 2125.36, "total_tokens": 32577216} {"current_steps": 2115, "total_steps": 7776, "loss": 0.4768, "learning_rate": 2.484911543637702e-06, "epoch": 8.676923076923076, "percentage": 27.2, "elapsed_time": "4:15:58", "remaining_time": "11:25:09", "throughput": 2125.64, "total_tokens": 32647552} {"current_steps": 2120, "total_steps": 7776, "loss": 0.4578, "learning_rate": 2.4826241473588855e-06, "epoch": 8.697435897435897, "percentage": 27.26, "elapsed_time": "4:16:35", "remaining_time": "11:24:33", "throughput": 2125.79, "total_tokens": 32727520} {"current_steps": 2125, "total_steps": 7776, "loss": 0.5142, "learning_rate": 2.4803327413555623e-06, "epoch": 8.717948717948717, "percentage": 27.33, "elapsed_time": "4:17:12", "remaining_time": "11:24:00", "throughput": 2125.68, "total_tokens": 32805440} {"current_steps": 2130, "total_steps": 7776, "loss": 0.4013, "learning_rate": 2.4780373349781083e-06, "epoch": 8.73846153846154, "percentage": 27.39, "elapsed_time": "4:17:44", "remaining_time": "11:23:12", "throughput": 2126.16, "total_tokens": 32880480} {"current_steps": 2135, "total_steps": 7776, "loss": 0.4616, "learning_rate": 2.4757379375932265e-06, "epoch": 8.75897435897436, "percentage": 27.46, "elapsed_time": "4:18:14", "remaining_time": "11:22:18", "throughput": 2126.72, "total_tokens": 32951936} {"current_steps": 2140, "total_steps": 7776, "loss": 0.4791, "learning_rate": 2.473434558583903e-06, "epoch": 8.77948717948718, "percentage": 27.52, "elapsed_time": "4:18:51", "remaining_time": "11:21:44", "throughput": 2126.46, "total_tokens": 33027104} {"current_steps": 2145, "total_steps": 7776, "loss": 0.5163, "learning_rate": 2.4711272073493745e-06, "epoch": 8.8, "percentage": 27.58, "elapsed_time": "4:19:26", "remaining_time": "11:21:05", "throughput": 2127.06, "total_tokens": 33111040} {"current_steps": 2150, "total_steps": 7776, "loss": 0.4761, "learning_rate": 2.468815893305084e-06, "epoch": 8.820512820512821, "percentage": 27.65, "elapsed_time": "4:20:50", "remaining_time": "11:22:33", "throughput": 2121.47, "total_tokens": 33202304} {"current_steps": 2155, "total_steps": 7776, "loss": 0.4405, "learning_rate": 2.466500625882646e-06, "epoch": 8.841025641025642, "percentage": 27.71, "elapsed_time": "4:21:20", "remaining_time": "11:21:41", "throughput": 2122.41, "total_tokens": 33281376} {"current_steps": 2160, "total_steps": 7776, "loss": 0.4538, "learning_rate": 2.464181414529809e-06, "epoch": 8.861538461538462, "percentage": 27.78, "elapsed_time": "4:21:46", "remaining_time": "11:20:37", "throughput": 2123.45, "total_tokens": 33352640} {"current_steps": 2165, "total_steps": 7776, "loss": 0.4598, "learning_rate": 2.4618582687104132e-06, "epoch": 8.882051282051282, "percentage": 27.84, "elapsed_time": "4:22:11", "remaining_time": "11:19:32", "throughput": 2124.54, "total_tokens": 33423232} {"current_steps": 2170, "total_steps": 7776, "loss": 0.4556, "learning_rate": 2.4595311979043545e-06, "epoch": 8.902564102564103, "percentage": 27.91, "elapsed_time": "4:22:45", "remaining_time": "11:18:48", "throughput": 2125.12, "total_tokens": 33503744} {"current_steps": 2175, "total_steps": 7776, "loss": 0.4665, "learning_rate": 2.4572002116075454e-06, "epoch": 8.923076923076923, "percentage": 27.97, "elapsed_time": "4:23:09", "remaining_time": "11:17:40", "throughput": 2126.52, "total_tokens": 33576800} {"current_steps": 2180, "total_steps": 7776, "loss": 0.4683, "learning_rate": 2.454865319331876e-06, "epoch": 8.943589743589744, "percentage": 28.03, "elapsed_time": "4:23:39", "remaining_time": "11:16:47", "throughput": 2127.86, "total_tokens": 33661120} {"current_steps": 2185, "total_steps": 7776, "loss": 0.5183, "learning_rate": 2.4525265306051755e-06, "epoch": 8.964102564102564, "percentage": 28.1, "elapsed_time": "4:24:02", "remaining_time": "11:15:38", "throughput": 2129.26, "total_tokens": 33733568} {"current_steps": 2190, "total_steps": 7776, "loss": 0.4671, "learning_rate": 2.4501838549711723e-06, "epoch": 8.984615384615385, "percentage": 28.16, "elapsed_time": "4:24:23", "remaining_time": "11:14:22", "throughput": 2130.88, "total_tokens": 33802592} {"current_steps": 2195, "total_steps": 7776, "loss": 0.4858, "learning_rate": 2.447837301989457e-06, "epoch": 9.005128205128205, "percentage": 28.23, "elapsed_time": "4:24:50", "remaining_time": "11:13:23", "throughput": 2132.23, "total_tokens": 33882272} {"current_steps": 2200, "total_steps": 7776, "loss": 0.4574, "learning_rate": 2.4454868812354403e-06, "epoch": 9.025641025641026, "percentage": 28.29, "elapsed_time": "4:25:12", "remaining_time": "11:12:10", "throughput": 2133.81, "total_tokens": 33953920} {"current_steps": 2205, "total_steps": 7776, "loss": 0.4419, "learning_rate": 2.4431326023003188e-06, "epoch": 9.046153846153846, "percentage": 28.36, "elapsed_time": "4:25:33", "remaining_time": "11:10:56", "throughput": 2135.58, "total_tokens": 34027552} {"current_steps": 2210, "total_steps": 7776, "loss": 0.5126, "learning_rate": 2.44077447479103e-06, "epoch": 9.066666666666666, "percentage": 28.42, "elapsed_time": "4:25:59", "remaining_time": "11:09:55", "throughput": 2137.43, "total_tokens": 34112480} {"current_steps": 2215, "total_steps": 7776, "loss": 0.4517, "learning_rate": 2.4384125083302178e-06, "epoch": 9.087179487179487, "percentage": 28.49, "elapsed_time": "4:26:18", "remaining_time": "11:08:36", "throughput": 2139.3, "total_tokens": 34183840} {"current_steps": 2220, "total_steps": 7776, "loss": 0.5161, "learning_rate": 2.4360467125561907e-06, "epoch": 9.107692307692307, "percentage": 28.55, "elapsed_time": "4:26:40", "remaining_time": "11:07:24", "throughput": 2141.09, "total_tokens": 34258912} {"current_steps": 2225, "total_steps": 7776, "loss": 0.4486, "learning_rate": 2.433677097122883e-06, "epoch": 9.128205128205128, "percentage": 28.61, "elapsed_time": "4:26:57", "remaining_time": "11:06:00", "throughput": 2143.27, "total_tokens": 34329248} {"current_steps": 2230, "total_steps": 7776, "loss": 0.5191, "learning_rate": 2.4313036716998154e-06, "epoch": 9.148717948717948, "percentage": 28.68, "elapsed_time": "4:27:18", "remaining_time": "11:04:48", "throughput": 2145.5, "total_tokens": 34411232} {"current_steps": 2235, "total_steps": 7776, "loss": 0.5117, "learning_rate": 2.428926445972058e-06, "epoch": 9.169230769230769, "percentage": 28.74, "elapsed_time": "4:27:36", "remaining_time": "11:03:27", "throughput": 2147.77, "total_tokens": 34486144} {"current_steps": 2240, "total_steps": 7776, "loss": 0.4739, "learning_rate": 2.4265454296401857e-06, "epoch": 9.189743589743589, "percentage": 28.81, "elapsed_time": "4:28:02", "remaining_time": "11:02:26", "throughput": 2149.23, "total_tokens": 34564864} {"current_steps": 2245, "total_steps": 7776, "loss": 0.4468, "learning_rate": 2.4241606324202426e-06, "epoch": 9.21025641025641, "percentage": 28.87, "elapsed_time": "4:28:49", "remaining_time": "11:02:18", "throughput": 2147.65, "total_tokens": 34640704} {"current_steps": 2250, "total_steps": 7776, "loss": 0.457, "learning_rate": 2.4217720640437015e-06, "epoch": 9.23076923076923, "percentage": 28.94, "elapsed_time": "4:29:35", "remaining_time": "11:02:07", "throughput": 2146.15, "total_tokens": 34715744} {"current_steps": 2255, "total_steps": 7776, "loss": 0.4915, "learning_rate": 2.4193797342574235e-06, "epoch": 9.25128205128205, "percentage": 29.0, "elapsed_time": "4:30:41", "remaining_time": "11:02:44", "throughput": 2142.54, "total_tokens": 34798144} {"current_steps": 2260, "total_steps": 7776, "loss": 0.4417, "learning_rate": 2.4169836528236187e-06, "epoch": 9.271794871794873, "percentage": 29.06, "elapsed_time": "4:31:25", "remaining_time": "11:02:29", "throughput": 2141.33, "total_tokens": 34873440} {"current_steps": 2265, "total_steps": 7776, "loss": 0.4999, "learning_rate": 2.4145838295198066e-06, "epoch": 9.292307692307693, "percentage": 29.13, "elapsed_time": "4:32:21", "remaining_time": "11:02:40", "throughput": 2138.85, "total_tokens": 34951552} {"current_steps": 2270, "total_steps": 7776, "loss": 0.453, "learning_rate": 2.4121802741387743e-06, "epoch": 9.312820512820513, "percentage": 29.19, "elapsed_time": "4:33:00", "remaining_time": "11:02:11", "throughput": 2137.98, "total_tokens": 35021184} {"current_steps": 2275, "total_steps": 7776, "loss": 0.4473, "learning_rate": 2.4097729964885407e-06, "epoch": 9.333333333333334, "percentage": 29.26, "elapsed_time": "4:33:46", "remaining_time": "11:02:00", "throughput": 2136.63, "total_tokens": 35098080} {"current_steps": 2280, "total_steps": 7776, "loss": 0.4749, "learning_rate": 2.4073620063923123e-06, "epoch": 9.353846153846154, "percentage": 29.32, "elapsed_time": "4:34:25", "remaining_time": "11:01:30", "throughput": 2135.98, "total_tokens": 35170336} {"current_steps": 2285, "total_steps": 7776, "loss": 0.5229, "learning_rate": 2.404947313688445e-06, "epoch": 9.374358974358975, "percentage": 29.39, "elapsed_time": "4:35:20", "remaining_time": "11:01:40", "throughput": 2134.0, "total_tokens": 35255200} {"current_steps": 2290, "total_steps": 7776, "loss": 0.5158, "learning_rate": 2.4025289282304037e-06, "epoch": 9.394871794871795, "percentage": 29.45, "elapsed_time": "4:36:01", "remaining_time": "11:01:14", "throughput": 2133.21, "total_tokens": 35328928} {"current_steps": 2295, "total_steps": 7776, "loss": 0.4548, "learning_rate": 2.4001068598867216e-06, "epoch": 9.415384615384616, "percentage": 29.51, "elapsed_time": "4:36:41", "remaining_time": "11:00:49", "throughput": 2132.46, "total_tokens": 35402976} {"current_steps": 2300, "total_steps": 7776, "loss": 0.4313, "learning_rate": 2.397681118540961e-06, "epoch": 9.435897435897436, "percentage": 29.58, "elapsed_time": "4:37:24", "remaining_time": "11:00:27", "throughput": 2131.74, "total_tokens": 35481344} {"current_steps": 2305, "total_steps": 7776, "loss": 0.4664, "learning_rate": 2.3952517140916724e-06, "epoch": 9.456410256410257, "percentage": 29.64, "elapsed_time": "4:38:01", "remaining_time": "10:59:53", "throughput": 2131.35, "total_tokens": 35553664} {"current_steps": 2310, "total_steps": 7776, "loss": 0.4948, "learning_rate": 2.392818656452354e-06, "epoch": 9.476923076923077, "percentage": 29.71, "elapsed_time": "4:38:40", "remaining_time": "10:59:25", "throughput": 2130.91, "total_tokens": 35630592} {"current_steps": 2315, "total_steps": 7776, "loss": 0.5035, "learning_rate": 2.39038195555141e-06, "epoch": 9.497435897435897, "percentage": 29.77, "elapsed_time": "4:39:30", "remaining_time": "10:59:21", "throughput": 2129.48, "total_tokens": 35712864} {"current_steps": 2320, "total_steps": 7776, "loss": 0.4964, "learning_rate": 2.387941621332114e-06, "epoch": 9.517948717948718, "percentage": 29.84, "elapsed_time": "4:40:09", "remaining_time": "10:58:51", "throughput": 2129.2, "total_tokens": 35790784} {"current_steps": 2325, "total_steps": 7776, "loss": 0.4684, "learning_rate": 2.3854976637525637e-06, "epoch": 9.538461538461538, "percentage": 29.9, "elapsed_time": "4:40:57", "remaining_time": "10:58:43", "throughput": 2127.73, "total_tokens": 35868960} {"current_steps": 2330, "total_steps": 7776, "loss": 0.5117, "learning_rate": 2.3830500927856433e-06, "epoch": 9.558974358974359, "percentage": 29.96, "elapsed_time": "4:41:45", "remaining_time": "10:58:33", "throughput": 2126.97, "total_tokens": 35956832} {"current_steps": 2335, "total_steps": 7776, "loss": 0.4574, "learning_rate": 2.3805989184189813e-06, "epoch": 9.57948717948718, "percentage": 30.03, "elapsed_time": "4:42:16", "remaining_time": "10:57:46", "throughput": 2127.16, "total_tokens": 36027520} {"current_steps": 2340, "total_steps": 7776, "loss": 0.5291, "learning_rate": 2.378144150654911e-06, "epoch": 9.6, "percentage": 30.09, "elapsed_time": "4:42:58", "remaining_time": "10:57:22", "throughput": 2126.78, "total_tokens": 36109248} {"current_steps": 2345, "total_steps": 7776, "loss": 0.4528, "learning_rate": 2.3756857995104286e-06, "epoch": 9.62051282051282, "percentage": 30.16, "elapsed_time": "4:43:28", "remaining_time": "10:56:32", "throughput": 2127.09, "total_tokens": 36179584} {"current_steps": 2350, "total_steps": 7776, "loss": 0.4976, "learning_rate": 2.3732238750171527e-06, "epoch": 9.64102564102564, "percentage": 30.22, "elapsed_time": "4:44:02", "remaining_time": "10:55:49", "throughput": 2127.5, "total_tokens": 36257216} {"current_steps": 2355, "total_steps": 7776, "loss": 0.4576, "learning_rate": 2.3707583872212837e-06, "epoch": 9.661538461538461, "percentage": 30.29, "elapsed_time": "4:44:30", "remaining_time": "10:54:54", "throughput": 2128.01, "total_tokens": 36326272} {"current_steps": 2360, "total_steps": 7776, "loss": 0.5315, "learning_rate": 2.3682893461835626e-06, "epoch": 9.682051282051281, "percentage": 30.35, "elapsed_time": "4:45:20", "remaining_time": "10:54:50", "throughput": 2126.41, "total_tokens": 36405504} {"current_steps": 2365, "total_steps": 7776, "loss": 0.5407, "learning_rate": 2.3658167619792294e-06, "epoch": 9.702564102564102, "percentage": 30.41, "elapsed_time": "4:45:52", "remaining_time": "10:54:04", "throughput": 2126.86, "total_tokens": 36481536} {"current_steps": 2370, "total_steps": 7776, "loss": 0.4525, "learning_rate": 2.363340644697983e-06, "epoch": 9.723076923076922, "percentage": 30.48, "elapsed_time": "4:46:29", "remaining_time": "10:53:30", "throughput": 2127.02, "total_tokens": 36563200} {"current_steps": 2375, "total_steps": 7776, "loss": 0.5628, "learning_rate": 2.360861004443939e-06, "epoch": 9.743589743589745, "percentage": 30.54, "elapsed_time": "4:47:13", "remaining_time": "10:53:11", "throughput": 2127.29, "total_tokens": 36661120} {"current_steps": 2380, "total_steps": 7776, "loss": 0.4633, "learning_rate": 2.358377851335589e-06, "epoch": 9.764102564102565, "percentage": 30.61, "elapsed_time": "4:47:44", "remaining_time": "10:52:22", "throughput": 2128.03, "total_tokens": 36738880} {"current_steps": 2385, "total_steps": 7776, "loss": 0.4438, "learning_rate": 2.3558911955057592e-06, "epoch": 9.784615384615385, "percentage": 30.67, "elapsed_time": "4:48:14", "remaining_time": "10:51:31", "throughput": 2129.03, "total_tokens": 36820128} {"current_steps": 2390, "total_steps": 7776, "loss": 0.4609, "learning_rate": 2.35340104710157e-06, "epoch": 9.805128205128206, "percentage": 30.74, "elapsed_time": "4:48:43", "remaining_time": "10:50:40", "throughput": 2130.0, "total_tokens": 36900128} {"current_steps": 2395, "total_steps": 7776, "loss": 0.4843, "learning_rate": 2.350907416284392e-06, "epoch": 9.825641025641026, "percentage": 30.8, "elapsed_time": "4:49:07", "remaining_time": "10:49:35", "throughput": 2131.09, "total_tokens": 36969024} {"current_steps": 2400, "total_steps": 7776, "loss": 0.4607, "learning_rate": 2.348410313229808e-06, "epoch": 9.846153846153847, "percentage": 30.86, "elapsed_time": "4:50:03", "remaining_time": "10:49:43", "throughput": 2129.12, "total_tokens": 37053440} {"current_steps": 2405, "total_steps": 7776, "loss": 0.5134, "learning_rate": 2.3459097481275687e-06, "epoch": 9.866666666666667, "percentage": 30.93, "elapsed_time": "4:50:30", "remaining_time": "10:48:46", "throughput": 2130.34, "total_tokens": 37132128} {"current_steps": 2410, "total_steps": 7776, "loss": 0.478, "learning_rate": 2.343405731181552e-06, "epoch": 9.887179487179488, "percentage": 30.99, "elapsed_time": "4:50:56", "remaining_time": "10:47:47", "throughput": 2131.57, "total_tokens": 37209664} {"current_steps": 2415, "total_steps": 7776, "loss": 0.4864, "learning_rate": 2.3408982726097227e-06, "epoch": 9.907692307692308, "percentage": 31.06, "elapsed_time": "4:51:19", "remaining_time": "10:46:43", "throughput": 2132.96, "total_tokens": 37283936} {"current_steps": 2420, "total_steps": 7776, "loss": 0.4876, "learning_rate": 2.3383873826440878e-06, "epoch": 9.928205128205128, "percentage": 31.12, "elapsed_time": "4:51:43", "remaining_time": "10:45:38", "throughput": 2134.46, "total_tokens": 37359552} {"current_steps": 2425, "total_steps": 7776, "loss": 0.5265, "learning_rate": 2.3358730715306574e-06, "epoch": 9.948717948717949, "percentage": 31.19, "elapsed_time": "4:52:05", "remaining_time": "10:44:32", "throughput": 2135.96, "total_tokens": 37434112} {"current_steps": 2430, "total_steps": 7776, "loss": 0.4759, "learning_rate": 2.3333553495294033e-06, "epoch": 9.96923076923077, "percentage": 31.25, "elapsed_time": "4:52:28", "remaining_time": "10:43:27", "throughput": 2137.57, "total_tokens": 37511456} {"current_steps": 2435, "total_steps": 7776, "loss": 0.4336, "learning_rate": 2.330834226914214e-06, "epoch": 9.98974358974359, "percentage": 31.31, "elapsed_time": "4:52:47", "remaining_time": "10:42:13", "throughput": 2139.37, "total_tokens": 37584320} {"current_steps": 2440, "total_steps": 7776, "loss": 0.5338, "learning_rate": 2.3283097139728557e-06, "epoch": 10.01025641025641, "percentage": 31.38, "elapsed_time": "4:53:29", "remaining_time": "10:41:49", "throughput": 2139.35, "total_tokens": 37672864} {"current_steps": 2445, "total_steps": 7776, "loss": 0.4542, "learning_rate": 2.3257818210069277e-06, "epoch": 10.03076923076923, "percentage": 31.44, "elapsed_time": "4:53:47", "remaining_time": "10:40:35", "throughput": 2141.11, "total_tokens": 37743488} {"current_steps": 2450, "total_steps": 7776, "loss": 0.5379, "learning_rate": 2.3232505583318246e-06, "epoch": 10.051282051282051, "percentage": 31.51, "elapsed_time": "4:54:32", "remaining_time": "10:40:18", "throughput": 2140.73, "total_tokens": 37832256} {"current_steps": 2455, "total_steps": 7776, "loss": 0.4418, "learning_rate": 2.320715936276689e-06, "epoch": 10.071794871794872, "percentage": 31.57, "elapsed_time": "4:54:50", "remaining_time": "10:39:02", "throughput": 2142.9, "total_tokens": 37908832} {"current_steps": 2460, "total_steps": 7776, "loss": 0.5294, "learning_rate": 2.3181779651843738e-06, "epoch": 10.092307692307692, "percentage": 31.64, "elapsed_time": "4:55:10", "remaining_time": "10:37:52", "throughput": 2144.99, "total_tokens": 37989088} {"current_steps": 2465, "total_steps": 7776, "loss": 0.4438, "learning_rate": 2.3156366554113967e-06, "epoch": 10.112820512820512, "percentage": 31.7, "elapsed_time": "4:55:39", "remaining_time": "10:37:01", "throughput": 2145.52, "total_tokens": 38061024} {"current_steps": 2470, "total_steps": 7776, "loss": 0.4544, "learning_rate": 2.3130920173278997e-06, "epoch": 10.133333333333333, "percentage": 31.76, "elapsed_time": "4:56:26", "remaining_time": "10:36:48", "throughput": 2144.13, "total_tokens": 38136480} {"current_steps": 2475, "total_steps": 7776, "loss": 0.4918, "learning_rate": 2.310544061317607e-06, "epoch": 10.153846153846153, "percentage": 31.83, "elapsed_time": "4:57:14", "remaining_time": "10:36:37", "throughput": 2142.71, "total_tokens": 38213280} {"current_steps": 2480, "total_steps": 7776, "loss": 0.4821, "learning_rate": 2.307992797777782e-06, "epoch": 10.174358974358974, "percentage": 31.89, "elapsed_time": "4:57:55", "remaining_time": "10:36:12", "throughput": 2141.67, "total_tokens": 38283296} {"current_steps": 2485, "total_steps": 7776, "loss": 0.464, "learning_rate": 2.3054382371191836e-06, "epoch": 10.194871794871794, "percentage": 31.96, "elapsed_time": "4:58:41", "remaining_time": "10:35:58", "throughput": 2140.43, "total_tokens": 38360320} {"current_steps": 2490, "total_steps": 7776, "loss": 0.4829, "learning_rate": 2.3028803897660256e-06, "epoch": 10.215384615384615, "percentage": 32.02, "elapsed_time": "4:59:36", "remaining_time": "10:36:02", "throughput": 2138.32, "total_tokens": 38440000} {"current_steps": 2495, "total_steps": 7776, "loss": 0.4495, "learning_rate": 2.3003192661559346e-06, "epoch": 10.235897435897435, "percentage": 32.09, "elapsed_time": "5:00:16", "remaining_time": "10:35:35", "throughput": 2137.44, "total_tokens": 38510208} {"current_steps": 2500, "total_steps": 7776, "loss": 0.5503, "learning_rate": 2.297754876739905e-06, "epoch": 10.256410256410255, "percentage": 32.15, "elapsed_time": "5:01:23", "remaining_time": "10:36:04", "throughput": 2134.5, "total_tokens": 38600256} {"current_steps": 2505, "total_steps": 7776, "loss": 0.5341, "learning_rate": 2.2951872319822597e-06, "epoch": 10.276923076923078, "percentage": 32.21, "elapsed_time": "5:02:34", "remaining_time": "10:36:39", "throughput": 2130.61, "total_tokens": 38679168} {"current_steps": 2510, "total_steps": 7776, "loss": 0.4903, "learning_rate": 2.2926163423606027e-06, "epoch": 10.297435897435898, "percentage": 32.28, "elapsed_time": "5:03:13", "remaining_time": "10:36:09", "throughput": 2130.05, "total_tokens": 38752064} {"current_steps": 2515, "total_steps": 7776, "loss": 0.4543, "learning_rate": 2.2900422183657816e-06, "epoch": 10.317948717948719, "percentage": 32.34, "elapsed_time": "5:03:55", "remaining_time": "10:35:46", "throughput": 2129.3, "total_tokens": 38829504} {"current_steps": 2520, "total_steps": 7776, "loss": 0.5428, "learning_rate": 2.2874648705018403e-06, "epoch": 10.338461538461539, "percentage": 32.41, "elapsed_time": "5:04:46", "remaining_time": "10:35:40", "throughput": 2128.14, "total_tokens": 38915904} {"current_steps": 2525, "total_steps": 7776, "loss": 0.4588, "learning_rate": 2.28488430928598e-06, "epoch": 10.35897435897436, "percentage": 32.47, "elapsed_time": "5:05:30", "remaining_time": "10:35:19", "throughput": 2127.5, "total_tokens": 38997760} {"current_steps": 2530, "total_steps": 7776, "loss": 0.4441, "learning_rate": 2.282300545248512e-06, "epoch": 10.37948717948718, "percentage": 32.54, "elapsed_time": "5:06:05", "remaining_time": "10:34:40", "throughput": 2127.29, "total_tokens": 39068000} {"current_steps": 2535, "total_steps": 7776, "loss": 0.4441, "learning_rate": 2.27971358893282e-06, "epoch": 10.4, "percentage": 32.6, "elapsed_time": "5:06:38", "remaining_time": "10:33:57", "throughput": 2127.18, "total_tokens": 39136480} {"current_steps": 2540, "total_steps": 7776, "loss": 0.442, "learning_rate": 2.2771234508953116e-06, "epoch": 10.42051282051282, "percentage": 32.66, "elapsed_time": "5:07:32", "remaining_time": "10:33:57", "throughput": 2125.48, "total_tokens": 39219488} {"current_steps": 2545, "total_steps": 7776, "loss": 0.5199, "learning_rate": 2.27453014170538e-06, "epoch": 10.441025641025641, "percentage": 32.73, "elapsed_time": "5:08:11", "remaining_time": "10:33:27", "throughput": 2125.09, "total_tokens": 39295712} {"current_steps": 2550, "total_steps": 7776, "loss": 0.5147, "learning_rate": 2.271933671945357e-06, "epoch": 10.461538461538462, "percentage": 32.79, "elapsed_time": "5:08:53", "remaining_time": "10:33:03", "throughput": 2124.26, "total_tokens": 39371008} {"current_steps": 2555, "total_steps": 7776, "loss": 0.5296, "learning_rate": 2.2693340522104727e-06, "epoch": 10.482051282051282, "percentage": 32.86, "elapsed_time": "5:09:32", "remaining_time": "10:32:31", "throughput": 2124.19, "total_tokens": 39450944} {"current_steps": 2560, "total_steps": 7776, "loss": 0.4707, "learning_rate": 2.2667312931088096e-06, "epoch": 10.502564102564103, "percentage": 32.92, "elapsed_time": "5:10:08", "remaining_time": "10:31:54", "throughput": 2124.34, "total_tokens": 39530912} {"current_steps": 2565, "total_steps": 7776, "loss": 0.4726, "learning_rate": 2.264125405261263e-06, "epoch": 10.523076923076923, "percentage": 32.99, "elapsed_time": "5:10:38", "remaining_time": "10:31:06", "throughput": 2124.71, "total_tokens": 39602400} {"current_steps": 2570, "total_steps": 7776, "loss": 0.4344, "learning_rate": 2.261516399301493e-06, "epoch": 10.543589743589743, "percentage": 33.05, "elapsed_time": "5:11:12", "remaining_time": "10:30:24", "throughput": 2125.02, "total_tokens": 39679232} {"current_steps": 2575, "total_steps": 7776, "loss": 0.4427, "learning_rate": 2.2589042858758853e-06, "epoch": 10.564102564102564, "percentage": 33.11, "elapsed_time": "5:11:53", "remaining_time": "10:29:57", "throughput": 2124.47, "total_tokens": 39755904} {"current_steps": 2580, "total_steps": 7776, "loss": 0.4975, "learning_rate": 2.256289075643506e-06, "epoch": 10.584615384615384, "percentage": 33.18, "elapsed_time": "5:12:22", "remaining_time": "10:29:06", "throughput": 2124.95, "total_tokens": 39826368} {"current_steps": 2585, "total_steps": 7776, "loss": 0.5045, "learning_rate": 2.2536707792760566e-06, "epoch": 10.605128205128205, "percentage": 33.24, "elapsed_time": "5:12:56", "remaining_time": "10:28:25", "throughput": 2125.34, "total_tokens": 39906464} {"current_steps": 2590, "total_steps": 7776, "loss": 0.4833, "learning_rate": 2.251049407457833e-06, "epoch": 10.625641025641025, "percentage": 33.31, "elapsed_time": "5:13:23", "remaining_time": "10:27:31", "throughput": 2125.95, "total_tokens": 39975712} {"current_steps": 2595, "total_steps": 7776, "loss": 0.4984, "learning_rate": 2.2484249708856823e-06, "epoch": 10.646153846153846, "percentage": 33.37, "elapsed_time": "5:14:04", "remaining_time": "10:27:04", "throughput": 2125.77, "total_tokens": 40060032} {"current_steps": 2600, "total_steps": 7776, "loss": 0.4186, "learning_rate": 2.2457974802689545e-06, "epoch": 10.666666666666666, "percentage": 33.44, "elapsed_time": "5:14:32", "remaining_time": "10:26:11", "throughput": 2126.4, "total_tokens": 40131520} {"current_steps": 2605, "total_steps": 7776, "loss": 0.4441, "learning_rate": 2.2431669463294646e-06, "epoch": 10.687179487179487, "percentage": 33.5, "elapsed_time": "5:15:00", "remaining_time": "10:25:18", "throughput": 2127.2, "total_tokens": 40205760} {"current_steps": 2610, "total_steps": 7776, "loss": 0.5337, "learning_rate": 2.2405333798014453e-06, "epoch": 10.707692307692307, "percentage": 33.56, "elapsed_time": "5:15:35", "remaining_time": "10:24:39", "throughput": 2127.66, "total_tokens": 40288992} {"current_steps": 2615, "total_steps": 7776, "loss": 0.4703, "learning_rate": 2.237896791431505e-06, "epoch": 10.728205128205127, "percentage": 33.63, "elapsed_time": "5:16:05", "remaining_time": "10:23:51", "throughput": 2128.52, "total_tokens": 40369440} {"current_steps": 2620, "total_steps": 7776, "loss": 0.5217, "learning_rate": 2.2352571919785812e-06, "epoch": 10.74871794871795, "percentage": 33.69, "elapsed_time": "5:16:42", "remaining_time": "10:23:14", "throughput": 2128.84, "total_tokens": 40452288} {"current_steps": 2625, "total_steps": 7776, "loss": 0.4475, "learning_rate": 2.2326145922139004e-06, "epoch": 10.76923076923077, "percentage": 33.76, "elapsed_time": "5:17:06", "remaining_time": "10:22:14", "throughput": 2129.9, "total_tokens": 40523808} {"current_steps": 2630, "total_steps": 7776, "loss": 0.4734, "learning_rate": 2.2299690029209313e-06, "epoch": 10.78974358974359, "percentage": 33.82, "elapsed_time": "5:17:34", "remaining_time": "10:21:23", "throughput": 2131.03, "total_tokens": 40606496} {"current_steps": 2635, "total_steps": 7776, "loss": 0.4686, "learning_rate": 2.227320434895343e-06, "epoch": 10.810256410256411, "percentage": 33.89, "elapsed_time": "5:18:01", "remaining_time": "10:20:27", "throughput": 2132.2, "total_tokens": 40684672} {"current_steps": 2640, "total_steps": 7776, "loss": 0.5027, "learning_rate": 2.2246688989449577e-06, "epoch": 10.830769230769231, "percentage": 33.95, "elapsed_time": "5:18:26", "remaining_time": "10:19:30", "throughput": 2133.44, "total_tokens": 40762752} {"current_steps": 2645, "total_steps": 7776, "loss": 0.4582, "learning_rate": 2.2220144058897104e-06, "epoch": 10.851282051282052, "percentage": 34.01, "elapsed_time": "5:18:56", "remaining_time": "10:18:41", "throughput": 2134.81, "total_tokens": 40851776} {"current_steps": 2650, "total_steps": 7776, "loss": 0.4516, "learning_rate": 2.2193569665616017e-06, "epoch": 10.871794871794872, "percentage": 34.08, "elapsed_time": "5:19:16", "remaining_time": "10:17:35", "throughput": 2136.21, "total_tokens": 40922304} {"current_steps": 2655, "total_steps": 7776, "loss": 0.4346, "learning_rate": 2.2166965918046554e-06, "epoch": 10.892307692307693, "percentage": 34.14, "elapsed_time": "5:19:38", "remaining_time": "10:16:32", "throughput": 2137.69, "total_tokens": 40998784} {"current_steps": 2660, "total_steps": 7776, "loss": 0.5093, "learning_rate": 2.214033292474874e-06, "epoch": 10.912820512820513, "percentage": 34.21, "elapsed_time": "5:20:04", "remaining_time": "10:15:36", "throughput": 2138.87, "total_tokens": 41075872} {"current_steps": 2665, "total_steps": 7776, "loss": 0.4853, "learning_rate": 2.2113670794401935e-06, "epoch": 10.933333333333334, "percentage": 34.27, "elapsed_time": "5:20:23", "remaining_time": "10:14:27", "throughput": 2140.6, "total_tokens": 41149728} {"current_steps": 2670, "total_steps": 7776, "loss": 0.5042, "learning_rate": 2.20869796358044e-06, "epoch": 10.953846153846154, "percentage": 34.34, "elapsed_time": "5:20:41", "remaining_time": "10:13:16", "throughput": 2142.27, "total_tokens": 41220160} {"current_steps": 2675, "total_steps": 7776, "loss": 0.4601, "learning_rate": 2.2060259557872845e-06, "epoch": 10.974358974358974, "percentage": 34.4, "elapsed_time": "5:20:57", "remaining_time": "10:12:03", "throughput": 2143.95, "total_tokens": 41287712} {"current_steps": 2680, "total_steps": 7776, "loss": 0.4138, "learning_rate": 2.2033510669641997e-06, "epoch": 10.994871794871795, "percentage": 34.47, "elapsed_time": "5:21:15", "remaining_time": "10:10:52", "throughput": 2145.89, "total_tokens": 41363264} {"current_steps": 2685, "total_steps": 7776, "loss": 0.4724, "learning_rate": 2.2006733080264144e-06, "epoch": 11.015384615384615, "percentage": 34.53, "elapsed_time": "5:21:32", "remaining_time": "10:09:40", "throughput": 2147.8, "total_tokens": 41437152} {"current_steps": 2690, "total_steps": 7776, "loss": 0.4932, "learning_rate": 2.197992689900869e-06, "epoch": 11.035897435897436, "percentage": 34.59, "elapsed_time": "5:22:26", "remaining_time": "10:09:38", "throughput": 2145.92, "total_tokens": 41515520} {"current_steps": 2695, "total_steps": 7776, "loss": 0.4299, "learning_rate": 2.195309223526171e-06, "epoch": 11.056410256410256, "percentage": 34.66, "elapsed_time": "5:23:09", "remaining_time": "10:09:16", "throughput": 2144.79, "total_tokens": 41587200} {"current_steps": 2700, "total_steps": 7776, "loss": 0.4774, "learning_rate": 2.192622919852551e-06, "epoch": 11.076923076923077, "percentage": 34.72, "elapsed_time": "5:23:55", "remaining_time": "10:08:59", "throughput": 2143.62, "total_tokens": 41663008} {"current_steps": 2705, "total_steps": 7776, "loss": 0.5241, "learning_rate": 2.1899337898418174e-06, "epoch": 11.097435897435897, "percentage": 34.79, "elapsed_time": "5:24:52", "remaining_time": "10:09:02", "throughput": 2141.5, "total_tokens": 41743264} {"current_steps": 2710, "total_steps": 7776, "loss": 0.498, "learning_rate": 2.187241844467313e-06, "epoch": 11.117948717948718, "percentage": 34.85, "elapsed_time": "5:25:54", "remaining_time": "10:09:15", "throughput": 2138.76, "total_tokens": 41823264} {"current_steps": 2715, "total_steps": 7776, "loss": 0.5311, "learning_rate": 2.1845470947138658e-06, "epoch": 11.138461538461538, "percentage": 34.92, "elapsed_time": "5:27:30", "remaining_time": "10:10:29", "throughput": 2133.04, "total_tokens": 41914560} {"current_steps": 2720, "total_steps": 7776, "loss": 0.4464, "learning_rate": 2.181849551577751e-06, "epoch": 11.158974358974358, "percentage": 34.98, "elapsed_time": "5:28:12", "remaining_time": "10:10:04", "throughput": 2132.22, "total_tokens": 41988288} {"current_steps": 2725, "total_steps": 7776, "loss": 0.4905, "learning_rate": 2.179149226066641e-06, "epoch": 11.179487179487179, "percentage": 35.04, "elapsed_time": "5:29:01", "remaining_time": "10:09:51", "throughput": 2131.02, "total_tokens": 42068416} {"current_steps": 2730, "total_steps": 7776, "loss": 0.4629, "learning_rate": 2.1764461291995618e-06, "epoch": 11.2, "percentage": 35.11, "elapsed_time": "5:29:40", "remaining_time": "10:09:20", "throughput": 2130.41, "total_tokens": 42139744} {"current_steps": 2735, "total_steps": 7776, "loss": 0.5278, "learning_rate": 2.173740272006849e-06, "epoch": 11.22051282051282, "percentage": 35.17, "elapsed_time": "5:30:31", "remaining_time": "10:09:12", "throughput": 2129.36, "total_tokens": 42228672} {"current_steps": 2740, "total_steps": 7776, "loss": 0.4513, "learning_rate": 2.1710316655301016e-06, "epoch": 11.24102564102564, "percentage": 35.24, "elapsed_time": "5:31:14", "remaining_time": "10:08:48", "throughput": 2128.67, "total_tokens": 42306528} {"current_steps": 2745, "total_steps": 7776, "loss": 0.4917, "learning_rate": 2.1683203208221375e-06, "epoch": 11.261538461538462, "percentage": 35.3, "elapsed_time": "5:32:34", "remaining_time": "10:09:31", "throughput": 2124.31, "total_tokens": 42389024} {"current_steps": 2750, "total_steps": 7776, "loss": 0.4159, "learning_rate": 2.165606248946948e-06, "epoch": 11.282051282051283, "percentage": 35.37, "elapsed_time": "5:33:41", "remaining_time": "10:09:51", "throughput": 2121.4, "total_tokens": 42473088} {"current_steps": 2755, "total_steps": 7776, "loss": 0.4917, "learning_rate": 2.1628894609796533e-06, "epoch": 11.302564102564103, "percentage": 35.43, "elapsed_time": "5:34:22", "remaining_time": "10:09:23", "throughput": 2120.97, "total_tokens": 42551360} {"current_steps": 2760, "total_steps": 7776, "loss": 0.5037, "learning_rate": 2.1601699680064573e-06, "epoch": 11.323076923076924, "percentage": 35.49, "elapsed_time": "5:35:03", "remaining_time": "10:08:56", "throughput": 2120.33, "total_tokens": 42626688} {"current_steps": 2765, "total_steps": 7776, "loss": 0.4756, "learning_rate": 2.1574477811246014e-06, "epoch": 11.343589743589744, "percentage": 35.56, "elapsed_time": "5:35:53", "remaining_time": "10:08:44", "throughput": 2118.99, "total_tokens": 42705056} {"current_steps": 2770, "total_steps": 7776, "loss": 0.4985, "learning_rate": 2.1547229114423207e-06, "epoch": 11.364102564102565, "percentage": 35.62, "elapsed_time": "5:36:27", "remaining_time": "10:08:02", "throughput": 2119.03, "total_tokens": 42777632} {"current_steps": 2775, "total_steps": 7776, "loss": 0.4561, "learning_rate": 2.1519953700787963e-06, "epoch": 11.384615384615385, "percentage": 35.69, "elapsed_time": "5:36:58", "remaining_time": "10:07:16", "throughput": 2119.16, "total_tokens": 42845888} {"current_steps": 2780, "total_steps": 7776, "loss": 0.5091, "learning_rate": 2.149265168164113e-06, "epoch": 11.405128205128205, "percentage": 35.75, "elapsed_time": "5:37:34", "remaining_time": "10:06:40", "throughput": 2119.15, "total_tokens": 42922976} {"current_steps": 2785, "total_steps": 7776, "loss": 0.4711, "learning_rate": 2.146532316839211e-06, "epoch": 11.425641025641026, "percentage": 35.82, "elapsed_time": "5:38:07", "remaining_time": "10:05:56", "throughput": 2119.38, "total_tokens": 42996000} {"current_steps": 2790, "total_steps": 7776, "loss": 0.457, "learning_rate": 2.1437968272558435e-06, "epoch": 11.446153846153846, "percentage": 35.88, "elapsed_time": "5:38:43", "remaining_time": "10:05:19", "throughput": 2119.47, "total_tokens": 43074688} {"current_steps": 2795, "total_steps": 7776, "loss": 0.541, "learning_rate": 2.1410587105765275e-06, "epoch": 11.466666666666667, "percentage": 35.94, "elapsed_time": "5:39:21", "remaining_time": "10:04:46", "throughput": 2119.55, "total_tokens": 43157280} {"current_steps": 2800, "total_steps": 7776, "loss": 0.4279, "learning_rate": 2.138317977974501e-06, "epoch": 11.487179487179487, "percentage": 36.01, "elapsed_time": "5:39:55", "remaining_time": "10:04:06", "throughput": 2119.76, "total_tokens": 43234016} {"current_steps": 2805, "total_steps": 7776, "loss": 0.5213, "learning_rate": 2.135574640633678e-06, "epoch": 11.507692307692308, "percentage": 36.07, "elapsed_time": "5:40:38", "remaining_time": "10:03:40", "throughput": 2119.12, "total_tokens": 43310816} {"current_steps": 2810, "total_steps": 7776, "loss": 0.4444, "learning_rate": 2.132828709748598e-06, "epoch": 11.528205128205128, "percentage": 36.14, "elapsed_time": "5:41:08", "remaining_time": "10:02:52", "throughput": 2119.51, "total_tokens": 43382976} {"current_steps": 2815, "total_steps": 7776, "loss": 0.4768, "learning_rate": 2.130080196524388e-06, "epoch": 11.548717948717949, "percentage": 36.2, "elapsed_time": "5:41:46", "remaining_time": "10:02:19", "throughput": 2119.49, "total_tokens": 43462944} {"current_steps": 2820, "total_steps": 7776, "loss": 0.4376, "learning_rate": 2.1273291121767094e-06, "epoch": 11.569230769230769, "percentage": 36.27, "elapsed_time": "5:42:13", "remaining_time": "10:01:26", "throughput": 2120.22, "total_tokens": 43535232} {"current_steps": 2825, "total_steps": 7776, "loss": 0.4342, "learning_rate": 2.124575467931717e-06, "epoch": 11.58974358974359, "percentage": 36.33, "elapsed_time": "5:43:11", "remaining_time": "10:01:27", "throughput": 2118.28, "total_tokens": 43618528} {"current_steps": 2830, "total_steps": 7776, "loss": 0.4596, "learning_rate": 2.1218192750260114e-06, "epoch": 11.61025641025641, "percentage": 36.39, "elapsed_time": "5:43:39", "remaining_time": "10:00:36", "throughput": 2118.99, "total_tokens": 43691904} {"current_steps": 2835, "total_steps": 7776, "loss": 0.4811, "learning_rate": 2.119060544706592e-06, "epoch": 11.63076923076923, "percentage": 36.46, "elapsed_time": "5:44:03", "remaining_time": "9:59:39", "throughput": 2119.77, "total_tokens": 43760480} {"current_steps": 2840, "total_steps": 7776, "loss": 0.4864, "learning_rate": 2.1162992882308147e-06, "epoch": 11.65128205128205, "percentage": 36.52, "elapsed_time": "5:44:27", "remaining_time": "9:58:40", "throughput": 2120.74, "total_tokens": 43829984} {"current_steps": 2845, "total_steps": 7776, "loss": 0.4678, "learning_rate": 2.1135355168663417e-06, "epoch": 11.671794871794871, "percentage": 36.59, "elapsed_time": "5:44:58", "remaining_time": "9:57:54", "throughput": 2121.29, "total_tokens": 43906816} {"current_steps": 2850, "total_steps": 7776, "loss": 0.5001, "learning_rate": 2.1107692418910985e-06, "epoch": 11.692307692307692, "percentage": 36.65, "elapsed_time": "5:45:25", "remaining_time": "9:57:02", "throughput": 2122.24, "total_tokens": 43984960} {"current_steps": 2855, "total_steps": 7776, "loss": 0.4662, "learning_rate": 2.1080004745932274e-06, "epoch": 11.712820512820512, "percentage": 36.72, "elapsed_time": "5:45:50", "remaining_time": "9:56:07", "throughput": 2123.36, "total_tokens": 44061440} {"current_steps": 2860, "total_steps": 7776, "loss": 0.526, "learning_rate": 2.1052292262710392e-06, "epoch": 11.733333333333333, "percentage": 36.78, "elapsed_time": "5:46:20", "remaining_time": "9:55:18", "throughput": 2124.48, "total_tokens": 44147008} {"current_steps": 2865, "total_steps": 7776, "loss": 0.4821, "learning_rate": 2.102455508232971e-06, "epoch": 11.753846153846155, "percentage": 36.84, "elapsed_time": "5:46:44", "remaining_time": "9:54:22", "throughput": 2125.68, "total_tokens": 44224224} {"current_steps": 2870, "total_steps": 7776, "loss": 0.4923, "learning_rate": 2.099679331797536e-06, "epoch": 11.774358974358975, "percentage": 36.91, "elapsed_time": "5:47:12", "remaining_time": "9:53:30", "throughput": 2126.66, "total_tokens": 44302816} {"current_steps": 2875, "total_steps": 7776, "loss": 0.521, "learning_rate": 2.0969007082932803e-06, "epoch": 11.794871794871796, "percentage": 36.97, "elapsed_time": "5:47:32", "remaining_time": "9:52:27", "throughput": 2128.08, "total_tokens": 44376160} {"current_steps": 2880, "total_steps": 7776, "loss": 0.4932, "learning_rate": 2.0941196490587354e-06, "epoch": 11.815384615384616, "percentage": 37.04, "elapsed_time": "5:47:58", "remaining_time": "9:51:34", "throughput": 2129.38, "total_tokens": 44459200} {"current_steps": 2885, "total_steps": 7776, "loss": 0.4866, "learning_rate": 2.0913361654423723e-06, "epoch": 11.835897435897436, "percentage": 37.1, "elapsed_time": "5:48:21", "remaining_time": "9:50:34", "throughput": 2130.78, "total_tokens": 44536128} {"current_steps": 2890, "total_steps": 7776, "loss": 0.4826, "learning_rate": 2.0885502688025538e-06, "epoch": 11.856410256410257, "percentage": 37.17, "elapsed_time": "5:48:38", "remaining_time": "9:49:25", "throughput": 2132.36, "total_tokens": 44605088} {"current_steps": 2895, "total_steps": 7776, "loss": 0.4433, "learning_rate": 2.0857619705074912e-06, "epoch": 11.876923076923077, "percentage": 37.23, "elapsed_time": "5:48:56", "remaining_time": "9:48:19", "throughput": 2133.95, "total_tokens": 44677984} {"current_steps": 2900, "total_steps": 7776, "loss": 0.4122, "learning_rate": 2.082971281935195e-06, "epoch": 11.897435897435898, "percentage": 37.29, "elapsed_time": "5:49:14", "remaining_time": "9:47:13", "throughput": 2135.6, "total_tokens": 44751200} {"current_steps": 2905, "total_steps": 7776, "loss": 0.4266, "learning_rate": 2.0801782144734295e-06, "epoch": 11.917948717948718, "percentage": 37.36, "elapsed_time": "5:49:32", "remaining_time": "9:46:05", "throughput": 2137.32, "total_tokens": 44824672} {"current_steps": 2910, "total_steps": 7776, "loss": 0.4574, "learning_rate": 2.0773827795196667e-06, "epoch": 11.938461538461539, "percentage": 37.42, "elapsed_time": "5:49:54", "remaining_time": "9:45:06", "throughput": 2139.23, "total_tokens": 44912768} {"current_steps": 2915, "total_steps": 7776, "loss": 0.5026, "learning_rate": 2.074584988481039e-06, "epoch": 11.95897435897436, "percentage": 37.49, "elapsed_time": "5:50:47", "remaining_time": "9:44:59", "throughput": 2137.68, "total_tokens": 44993632} {"current_steps": 2920, "total_steps": 7776, "loss": 0.5444, "learning_rate": 2.0717848527742935e-06, "epoch": 11.97948717948718, "percentage": 37.55, "elapsed_time": "5:51:36", "remaining_time": "9:44:44", "throughput": 2136.39, "total_tokens": 45070848} {"current_steps": 2925, "total_steps": 7776, "loss": 0.4509, "learning_rate": 2.0689823838257455e-06, "epoch": 12.0, "percentage": 37.62, "elapsed_time": "5:52:27", "remaining_time": "9:44:33", "throughput": 2134.98, "total_tokens": 45150496} {"current_steps": 2930, "total_steps": 7776, "loss": 0.4534, "learning_rate": 2.0661775930712297e-06, "epoch": 12.02051282051282, "percentage": 37.68, "elapsed_time": "5:53:15", "remaining_time": "9:44:15", "throughput": 2133.74, "total_tokens": 45225440} {"current_steps": 2935, "total_steps": 7776, "loss": 0.5264, "learning_rate": 2.0633704919560573e-06, "epoch": 12.04102564102564, "percentage": 37.74, "elapsed_time": "5:54:00", "remaining_time": "9:43:54", "throughput": 2132.77, "total_tokens": 45300992} {"current_steps": 2940, "total_steps": 7776, "loss": 0.4373, "learning_rate": 2.0605610919349658e-06, "epoch": 12.061538461538461, "percentage": 37.81, "elapsed_time": "5:54:49", "remaining_time": "9:43:39", "throughput": 2131.47, "total_tokens": 45378944} {"current_steps": 2945, "total_steps": 7776, "loss": 0.4779, "learning_rate": 2.0577494044720746e-06, "epoch": 12.082051282051282, "percentage": 37.87, "elapsed_time": "5:55:32", "remaining_time": "9:43:13", "throughput": 2130.76, "total_tokens": 45453504} {"current_steps": 2950, "total_steps": 7776, "loss": 0.556, "learning_rate": 2.0549354410408364e-06, "epoch": 12.102564102564102, "percentage": 37.94, "elapsed_time": "5:56:28", "remaining_time": "9:43:09", "throughput": 2128.89, "total_tokens": 45532992} {"current_steps": 2955, "total_steps": 7776, "loss": 0.5152, "learning_rate": 2.052119213123992e-06, "epoch": 12.123076923076923, "percentage": 38.0, "elapsed_time": "5:57:15", "remaining_time": "9:42:50", "throughput": 2127.78, "total_tokens": 45609120} {"current_steps": 2960, "total_steps": 7776, "loss": 0.4412, "learning_rate": 2.049300732213522e-06, "epoch": 12.143589743589743, "percentage": 38.07, "elapsed_time": "5:58:07", "remaining_time": "9:42:40", "throughput": 2126.42, "total_tokens": 45690624} {"current_steps": 2965, "total_steps": 7776, "loss": 0.4553, "learning_rate": 2.046480009810602e-06, "epoch": 12.164102564102564, "percentage": 38.13, "elapsed_time": "5:58:45", "remaining_time": "9:42:06", "throughput": 2126.02, "total_tokens": 45763264} {"current_steps": 2970, "total_steps": 7776, "loss": 0.4913, "learning_rate": 2.0436570574255523e-06, "epoch": 12.184615384615384, "percentage": 38.19, "elapsed_time": "5:59:34", "remaining_time": "9:41:51", "throughput": 2125.17, "total_tokens": 45849472} {"current_steps": 2975, "total_steps": 7776, "loss": 0.5487, "learning_rate": 2.0408318865777953e-06, "epoch": 12.205128205128204, "percentage": 38.26, "elapsed_time": "6:01:04", "remaining_time": "9:42:42", "throughput": 2119.91, "total_tokens": 45927552} {"current_steps": 2980, "total_steps": 7776, "loss": 0.465, "learning_rate": 2.0380045087958036e-06, "epoch": 12.225641025641025, "percentage": 38.32, "elapsed_time": "6:01:49", "remaining_time": "9:42:18", "throughput": 2119.05, "total_tokens": 46002656} {"current_steps": 2985, "total_steps": 7776, "loss": 0.4854, "learning_rate": 2.0351749356170574e-06, "epoch": 12.246153846153845, "percentage": 38.39, "elapsed_time": "6:02:42", "remaining_time": "9:42:10", "throughput": 2117.72, "total_tokens": 46087904} {"current_steps": 2990, "total_steps": 7776, "loss": 0.4568, "learning_rate": 2.032343178587995e-06, "epoch": 12.266666666666667, "percentage": 38.45, "elapsed_time": "6:03:26", "remaining_time": "9:41:45", "throughput": 2117.04, "total_tokens": 46165408} {"current_steps": 2995, "total_steps": 7776, "loss": 0.4926, "learning_rate": 2.0295092492639657e-06, "epoch": 12.287179487179488, "percentage": 38.52, "elapsed_time": "6:04:00", "remaining_time": "9:41:04", "throughput": 2117.06, "total_tokens": 46237344} {"current_steps": 3000, "total_steps": 7776, "loss": 0.5093, "learning_rate": 2.0266731592091834e-06, "epoch": 12.307692307692308, "percentage": 38.58, "elapsed_time": "6:04:32", "remaining_time": "9:40:20", "throughput": 2117.18, "total_tokens": 46307456} {"current_steps": 3005, "total_steps": 7776, "loss": 0.5077, "learning_rate": 2.0238349199966793e-06, "epoch": 12.328205128205129, "percentage": 38.64, "elapsed_time": "6:05:19", "remaining_time": "9:40:02", "throughput": 2116.36, "total_tokens": 46390688} {"current_steps": 3010, "total_steps": 7776, "loss": 0.4541, "learning_rate": 2.020994543208254e-06, "epoch": 12.34871794871795, "percentage": 38.71, "elapsed_time": "6:06:00", "remaining_time": "9:39:31", "throughput": 2115.99, "total_tokens": 46467904} {"current_steps": 3015, "total_steps": 7776, "loss": 0.4975, "learning_rate": 2.018152040434432e-06, "epoch": 12.36923076923077, "percentage": 38.77, "elapsed_time": "6:06:34", "remaining_time": "9:38:52", "throughput": 2116.22, "total_tokens": 46545632} {"current_steps": 3020, "total_steps": 7776, "loss": 0.4988, "learning_rate": 2.015307423274411e-06, "epoch": 12.38974358974359, "percentage": 38.84, "elapsed_time": "6:07:15", "remaining_time": "9:38:22", "throughput": 2115.85, "total_tokens": 46624768} {"current_steps": 3025, "total_steps": 7776, "loss": 0.4877, "learning_rate": 2.0124607033360193e-06, "epoch": 12.41025641025641, "percentage": 38.9, "elapsed_time": "6:07:45", "remaining_time": "9:37:35", "throughput": 2116.21, "total_tokens": 46694528} {"current_steps": 3030, "total_steps": 7776, "loss": 0.4621, "learning_rate": 2.0096118922356646e-06, "epoch": 12.430769230769231, "percentage": 38.97, "elapsed_time": "6:08:14", "remaining_time": "9:36:47", "throughput": 2116.67, "total_tokens": 46767520} {"current_steps": 3035, "total_steps": 7776, "loss": 0.4742, "learning_rate": 2.0067610015982868e-06, "epoch": 12.451282051282051, "percentage": 39.03, "elapsed_time": "6:08:51", "remaining_time": "9:36:12", "throughput": 2116.56, "total_tokens": 46843616} {"current_steps": 3040, "total_steps": 7776, "loss": 0.3993, "learning_rate": 2.0039080430573133e-06, "epoch": 12.471794871794872, "percentage": 39.09, "elapsed_time": "6:09:21", "remaining_time": "9:35:24", "throughput": 2116.99, "total_tokens": 46915136} {"current_steps": 3045, "total_steps": 7776, "loss": 0.464, "learning_rate": 2.0010530282546093e-06, "epoch": 12.492307692307692, "percentage": 39.16, "elapsed_time": "6:09:52", "remaining_time": "9:34:40", "throughput": 2117.48, "total_tokens": 46992000} {"current_steps": 3050, "total_steps": 7776, "loss": 0.4744, "learning_rate": 1.9981959688404303e-06, "epoch": 12.512820512820513, "percentage": 39.22, "elapsed_time": "6:10:27", "remaining_time": "9:34:02", "throughput": 2117.86, "total_tokens": 47075360} {"current_steps": 3055, "total_steps": 7776, "loss": 0.4788, "learning_rate": 1.9953368764733763e-06, "epoch": 12.533333333333333, "percentage": 39.29, "elapsed_time": "6:10:57", "remaining_time": "9:33:14", "throughput": 2118.56, "total_tokens": 47152704} {"current_steps": 3060, "total_steps": 7776, "loss": 0.4704, "learning_rate": 1.992475762820342e-06, "epoch": 12.553846153846154, "percentage": 39.35, "elapsed_time": "6:11:26", "remaining_time": "9:32:26", "throughput": 2119.24, "total_tokens": 47229696} {"current_steps": 3065, "total_steps": 7776, "loss": 0.4645, "learning_rate": 1.9896126395564695e-06, "epoch": 12.574358974358974, "percentage": 39.42, "elapsed_time": "6:11:58", "remaining_time": "9:31:43", "throughput": 2119.67, "total_tokens": 47307360} {"current_steps": 3070, "total_steps": 7776, "loss": 0.5485, "learning_rate": 1.986747518365104e-06, "epoch": 12.594871794871795, "percentage": 39.48, "elapsed_time": "6:12:41", "remaining_time": "9:31:17", "throughput": 2119.47, "total_tokens": 47393824} {"current_steps": 3075, "total_steps": 7776, "loss": 0.511, "learning_rate": 1.9838804109377405e-06, "epoch": 12.615384615384615, "percentage": 39.54, "elapsed_time": "6:13:10", "remaining_time": "9:30:29", "throughput": 2120.36, "total_tokens": 47475104} {"current_steps": 3080, "total_steps": 7776, "loss": 0.4624, "learning_rate": 1.9810113289739818e-06, "epoch": 12.635897435897435, "percentage": 39.61, "elapsed_time": "6:13:34", "remaining_time": "9:29:34", "throughput": 2121.35, "total_tokens": 47548704} {"current_steps": 3085, "total_steps": 7776, "loss": 0.5197, "learning_rate": 1.9781402841814855e-06, "epoch": 12.656410256410256, "percentage": 39.67, "elapsed_time": "6:14:05", "remaining_time": "9:28:49", "throughput": 2122.46, "total_tokens": 47638880} {"current_steps": 3090, "total_steps": 7776, "loss": 0.4277, "learning_rate": 1.9752672882759204e-06, "epoch": 12.676923076923076, "percentage": 39.74, "elapsed_time": "6:14:27", "remaining_time": "9:27:51", "throughput": 2123.61, "total_tokens": 47711456} {"current_steps": 3095, "total_steps": 7776, "loss": 0.5166, "learning_rate": 1.972392352980917e-06, "epoch": 12.697435897435897, "percentage": 39.8, "elapsed_time": "6:14:50", "remaining_time": "9:26:55", "throughput": 2124.78, "total_tokens": 47787776} {"current_steps": 3100, "total_steps": 7776, "loss": 0.4201, "learning_rate": 1.969515490028019e-06, "epoch": 12.717948717948717, "percentage": 39.87, "elapsed_time": "6:15:10", "remaining_time": "9:25:54", "throughput": 2126.12, "total_tokens": 47860480} {"current_steps": 3105, "total_steps": 7776, "loss": 0.4425, "learning_rate": 1.966636711156636e-06, "epoch": 12.73846153846154, "percentage": 39.93, "elapsed_time": "6:15:33", "remaining_time": "9:24:58", "throughput": 2127.34, "total_tokens": 47936704} {"current_steps": 3110, "total_steps": 7776, "loss": 0.5056, "learning_rate": 1.9637560281139982e-06, "epoch": 12.75897435897436, "percentage": 39.99, "elapsed_time": "6:16:00", "remaining_time": "9:24:07", "throughput": 2128.58, "total_tokens": 48021792} {"current_steps": 3115, "total_steps": 7776, "loss": 0.4929, "learning_rate": 1.960873452655102e-06, "epoch": 12.77948717948718, "percentage": 40.06, "elapsed_time": "6:16:22", "remaining_time": "9:23:10", "throughput": 2130.05, "total_tokens": 48101984} {"current_steps": 3120, "total_steps": 7776, "loss": 0.4868, "learning_rate": 1.95798899654267e-06, "epoch": 12.8, "percentage": 40.12, "elapsed_time": "6:16:45", "remaining_time": "9:22:14", "throughput": 2131.66, "total_tokens": 48186688} {"current_steps": 3125, "total_steps": 7776, "loss": 0.4668, "learning_rate": 1.9551026715470954e-06, "epoch": 12.820512820512821, "percentage": 40.19, "elapsed_time": "6:17:03", "remaining_time": "9:21:10", "throughput": 2133.19, "total_tokens": 48259872} {"current_steps": 3130, "total_steps": 7776, "loss": 0.53, "learning_rate": 1.952214489446401e-06, "epoch": 12.841025641025642, "percentage": 40.25, "elapsed_time": "6:17:25", "remaining_time": "9:20:14", "throughput": 2134.93, "total_tokens": 48347232} {"current_steps": 3135, "total_steps": 7776, "loss": 0.4388, "learning_rate": 1.949324462026185e-06, "epoch": 12.861538461538462, "percentage": 40.32, "elapsed_time": "6:17:42", "remaining_time": "9:19:09", "throughput": 2136.66, "total_tokens": 48422624} {"current_steps": 3140, "total_steps": 7776, "loss": 0.4246, "learning_rate": 1.9464326010795776e-06, "epoch": 12.882051282051282, "percentage": 40.38, "elapsed_time": "6:18:24", "remaining_time": "9:18:42", "throughput": 2135.76, "total_tokens": 48492288} {"current_steps": 3145, "total_steps": 7776, "loss": 0.5186, "learning_rate": 1.9435389184071895e-06, "epoch": 12.902564102564103, "percentage": 40.44, "elapsed_time": "6:19:17", "remaining_time": "9:18:30", "throughput": 2134.15, "total_tokens": 48568224} {"current_steps": 3150, "total_steps": 7776, "loss": 0.4351, "learning_rate": 1.9406434258170666e-06, "epoch": 12.923076923076923, "percentage": 40.51, "elapsed_time": "6:19:58", "remaining_time": "9:18:01", "throughput": 2133.32, "total_tokens": 48637280} {"current_steps": 3155, "total_steps": 7776, "loss": 0.5281, "learning_rate": 1.9377461351246395e-06, "epoch": 12.943589743589744, "percentage": 40.57, "elapsed_time": "6:20:48", "remaining_time": "9:17:44", "throughput": 2132.2, "total_tokens": 48717088} {"current_steps": 3160, "total_steps": 7776, "loss": 0.4308, "learning_rate": 1.9348470581526763e-06, "epoch": 12.964102564102564, "percentage": 40.64, "elapsed_time": "6:21:28", "remaining_time": "9:17:15", "throughput": 2131.5, "total_tokens": 48787584} {"current_steps": 3165, "total_steps": 7776, "loss": 0.4133, "learning_rate": 1.9319462067312344e-06, "epoch": 12.984615384615385, "percentage": 40.7, "elapsed_time": "6:22:25", "remaining_time": "9:17:09", "throughput": 2129.57, "total_tokens": 48864640} {"current_steps": 3170, "total_steps": 7776, "loss": 0.4802, "learning_rate": 1.929043592697612e-06, "epoch": 13.005128205128205, "percentage": 40.77, "elapsed_time": "6:23:06", "remaining_time": "9:16:39", "throughput": 2128.98, "total_tokens": 48938176} {"current_steps": 3175, "total_steps": 7776, "loss": 0.4504, "learning_rate": 1.926139227896299e-06, "epoch": 13.025641025641026, "percentage": 40.83, "elapsed_time": "6:23:50", "remaining_time": "9:16:14", "throughput": 2128.26, "total_tokens": 49015040} {"current_steps": 3180, "total_steps": 7776, "loss": 0.494, "learning_rate": 1.923233124178932e-06, "epoch": 13.046153846153846, "percentage": 40.9, "elapsed_time": "6:24:35", "remaining_time": "9:15:50", "throughput": 2127.45, "total_tokens": 49091680} {"current_steps": 3185, "total_steps": 7776, "loss": 0.4628, "learning_rate": 1.9203252934042403e-06, "epoch": 13.066666666666666, "percentage": 40.96, "elapsed_time": "6:25:15", "remaining_time": "9:15:19", "throughput": 2126.97, "total_tokens": 49165600} {"current_steps": 3190, "total_steps": 7776, "loss": 0.4431, "learning_rate": 1.9174157474380034e-06, "epoch": 13.087179487179487, "percentage": 41.02, "elapsed_time": "6:25:59", "remaining_time": "9:14:55", "throughput": 2126.39, "total_tokens": 49247136} {"current_steps": 3195, "total_steps": 7776, "loss": 0.4479, "learning_rate": 1.914504498152998e-06, "epoch": 13.107692307692307, "percentage": 41.09, "elapsed_time": "6:26:37", "remaining_time": "9:14:20", "throughput": 2126.06, "total_tokens": 49319648} {"current_steps": 3200, "total_steps": 7776, "loss": 0.4278, "learning_rate": 1.9115915574289525e-06, "epoch": 13.128205128205128, "percentage": 41.15, "elapsed_time": "6:27:15", "remaining_time": "9:13:46", "throughput": 2125.77, "total_tokens": 49393216} {"current_steps": 3205, "total_steps": 7776, "loss": 0.5124, "learning_rate": 1.9086769371524966e-06, "epoch": 13.148717948717948, "percentage": 41.22, "elapsed_time": "6:28:37", "remaining_time": "9:14:15", "throughput": 2122.06, "total_tokens": 49480864} {"current_steps": 3210, "total_steps": 7776, "loss": 0.4438, "learning_rate": 1.9057606492171144e-06, "epoch": 13.169230769230769, "percentage": 41.28, "elapsed_time": "6:29:23", "remaining_time": "9:13:53", "throughput": 2121.23, "total_tokens": 49559904} {"current_steps": 3215, "total_steps": 7776, "loss": 0.4312, "learning_rate": 1.9028427055230948e-06, "epoch": 13.189743589743589, "percentage": 41.35, "elapsed_time": "6:29:57", "remaining_time": "9:13:13", "throughput": 2121.18, "total_tokens": 49630240} {"current_steps": 3220, "total_steps": 7776, "loss": 0.5431, "learning_rate": 1.8999231179774833e-06, "epoch": 13.21025641025641, "percentage": 41.41, "elapsed_time": "6:30:44", "remaining_time": "9:12:51", "throughput": 2120.33, "total_tokens": 49709888} {"current_steps": 3225, "total_steps": 7776, "loss": 0.4567, "learning_rate": 1.897001898494033e-06, "epoch": 13.23076923076923, "percentage": 41.47, "elapsed_time": "6:31:15", "remaining_time": "9:12:07", "throughput": 2120.5, "total_tokens": 49778848} {"current_steps": 3230, "total_steps": 7776, "loss": 0.4227, "learning_rate": 1.8940790589931568e-06, "epoch": 13.25128205128205, "percentage": 41.54, "elapsed_time": "6:31:46", "remaining_time": "9:11:24", "throughput": 2120.62, "total_tokens": 49849024} {"current_steps": 3235, "total_steps": 7776, "loss": 0.4738, "learning_rate": 1.8911546114018775e-06, "epoch": 13.271794871794873, "percentage": 41.6, "elapsed_time": "6:32:17", "remaining_time": "9:10:39", "throughput": 2120.8, "total_tokens": 49917952} {"current_steps": 3240, "total_steps": 7776, "loss": 0.4661, "learning_rate": 1.888228567653781e-06, "epoch": 13.292307692307693, "percentage": 41.67, "elapsed_time": "6:33:06", "remaining_time": "9:10:20", "throughput": 2120.01, "total_tokens": 50003392} {"current_steps": 3245, "total_steps": 7776, "loss": 0.5039, "learning_rate": 1.8853009396889665e-06, "epoch": 13.312820512820513, "percentage": 41.73, "elapsed_time": "6:33:47", "remaining_time": "9:09:51", "throughput": 2119.75, "total_tokens": 50085280} {"current_steps": 3250, "total_steps": 7776, "loss": 0.4442, "learning_rate": 1.8823717394539966e-06, "epoch": 13.333333333333334, "percentage": 41.8, "elapsed_time": "6:34:43", "remaining_time": "9:09:41", "throughput": 2118.23, "total_tokens": 50166304} {"current_steps": 3255, "total_steps": 7776, "loss": 0.5048, "learning_rate": 1.8794409789018507e-06, "epoch": 13.353846153846154, "percentage": 41.86, "elapsed_time": "6:35:28", "remaining_time": "9:09:17", "throughput": 2117.62, "total_tokens": 50247200} {"current_steps": 3260, "total_steps": 7776, "loss": 0.4615, "learning_rate": 1.8765086699918747e-06, "epoch": 13.374358974358975, "percentage": 41.92, "elapsed_time": "6:35:57", "remaining_time": "9:08:30", "throughput": 2118.15, "total_tokens": 50321120} {"current_steps": 3265, "total_steps": 7776, "loss": 0.4838, "learning_rate": 1.8735748246897337e-06, "epoch": 13.394871794871795, "percentage": 41.99, "elapsed_time": "6:36:39", "remaining_time": "9:08:01", "throughput": 2117.87, "total_tokens": 50403680} {"current_steps": 3270, "total_steps": 7776, "loss": 0.4454, "learning_rate": 1.8706394549673615e-06, "epoch": 13.415384615384616, "percentage": 42.05, "elapsed_time": "6:37:17", "remaining_time": "9:07:27", "throughput": 2117.76, "total_tokens": 50481504} {"current_steps": 3275, "total_steps": 7776, "loss": 0.4806, "learning_rate": 1.8677025728029122e-06, "epoch": 13.435897435897436, "percentage": 42.12, "elapsed_time": "6:37:44", "remaining_time": "9:06:38", "throughput": 2118.44, "total_tokens": 50556448} {"current_steps": 3280, "total_steps": 7776, "loss": 0.4601, "learning_rate": 1.8647641901807126e-06, "epoch": 13.456410256410257, "percentage": 42.18, "elapsed_time": "6:38:11", "remaining_time": "9:05:49", "throughput": 2119.14, "total_tokens": 50630304} {"current_steps": 3285, "total_steps": 7776, "loss": 0.4513, "learning_rate": 1.861824319091212e-06, "epoch": 13.476923076923077, "percentage": 42.25, "elapsed_time": "6:38:38", "remaining_time": "9:05:00", "throughput": 2119.86, "total_tokens": 50704704} {"current_steps": 3290, "total_steps": 7776, "loss": 0.4704, "learning_rate": 1.8588829715309324e-06, "epoch": 13.497435897435897, "percentage": 42.31, "elapsed_time": "6:39:07", "remaining_time": "9:04:12", "throughput": 2120.61, "total_tokens": 50782464} {"current_steps": 3295, "total_steps": 7776, "loss": 0.4959, "learning_rate": 1.855940159502423e-06, "epoch": 13.517948717948718, "percentage": 42.37, "elapsed_time": "6:39:34", "remaining_time": "9:03:23", "throughput": 2121.49, "total_tokens": 50861696} {"current_steps": 3300, "total_steps": 7776, "loss": 0.5215, "learning_rate": 1.8529958950142066e-06, "epoch": 13.538461538461538, "percentage": 42.44, "elapsed_time": "6:40:15", "remaining_time": "9:02:53", "throughput": 2121.52, "total_tokens": 50949568} {"current_steps": 3305, "total_steps": 7776, "loss": 0.4692, "learning_rate": 1.8500501900807345e-06, "epoch": 13.558974358974359, "percentage": 42.5, "elapsed_time": "6:40:37", "remaining_time": "9:01:58", "throughput": 2122.44, "total_tokens": 51018432} {"current_steps": 3310, "total_steps": 7776, "loss": 0.5015, "learning_rate": 1.847103056722335e-06, "epoch": 13.57948717948718, "percentage": 42.57, "elapsed_time": "6:41:04", "remaining_time": "9:01:08", "throughput": 2123.47, "total_tokens": 51100352} {"current_steps": 3315, "total_steps": 7776, "loss": 0.4779, "learning_rate": 1.8441545069651665e-06, "epoch": 13.6, "percentage": 42.63, "elapsed_time": "6:41:32", "remaining_time": "9:00:21", "throughput": 2124.23, "total_tokens": 51178144} {"current_steps": 3320, "total_steps": 7776, "loss": 0.4971, "learning_rate": 1.8412045528411652e-06, "epoch": 13.62051282051282, "percentage": 42.7, "elapsed_time": "6:41:59", "remaining_time": "8:59:32", "throughput": 2125.35, "total_tokens": 51262432} {"current_steps": 3325, "total_steps": 7776, "loss": 0.5063, "learning_rate": 1.8382532063880005e-06, "epoch": 13.64102564102564, "percentage": 42.76, "elapsed_time": "6:42:24", "remaining_time": "8:58:40", "throughput": 2126.51, "total_tokens": 51342624} {"current_steps": 3330, "total_steps": 7776, "loss": 0.4273, "learning_rate": 1.8353004796490212e-06, "epoch": 13.661538461538461, "percentage": 42.82, "elapsed_time": "6:42:42", "remaining_time": "8:57:40", "throughput": 2127.83, "total_tokens": 51413920} {"current_steps": 3335, "total_steps": 7776, "loss": 0.5491, "learning_rate": 1.8323463846732099e-06, "epoch": 13.682051282051281, "percentage": 42.89, "elapsed_time": "6:43:32", "remaining_time": "8:57:22", "throughput": 2127.05, "total_tokens": 51501184} {"current_steps": 3340, "total_steps": 7776, "loss": 0.4199, "learning_rate": 1.8293909335151316e-06, "epoch": 13.702564102564102, "percentage": 42.95, "elapsed_time": "6:43:50", "remaining_time": "8:56:21", "throughput": 2128.35, "total_tokens": 51570944} {"current_steps": 3345, "total_steps": 7776, "loss": 0.4468, "learning_rate": 1.826434138234886e-06, "epoch": 13.723076923076922, "percentage": 43.02, "elapsed_time": "6:44:11", "remaining_time": "8:55:25", "throughput": 2129.8, "total_tokens": 51650784} {"current_steps": 3350, "total_steps": 7776, "loss": 0.5225, "learning_rate": 1.8234760108980572e-06, "epoch": 13.743589743589745, "percentage": 43.08, "elapsed_time": "6:44:31", "remaining_time": "8:54:27", "throughput": 2131.32, "total_tokens": 51731008} {"current_steps": 3355, "total_steps": 7776, "loss": 0.4634, "learning_rate": 1.820516563575665e-06, "epoch": 13.764102564102565, "percentage": 43.15, "elapsed_time": "6:44:50", "remaining_time": "8:53:28", "throughput": 2132.88, "total_tokens": 51809056} {"current_steps": 3360, "total_steps": 7776, "loss": 0.5321, "learning_rate": 1.8175558083441164e-06, "epoch": 13.784615384615385, "percentage": 43.21, "elapsed_time": "6:45:14", "remaining_time": "8:52:36", "throughput": 2133.95, "total_tokens": 51886688} {"current_steps": 3365, "total_steps": 7776, "loss": 0.4633, "learning_rate": 1.814593757285154e-06, "epoch": 13.805128205128206, "percentage": 43.27, "elapsed_time": "6:45:58", "remaining_time": "8:52:10", "throughput": 2133.13, "total_tokens": 51959488} {"current_steps": 3370, "total_steps": 7776, "loss": 0.4812, "learning_rate": 1.8116304224858092e-06, "epoch": 13.825641025641026, "percentage": 43.34, "elapsed_time": "6:46:47", "remaining_time": "8:51:50", "throughput": 2131.94, "total_tokens": 52035424} {"current_steps": 3375, "total_steps": 7776, "loss": 0.506, "learning_rate": 1.8086658160383524e-06, "epoch": 13.846153846153847, "percentage": 43.4, "elapsed_time": "6:47:36", "remaining_time": "8:51:31", "throughput": 2130.82, "total_tokens": 52112576} {"current_steps": 3380, "total_steps": 7776, "loss": 0.5091, "learning_rate": 1.8056999500402414e-06, "epoch": 13.866666666666667, "percentage": 43.47, "elapsed_time": "6:49:04", "remaining_time": "8:52:02", "throughput": 2126.78, "total_tokens": 52200480} {"current_steps": 3385, "total_steps": 7776, "loss": 0.4861, "learning_rate": 1.8027328365940755e-06, "epoch": 13.887179487179488, "percentage": 43.53, "elapsed_time": "6:49:46", "remaining_time": "8:51:34", "throughput": 2126.1, "total_tokens": 52274368} {"current_steps": 3390, "total_steps": 7776, "loss": 0.5051, "learning_rate": 1.799764487807543e-06, "epoch": 13.907692307692308, "percentage": 43.6, "elapsed_time": "6:50:32", "remaining_time": "8:51:09", "throughput": 2125.29, "total_tokens": 52350656} {"current_steps": 3395, "total_steps": 7776, "loss": 0.4608, "learning_rate": 1.7967949157933742e-06, "epoch": 13.928205128205128, "percentage": 43.66, "elapsed_time": "6:51:16", "remaining_time": "8:50:43", "throughput": 2124.56, "total_tokens": 52427328} {"current_steps": 3400, "total_steps": 7776, "loss": 0.4719, "learning_rate": 1.7938241326692907e-06, "epoch": 13.948717948717949, "percentage": 43.72, "elapsed_time": "6:52:10", "remaining_time": "8:50:29", "throughput": 2123.03, "total_tokens": 52503840} {"current_steps": 3405, "total_steps": 7776, "loss": 0.5062, "learning_rate": 1.7908521505579554e-06, "epoch": 13.96923076923077, "percentage": 43.79, "elapsed_time": "6:52:51", "remaining_time": "8:49:58", "throughput": 2122.52, "total_tokens": 52577056} {"current_steps": 3410, "total_steps": 7776, "loss": 0.5096, "learning_rate": 1.7878789815869247e-06, "epoch": 13.98974358974359, "percentage": 43.85, "elapsed_time": "6:53:45", "remaining_time": "8:49:45", "throughput": 2121.05, "total_tokens": 52656000} {"current_steps": 3415, "total_steps": 7776, "loss": 0.4476, "learning_rate": 1.7849046378885977e-06, "epoch": 14.01025641025641, "percentage": 43.92, "elapsed_time": "6:54:21", "remaining_time": "8:49:08", "throughput": 2120.79, "total_tokens": 52725312} {"current_steps": 3420, "total_steps": 7776, "loss": 0.436, "learning_rate": 1.7819291316001679e-06, "epoch": 14.03076923076923, "percentage": 43.98, "elapsed_time": "6:55:03", "remaining_time": "8:48:39", "throughput": 2120.38, "total_tokens": 52804736} {"current_steps": 3425, "total_steps": 7776, "loss": 0.4761, "learning_rate": 1.7789524748635717e-06, "epoch": 14.051282051282051, "percentage": 44.05, "elapsed_time": "6:55:51", "remaining_time": "8:48:18", "throughput": 2119.48, "total_tokens": 52885056} {"current_steps": 3430, "total_steps": 7776, "loss": 0.5039, "learning_rate": 1.775974679825441e-06, "epoch": 14.071794871794872, "percentage": 44.11, "elapsed_time": "6:56:34", "remaining_time": "8:47:48", "throughput": 2119.03, "total_tokens": 52963136} {"current_steps": 3435, "total_steps": 7776, "loss": 0.5039, "learning_rate": 1.7729957586370525e-06, "epoch": 14.092307692307692, "percentage": 44.17, "elapsed_time": "6:58:10", "remaining_time": "8:48:28", "throughput": 2114.32, "total_tokens": 53049856} {"current_steps": 3440, "total_steps": 7776, "loss": 0.5397, "learning_rate": 1.7700157234542773e-06, "epoch": 14.112820512820512, "percentage": 44.24, "elapsed_time": "6:58:49", "remaining_time": "8:47:55", "throughput": 2114.13, "total_tokens": 53127616} {"current_steps": 3445, "total_steps": 7776, "loss": 0.4747, "learning_rate": 1.7670345864375339e-06, "epoch": 14.133333333333333, "percentage": 44.3, "elapsed_time": "6:59:25", "remaining_time": "8:47:17", "throughput": 2114.08, "total_tokens": 53201600} {"current_steps": 3450, "total_steps": 7776, "loss": 0.4582, "learning_rate": 1.7640523597517357e-06, "epoch": 14.153846153846153, "percentage": 44.37, "elapsed_time": "6:59:59", "remaining_time": "8:46:37", "throughput": 2114.18, "total_tokens": 53275520} {"current_steps": 3455, "total_steps": 7776, "loss": 0.4747, "learning_rate": 1.7610690555662435e-06, "epoch": 14.174358974358974, "percentage": 44.43, "elapsed_time": "7:00:31", "remaining_time": "8:45:55", "throughput": 2114.3, "total_tokens": 53346720} {"current_steps": 3460, "total_steps": 7776, "loss": 0.4758, "learning_rate": 1.7580846860548146e-06, "epoch": 14.194871794871794, "percentage": 44.5, "elapsed_time": "7:01:05", "remaining_time": "8:45:15", "throughput": 2114.39, "total_tokens": 53420864} {"current_steps": 3465, "total_steps": 7776, "loss": 0.4305, "learning_rate": 1.7550992633955535e-06, "epoch": 14.215384615384615, "percentage": 44.56, "elapsed_time": "7:01:35", "remaining_time": "8:44:32", "throughput": 2114.61, "total_tokens": 53490976} {"current_steps": 3470, "total_steps": 7776, "loss": 0.4533, "learning_rate": 1.7521127997708621e-06, "epoch": 14.235897435897435, "percentage": 44.62, "elapsed_time": "7:02:11", "remaining_time": "8:43:53", "throughput": 2114.83, "total_tokens": 53570816} {"current_steps": 3475, "total_steps": 7776, "loss": 0.5019, "learning_rate": 1.7491253073673903e-06, "epoch": 14.256410256410255, "percentage": 44.69, "elapsed_time": "7:02:50", "remaining_time": "8:43:20", "throughput": 2114.55, "total_tokens": 53647072} {"current_steps": 3480, "total_steps": 7776, "loss": 0.4575, "learning_rate": 1.7461367983759862e-06, "epoch": 14.276923076923078, "percentage": 44.75, "elapsed_time": "7:03:32", "remaining_time": "8:42:51", "throughput": 2114.24, "total_tokens": 53727648} {"current_steps": 3485, "total_steps": 7776, "loss": 0.4728, "learning_rate": 1.7431472849916455e-06, "epoch": 14.297435897435898, "percentage": 44.82, "elapsed_time": "7:04:00", "remaining_time": "8:42:04", "throughput": 2114.77, "total_tokens": 53800544} {"current_steps": 3490, "total_steps": 7776, "loss": 0.4677, "learning_rate": 1.7401567794134636e-06, "epoch": 14.317948717948719, "percentage": 44.88, "elapsed_time": "7:04:30", "remaining_time": "8:41:19", "throughput": 2115.22, "total_tokens": 53875552} {"current_steps": 3495, "total_steps": 7776, "loss": 0.456, "learning_rate": 1.737165293844583e-06, "epoch": 14.338461538461539, "percentage": 44.95, "elapsed_time": "7:05:03", "remaining_time": "8:40:39", "throughput": 2115.55, "total_tokens": 53954208} {"current_steps": 3500, "total_steps": 7776, "loss": 0.4798, "learning_rate": 1.7341728404921471e-06, "epoch": 14.35897435897436, "percentage": 45.01, "elapsed_time": "7:05:34", "remaining_time": "8:39:56", "throughput": 2116.05, "total_tokens": 54033248} {"current_steps": 3505, "total_steps": 7776, "loss": 0.4166, "learning_rate": 1.7311794315672477e-06, "epoch": 14.37948717948718, "percentage": 45.07, "elapsed_time": "7:06:02", "remaining_time": "8:39:08", "throughput": 2116.78, "total_tokens": 54109440} {"current_steps": 3510, "total_steps": 7776, "loss": 0.4663, "learning_rate": 1.7281850792848752e-06, "epoch": 14.4, "percentage": 45.14, "elapsed_time": "7:06:30", "remaining_time": "8:38:22", "throughput": 2117.44, "total_tokens": 54186368} {"current_steps": 3515, "total_steps": 7776, "loss": 0.4053, "learning_rate": 1.7251897958638704e-06, "epoch": 14.42051282051282, "percentage": 45.2, "elapsed_time": "7:06:59", "remaining_time": "8:37:36", "throughput": 2118.24, "total_tokens": 54267648} {"current_steps": 3520, "total_steps": 7776, "loss": 0.5342, "learning_rate": 1.7221935935268735e-06, "epoch": 14.441025641025641, "percentage": 45.27, "elapsed_time": "7:07:24", "remaining_time": "8:36:46", "throughput": 2119.07, "total_tokens": 54342304} {"current_steps": 3525, "total_steps": 7776, "loss": 0.4992, "learning_rate": 1.719196484500274e-06, "epoch": 14.461538461538462, "percentage": 45.33, "elapsed_time": "7:07:52", "remaining_time": "8:36:00", "throughput": 2119.91, "total_tokens": 54423808} {"current_steps": 3530, "total_steps": 7776, "loss": 0.5067, "learning_rate": 1.7161984810141625e-06, "epoch": 14.482051282051282, "percentage": 45.4, "elapsed_time": "7:08:20", "remaining_time": "8:35:13", "throughput": 2120.64, "total_tokens": 54501760} {"current_steps": 3535, "total_steps": 7776, "loss": 0.4286, "learning_rate": 1.7131995953022776e-06, "epoch": 14.502564102564103, "percentage": 45.46, "elapsed_time": "7:08:43", "remaining_time": "8:34:20", "throughput": 2121.7, "total_tokens": 54576512} {"current_steps": 3540, "total_steps": 7776, "loss": 0.436, "learning_rate": 1.7101998396019593e-06, "epoch": 14.523076923076923, "percentage": 45.52, "elapsed_time": "7:09:03", "remaining_time": "8:33:25", "throughput": 2122.82, "total_tokens": 54649696} {"current_steps": 3545, "total_steps": 7776, "loss": 0.4889, "learning_rate": 1.7071992261540983e-06, "epoch": 14.543589743589743, "percentage": 45.59, "elapsed_time": "7:09:26", "remaining_time": "8:32:33", "throughput": 2123.99, "total_tokens": 54728864} {"current_steps": 3550, "total_steps": 7776, "loss": 0.4585, "learning_rate": 1.7041977672030842e-06, "epoch": 14.564102564102564, "percentage": 45.65, "elapsed_time": "7:09:45", "remaining_time": "8:31:35", "throughput": 2125.16, "total_tokens": 54797856} {"current_steps": 3555, "total_steps": 7776, "loss": 0.4646, "learning_rate": 1.7011954749967564e-06, "epoch": 14.584615384615384, "percentage": 45.72, "elapsed_time": "7:10:06", "remaining_time": "8:30:40", "throughput": 2126.42, "total_tokens": 54875168} {"current_steps": 3560, "total_steps": 7776, "loss": 0.4894, "learning_rate": 1.6981923617863566e-06, "epoch": 14.605128205128205, "percentage": 45.78, "elapsed_time": "7:10:25", "remaining_time": "8:29:44", "throughput": 2127.72, "total_tokens": 54949312} {"current_steps": 3565, "total_steps": 7776, "loss": 0.5159, "learning_rate": 1.6951884398264742e-06, "epoch": 14.625641025641025, "percentage": 45.85, "elapsed_time": "7:10:44", "remaining_time": "8:28:47", "throughput": 2129.05, "total_tokens": 55024768} {"current_steps": 3570, "total_steps": 7776, "loss": 0.4221, "learning_rate": 1.692183721375001e-06, "epoch": 14.646153846153846, "percentage": 45.91, "elapsed_time": "7:11:03", "remaining_time": "8:27:50", "throughput": 2130.46, "total_tokens": 55100128} {"current_steps": 3575, "total_steps": 7776, "loss": 0.5417, "learning_rate": 1.6891782186930767e-06, "epoch": 14.666666666666666, "percentage": 45.97, "elapsed_time": "7:11:22", "remaining_time": "8:26:55", "throughput": 2131.99, "total_tokens": 55182080} {"current_steps": 3580, "total_steps": 7776, "loss": 0.5072, "learning_rate": 1.6861719440450437e-06, "epoch": 14.687179487179487, "percentage": 46.04, "elapsed_time": "7:11:46", "remaining_time": "8:26:04", "throughput": 2133.58, "total_tokens": 55274048} {"current_steps": 3585, "total_steps": 7776, "loss": 0.5008, "learning_rate": 1.6831649096983923e-06, "epoch": 14.707692307692307, "percentage": 46.1, "elapsed_time": "7:12:14", "remaining_time": "8:25:18", "throughput": 2134.12, "total_tokens": 55347648} {"current_steps": 3590, "total_steps": 7776, "loss": 0.4411, "learning_rate": 1.680157127923715e-06, "epoch": 14.728205128205127, "percentage": 46.17, "elapsed_time": "7:12:56", "remaining_time": "8:24:49", "throughput": 2133.37, "total_tokens": 55418368} {"current_steps": 3595, "total_steps": 7776, "loss": 0.4654, "learning_rate": 1.677148610994652e-06, "epoch": 14.74871794871795, "percentage": 46.23, "elapsed_time": "7:13:39", "remaining_time": "8:24:21", "throughput": 2132.62, "total_tokens": 55490176} {"current_steps": 3600, "total_steps": 7776, "loss": 0.4576, "learning_rate": 1.6741393711878454e-06, "epoch": 14.76923076923077, "percentage": 46.3, "elapsed_time": "7:14:46", "remaining_time": "8:24:19", "throughput": 2130.28, "total_tokens": 55570784} {"current_steps": 3605, "total_steps": 7776, "loss": 0.4488, "learning_rate": 1.6711294207828852e-06, "epoch": 14.78974358974359, "percentage": 46.36, "elapsed_time": "7:15:29", "remaining_time": "8:23:52", "throughput": 2129.54, "total_tokens": 55643936} {"current_steps": 3610, "total_steps": 7776, "loss": 0.5175, "learning_rate": 1.6681187720622627e-06, "epoch": 14.810256410256411, "percentage": 46.42, "elapsed_time": "7:16:28", "remaining_time": "8:23:41", "throughput": 2127.99, "total_tokens": 55727936} {"current_steps": 3615, "total_steps": 7776, "loss": 0.4271, "learning_rate": 1.6651074373113176e-06, "epoch": 14.830769230769231, "percentage": 46.49, "elapsed_time": "7:17:16", "remaining_time": "8:23:18", "throughput": 2127.02, "total_tokens": 55804992} {"current_steps": 3620, "total_steps": 7776, "loss": 0.4631, "learning_rate": 1.66209542881819e-06, "epoch": 14.851282051282052, "percentage": 46.55, "elapsed_time": "7:17:59", "remaining_time": "8:22:50", "throughput": 2126.36, "total_tokens": 55878976} {"current_steps": 3625, "total_steps": 7776, "loss": 0.5453, "learning_rate": 1.6590827588737685e-06, "epoch": 14.871794871794872, "percentage": 46.62, "elapsed_time": "7:19:02", "remaining_time": "8:22:44", "throughput": 2124.71, "total_tokens": 55969376} {"current_steps": 3630, "total_steps": 7776, "loss": 0.5086, "learning_rate": 1.6560694397716412e-06, "epoch": 14.892307692307693, "percentage": 46.68, "elapsed_time": "7:19:41", "remaining_time": "8:22:11", "throughput": 2124.27, "total_tokens": 56041024} {"current_steps": 3635, "total_steps": 7776, "loss": 0.4602, "learning_rate": 1.6530554838080458e-06, "epoch": 14.912820512820513, "percentage": 46.75, "elapsed_time": "7:20:23", "remaining_time": "8:21:41", "throughput": 2123.79, "total_tokens": 56117152} {"current_steps": 3640, "total_steps": 7776, "loss": 0.5046, "learning_rate": 1.6500409032818175e-06, "epoch": 14.933333333333334, "percentage": 46.81, "elapsed_time": "7:21:05", "remaining_time": "8:21:11", "throughput": 2123.18, "total_tokens": 56191264} {"current_steps": 3645, "total_steps": 7776, "loss": 0.53, "learning_rate": 1.6470257104943413e-06, "epoch": 14.953846153846154, "percentage": 46.88, "elapsed_time": "7:22:01", "remaining_time": "8:20:57", "throughput": 2122.03, "total_tokens": 56279264} {"current_steps": 3650, "total_steps": 7776, "loss": 0.4639, "learning_rate": 1.6440099177494991e-06, "epoch": 14.974358974358974, "percentage": 46.94, "elapsed_time": "7:22:37", "remaining_time": "8:20:21", "throughput": 2121.81, "total_tokens": 56350784} {"current_steps": 3655, "total_steps": 7776, "loss": 0.5015, "learning_rate": 1.6409935373536227e-06, "epoch": 14.994871794871795, "percentage": 47.0, "elapsed_time": "7:23:21", "remaining_time": "8:19:53", "throughput": 2121.32, "total_tokens": 56430432} {"current_steps": 3660, "total_steps": 7776, "loss": 0.4503, "learning_rate": 1.6379765816154413e-06, "epoch": 15.015384615384615, "percentage": 47.07, "elapsed_time": "7:24:00", "remaining_time": "8:19:19", "throughput": 2121.17, "total_tokens": 56509056} {"current_steps": 3665, "total_steps": 7776, "loss": 0.4688, "learning_rate": 1.634959062846031e-06, "epoch": 15.035897435897436, "percentage": 47.13, "elapsed_time": "7:24:32", "remaining_time": "8:18:38", "throughput": 2121.19, "total_tokens": 56578016} {"current_steps": 3670, "total_steps": 7776, "loss": 0.4761, "learning_rate": 1.631940993358767e-06, "epoch": 15.056410256410256, "percentage": 47.2, "elapsed_time": "7:25:09", "remaining_time": "8:18:02", "throughput": 2121.11, "total_tokens": 56653536} {"current_steps": 3675, "total_steps": 7776, "loss": 0.4433, "learning_rate": 1.6289223854692708e-06, "epoch": 15.076923076923077, "percentage": 47.26, "elapsed_time": "7:25:45", "remaining_time": "8:17:26", "throughput": 2121.09, "total_tokens": 56730560} {"current_steps": 3680, "total_steps": 7776, "loss": 0.4315, "learning_rate": 1.6259032514953601e-06, "epoch": 15.097435897435897, "percentage": 47.33, "elapsed_time": "7:26:25", "remaining_time": "8:16:52", "throughput": 2121.08, "total_tokens": 56813312} {"current_steps": 3685, "total_steps": 7776, "loss": 0.4885, "learning_rate": 1.6228836037570015e-06, "epoch": 15.117948717948718, "percentage": 47.39, "elapsed_time": "7:27:00", "remaining_time": "8:16:16", "throughput": 2121.15, "total_tokens": 56891264} {"current_steps": 3690, "total_steps": 7776, "loss": 0.4703, "learning_rate": 1.619863454576256e-06, "epoch": 15.138461538461538, "percentage": 47.45, "elapsed_time": "7:27:33", "remaining_time": "8:15:35", "throughput": 2121.32, "total_tokens": 56964864} {"current_steps": 3695, "total_steps": 7776, "loss": 0.4518, "learning_rate": 1.6168428162772322e-06, "epoch": 15.158974358974358, "percentage": 47.52, "elapsed_time": "7:28:59", "remaining_time": "8:15:53", "throughput": 2117.73, "total_tokens": 57050144} {"current_steps": 3700, "total_steps": 7776, "loss": 0.4858, "learning_rate": 1.6138217011860336e-06, "epoch": 15.179487179487179, "percentage": 47.58, "elapsed_time": "7:29:36", "remaining_time": "8:15:17", "throughput": 2117.61, "total_tokens": 57125632} {"current_steps": 3705, "total_steps": 7776, "loss": 0.459, "learning_rate": 1.6108001216307107e-06, "epoch": 15.2, "percentage": 47.65, "elapsed_time": "7:30:09", "remaining_time": "8:14:38", "throughput": 2117.89, "total_tokens": 57204128} {"current_steps": 3710, "total_steps": 7776, "loss": 0.4639, "learning_rate": 1.6077780899412068e-06, "epoch": 15.22051282051282, "percentage": 47.71, "elapsed_time": "7:30:42", "remaining_time": "8:13:57", "throughput": 2118.23, "total_tokens": 57281536} {"current_steps": 3715, "total_steps": 7776, "loss": 0.4496, "learning_rate": 1.6047556184493133e-06, "epoch": 15.24102564102564, "percentage": 47.78, "elapsed_time": "7:31:10", "remaining_time": "8:13:11", "throughput": 2118.73, "total_tokens": 57354816} {"current_steps": 3720, "total_steps": 7776, "loss": 0.5043, "learning_rate": 1.601732719488614e-06, "epoch": 15.261538461538462, "percentage": 47.84, "elapsed_time": "7:31:43", "remaining_time": "8:12:31", "throughput": 2119.14, "total_tokens": 57435328} {"current_steps": 3725, "total_steps": 7776, "loss": 0.4357, "learning_rate": 1.5987094053944384e-06, "epoch": 15.282051282051283, "percentage": 47.9, "elapsed_time": "7:32:10", "remaining_time": "8:11:44", "throughput": 2119.67, "total_tokens": 57507424} {"current_steps": 3730, "total_steps": 7776, "loss": 0.5211, "learning_rate": 1.5956856885038086e-06, "epoch": 15.302564102564103, "percentage": 47.97, "elapsed_time": "7:32:39", "remaining_time": "8:11:00", "throughput": 2120.29, "total_tokens": 57586880} {"current_steps": 3735, "total_steps": 7776, "loss": 0.5036, "learning_rate": 1.592661581155392e-06, "epoch": 15.323076923076924, "percentage": 48.03, "elapsed_time": "7:33:44", "remaining_time": "8:10:54", "throughput": 2118.3, "total_tokens": 57669600} {"current_steps": 3740, "total_steps": 7776, "loss": 0.4751, "learning_rate": 1.5896370956894477e-06, "epoch": 15.343589743589744, "percentage": 48.1, "elapsed_time": "7:34:11", "remaining_time": "8:10:08", "throughput": 2118.97, "total_tokens": 57744608} {"current_steps": 3745, "total_steps": 7776, "loss": 0.4764, "learning_rate": 1.5866122444477794e-06, "epoch": 15.364102564102565, "percentage": 48.16, "elapsed_time": "7:34:36", "remaining_time": "8:09:19", "throughput": 2119.7, "total_tokens": 57818496} {"current_steps": 3750, "total_steps": 7776, "loss": 0.4551, "learning_rate": 1.5835870397736817e-06, "epoch": 15.384615384615385, "percentage": 48.23, "elapsed_time": "7:35:06", "remaining_time": "8:08:36", "throughput": 2120.32, "total_tokens": 57898432} {"current_steps": 3755, "total_steps": 7776, "loss": 0.5198, "learning_rate": 1.5805614940118928e-06, "epoch": 15.405128205128205, "percentage": 48.29, "elapsed_time": "7:35:33", "remaining_time": "8:07:49", "throughput": 2121.01, "total_tokens": 57974624} {"current_steps": 3760, "total_steps": 7776, "loss": 0.5164, "learning_rate": 1.577535619508542e-06, "epoch": 15.425641025641026, "percentage": 48.35, "elapsed_time": "7:35:59", "remaining_time": "8:07:01", "throughput": 2121.88, "total_tokens": 58052576} {"current_steps": 3765, "total_steps": 7776, "loss": 0.4699, "learning_rate": 1.5745094286111004e-06, "epoch": 15.446153846153846, "percentage": 48.42, "elapsed_time": "7:36:21", "remaining_time": "8:06:10", "throughput": 2122.87, "total_tokens": 58126592} {"current_steps": 3770, "total_steps": 7776, "loss": 0.4804, "learning_rate": 1.5714829336683297e-06, "epoch": 15.466666666666667, "percentage": 48.48, "elapsed_time": "7:36:49", "remaining_time": "8:05:25", "throughput": 2123.9, "total_tokens": 58214784} {"current_steps": 3775, "total_steps": 7776, "loss": 0.4731, "learning_rate": 1.5684561470302337e-06, "epoch": 15.487179487179487, "percentage": 48.55, "elapsed_time": "7:37:09", "remaining_time": "8:04:31", "throughput": 2124.92, "total_tokens": 58284480} {"current_steps": 3780, "total_steps": 7776, "loss": 0.5115, "learning_rate": 1.5654290810480041e-06, "epoch": 15.507692307692308, "percentage": 48.61, "elapsed_time": "7:37:30", "remaining_time": "8:03:39", "throughput": 2125.99, "total_tokens": 58359488} {"current_steps": 3785, "total_steps": 7776, "loss": 0.4713, "learning_rate": 1.562401748073975e-06, "epoch": 15.528205128205128, "percentage": 48.68, "elapsed_time": "7:37:49", "remaining_time": "8:02:44", "throughput": 2127.26, "total_tokens": 58433632} {"current_steps": 3790, "total_steps": 7776, "loss": 0.5218, "learning_rate": 1.5593741604615679e-06, "epoch": 15.548717948717949, "percentage": 48.74, "elapsed_time": "7:38:36", "remaining_time": "8:02:19", "throughput": 2126.97, "total_tokens": 58526048} {"current_steps": 3795, "total_steps": 7776, "loss": 0.4432, "learning_rate": 1.5563463305652454e-06, "epoch": 15.569230769230769, "percentage": 48.8, "elapsed_time": "7:38:53", "remaining_time": "8:01:23", "throughput": 2128.05, "total_tokens": 58593440} {"current_steps": 3800, "total_steps": 7776, "loss": 0.4793, "learning_rate": 1.5533182707404563e-06, "epoch": 15.58974358974359, "percentage": 48.87, "elapsed_time": "7:39:10", "remaining_time": "8:00:26", "throughput": 2129.39, "total_tokens": 58664832} {"current_steps": 3805, "total_steps": 7776, "loss": 0.4287, "learning_rate": 1.550289993343591e-06, "epoch": 15.61025641025641, "percentage": 48.93, "elapsed_time": "7:39:25", "remaining_time": "7:59:28", "throughput": 2130.71, "total_tokens": 58734976} {"current_steps": 3810, "total_steps": 7776, "loss": 0.5701, "learning_rate": 1.547261510731924e-06, "epoch": 15.63076923076923, "percentage": 49.0, "elapsed_time": "7:41:24", "remaining_time": "8:00:18", "throughput": 2124.84, "total_tokens": 58826304} {"current_steps": 3815, "total_steps": 7776, "loss": 0.4858, "learning_rate": 1.5442328352635706e-06, "epoch": 15.65128205128205, "percentage": 49.06, "elapsed_time": "7:42:08", "remaining_time": "7:59:50", "throughput": 2124.04, "total_tokens": 58897216} {"current_steps": 3820, "total_steps": 7776, "loss": 0.4541, "learning_rate": 1.54120397929743e-06, "epoch": 15.671794871794871, "percentage": 49.13, "elapsed_time": "7:42:52", "remaining_time": "7:59:21", "throughput": 2123.32, "total_tokens": 58970880} {"current_steps": 3825, "total_steps": 7776, "loss": 0.5178, "learning_rate": 1.5381749551931405e-06, "epoch": 15.692307692307692, "percentage": 49.19, "elapsed_time": "7:43:41", "remaining_time": "7:58:58", "throughput": 2122.4, "total_tokens": 59049408} {"current_steps": 3830, "total_steps": 7776, "loss": 0.4799, "learning_rate": 1.5351457753110244e-06, "epoch": 15.712820512820512, "percentage": 49.25, "elapsed_time": "7:44:25", "remaining_time": "7:58:29", "throughput": 2121.71, "total_tokens": 59122336} {"current_steps": 3835, "total_steps": 7776, "loss": 0.4284, "learning_rate": 1.5321164520120421e-06, "epoch": 15.733333333333333, "percentage": 49.32, "elapsed_time": "7:45:08", "remaining_time": "7:58:00", "throughput": 2121.1, "total_tokens": 59197600} {"current_steps": 3840, "total_steps": 7776, "loss": 0.4343, "learning_rate": 1.5290869976577366e-06, "epoch": 15.753846153846155, "percentage": 49.38, "elapsed_time": "7:45:48", "remaining_time": "7:57:27", "throughput": 2120.63, "total_tokens": 59268224} {"current_steps": 3845, "total_steps": 7776, "loss": 0.4371, "learning_rate": 1.5260574246101875e-06, "epoch": 15.774358974358975, "percentage": 49.45, "elapsed_time": "7:46:29", "remaining_time": "7:56:55", "throughput": 2120.13, "total_tokens": 59341408} {"current_steps": 3850, "total_steps": 7776, "loss": 0.5017, "learning_rate": 1.5230277452319585e-06, "epoch": 15.794871794871796, "percentage": 49.51, "elapsed_time": "7:47:18", "remaining_time": "7:56:32", "throughput": 2119.34, "total_tokens": 59423648} {"current_steps": 3855, "total_steps": 7776, "loss": 0.4473, "learning_rate": 1.519997971886046e-06, "epoch": 15.815384615384616, "percentage": 49.58, "elapsed_time": "7:47:56", "remaining_time": "7:55:57", "throughput": 2119.06, "total_tokens": 59495872} {"current_steps": 3860, "total_steps": 7776, "loss": 0.4693, "learning_rate": 1.5169681169358314e-06, "epoch": 15.835897435897436, "percentage": 49.64, "elapsed_time": "7:48:40", "remaining_time": "7:55:28", "throughput": 2118.54, "total_tokens": 59574880} {"current_steps": 3865, "total_steps": 7776, "loss": 0.4955, "learning_rate": 1.513938192745028e-06, "epoch": 15.856410256410257, "percentage": 49.7, "elapsed_time": "7:49:33", "remaining_time": "7:55:09", "throughput": 2117.48, "total_tokens": 59657472} {"current_steps": 3870, "total_steps": 7776, "loss": 0.4219, "learning_rate": 1.5109082116776328e-06, "epoch": 15.876923076923077, "percentage": 49.77, "elapsed_time": "7:50:13", "remaining_time": "7:54:35", "throughput": 2117.22, "total_tokens": 59733888} {"current_steps": 3875, "total_steps": 7776, "loss": 0.4462, "learning_rate": 1.5078781860978732e-06, "epoch": 15.897435897435898, "percentage": 49.83, "elapsed_time": "7:50:53", "remaining_time": "7:54:03", "throughput": 2116.95, "total_tokens": 59811392} {"current_steps": 3880, "total_steps": 7776, "loss": 0.4938, "learning_rate": 1.5048481283701594e-06, "epoch": 15.917948717948718, "percentage": 49.9, "elapsed_time": "7:51:31", "remaining_time": "7:53:28", "throughput": 2116.78, "total_tokens": 59886784} {"current_steps": 3885, "total_steps": 7776, "loss": 0.4465, "learning_rate": 1.501818050859033e-06, "epoch": 15.938461538461539, "percentage": 49.96, "elapsed_time": "7:52:06", "remaining_time": "7:52:50", "throughput": 2116.68, "total_tokens": 59959072} {"current_steps": 3890, "total_steps": 7776, "loss": 0.462, "learning_rate": 1.498787965929116e-06, "epoch": 15.95897435897436, "percentage": 50.03, "elapsed_time": "7:52:41", "remaining_time": "7:52:12", "throughput": 2116.68, "total_tokens": 60032832} {"current_steps": 3895, "total_steps": 7776, "loss": 0.5279, "learning_rate": 1.49575788594506e-06, "epoch": 15.97948717948718, "percentage": 50.09, "elapsed_time": "7:53:43", "remaining_time": "7:52:01", "throughput": 2115.1, "total_tokens": 60119456} {"current_steps": 3900, "total_steps": 7776, "loss": 0.4908, "learning_rate": 1.4927278232714975e-06, "epoch": 16.0, "percentage": 50.15, "elapsed_time": "7:54:27", "remaining_time": "7:51:31", "throughput": 2114.87, "total_tokens": 60204448} {"current_steps": 3905, "total_steps": 7776, "loss": 0.4607, "learning_rate": 1.4896977902729893e-06, "epoch": 16.02051282051282, "percentage": 50.22, "elapsed_time": "7:55:00", "remaining_time": "7:50:52", "throughput": 2115.01, "total_tokens": 60279104} {"current_steps": 3910, "total_steps": 7776, "loss": 0.4405, "learning_rate": 1.4866677993139761e-06, "epoch": 16.04102564102564, "percentage": 50.28, "elapsed_time": "7:55:31", "remaining_time": "7:50:09", "throughput": 2115.22, "total_tokens": 60349504} {"current_steps": 3915, "total_steps": 7776, "loss": 0.4744, "learning_rate": 1.4836378627587266e-06, "epoch": 16.06153846153846, "percentage": 50.35, "elapsed_time": "7:56:01", "remaining_time": "7:49:27", "throughput": 2115.46, "total_tokens": 60420640} {"current_steps": 3920, "total_steps": 7776, "loss": 0.4868, "learning_rate": 1.4806079929712874e-06, "epoch": 16.08205128205128, "percentage": 50.41, "elapsed_time": "7:56:35", "remaining_time": "7:48:48", "throughput": 2115.64, "total_tokens": 60497728} {"current_steps": 3925, "total_steps": 7776, "loss": 0.5095, "learning_rate": 1.477578202315433e-06, "epoch": 16.102564102564102, "percentage": 50.48, "elapsed_time": "7:57:10", "remaining_time": "7:48:10", "throughput": 2115.91, "total_tokens": 60579008} {"current_steps": 3930, "total_steps": 7776, "loss": 0.5101, "learning_rate": 1.4745485031546143e-06, "epoch": 16.123076923076923, "percentage": 50.54, "elapsed_time": "7:57:49", "remaining_time": "7:47:36", "throughput": 2115.76, "total_tokens": 60657088} {"current_steps": 3935, "total_steps": 7776, "loss": 0.4938, "learning_rate": 1.4715189078519094e-06, "epoch": 16.143589743589743, "percentage": 50.6, "elapsed_time": "7:58:23", "remaining_time": "7:46:58", "throughput": 2115.9, "total_tokens": 60734560} {"current_steps": 3940, "total_steps": 7776, "loss": 0.4785, "learning_rate": 1.468489428769973e-06, "epoch": 16.164102564102564, "percentage": 50.67, "elapsed_time": "7:59:02", "remaining_time": "7:46:23", "throughput": 2115.81, "total_tokens": 60812960} {"current_steps": 3945, "total_steps": 7776, "loss": 0.4953, "learning_rate": 1.4654600782709843e-06, "epoch": 16.184615384615384, "percentage": 50.73, "elapsed_time": "7:59:34", "remaining_time": "7:45:43", "throughput": 2116.18, "total_tokens": 60892768} {"current_steps": 3950, "total_steps": 7776, "loss": 0.4472, "learning_rate": 1.4624308687165985e-06, "epoch": 16.205128205128204, "percentage": 50.8, "elapsed_time": "8:00:00", "remaining_time": "7:44:56", "throughput": 2116.74, "total_tokens": 60964096} {"current_steps": 3955, "total_steps": 7776, "loss": 0.4191, "learning_rate": 1.4594018124678965e-06, "epoch": 16.225641025641025, "percentage": 50.86, "elapsed_time": "8:00:25", "remaining_time": "7:44:09", "throughput": 2117.34, "total_tokens": 61034304} {"current_steps": 3960, "total_steps": 7776, "loss": 0.465, "learning_rate": 1.4563729218853329e-06, "epoch": 16.246153846153845, "percentage": 50.93, "elapsed_time": "8:00:54", "remaining_time": "7:43:24", "throughput": 2118.0, "total_tokens": 61113024} {"current_steps": 3965, "total_steps": 7776, "loss": 0.4703, "learning_rate": 1.4533442093286853e-06, "epoch": 16.266666666666666, "percentage": 50.99, "elapsed_time": "8:01:18", "remaining_time": "7:42:36", "throughput": 2118.71, "total_tokens": 61184256} {"current_steps": 3970, "total_steps": 7776, "loss": 0.4773, "learning_rate": 1.4503156871570062e-06, "epoch": 16.287179487179486, "percentage": 51.05, "elapsed_time": "8:01:45", "remaining_time": "7:41:51", "throughput": 2119.41, "total_tokens": 61262208} {"current_steps": 3975, "total_steps": 7776, "loss": 0.4172, "learning_rate": 1.4472873677285706e-06, "epoch": 16.307692307692307, "percentage": 51.12, "elapsed_time": "8:02:07", "remaining_time": "7:41:01", "throughput": 2120.25, "total_tokens": 61334560} {"current_steps": 3980, "total_steps": 7776, "loss": 0.4326, "learning_rate": 1.4442592634008266e-06, "epoch": 16.328205128205127, "percentage": 51.18, "elapsed_time": "8:02:30", "remaining_time": "7:40:11", "throughput": 2121.08, "total_tokens": 61405888} {"current_steps": 3985, "total_steps": 7776, "loss": 0.5303, "learning_rate": 1.4412313865303438e-06, "epoch": 16.348717948717947, "percentage": 51.25, "elapsed_time": "8:03:01", "remaining_time": "7:39:30", "throughput": 2121.66, "total_tokens": 61489280} {"current_steps": 3990, "total_steps": 7776, "loss": 0.4726, "learning_rate": 1.4382037494727649e-06, "epoch": 16.369230769230768, "percentage": 51.31, "elapsed_time": "8:03:24", "remaining_time": "7:38:41", "throughput": 2122.53, "total_tokens": 61562912} {"current_steps": 3995, "total_steps": 7776, "loss": 0.458, "learning_rate": 1.435176364582752e-06, "epoch": 16.38974358974359, "percentage": 51.38, "elapsed_time": "8:03:54", "remaining_time": "7:37:58", "throughput": 2123.42, "total_tokens": 61652064} {"current_steps": 4000, "total_steps": 7776, "loss": 0.5266, "learning_rate": 1.4321492442139405e-06, "epoch": 16.41025641025641, "percentage": 51.44, "elapsed_time": "8:04:20", "remaining_time": "7:37:13", "throughput": 2124.45, "total_tokens": 61737536} {"current_steps": 4005, "total_steps": 7776, "loss": 0.4394, "learning_rate": 1.4291224007188849e-06, "epoch": 16.43076923076923, "percentage": 51.5, "elapsed_time": "8:04:55", "remaining_time": "7:36:35", "throughput": 2124.44, "total_tokens": 61811840} {"current_steps": 4010, "total_steps": 7776, "loss": 0.4474, "learning_rate": 1.4260958464490104e-06, "epoch": 16.45128205128205, "percentage": 51.57, "elapsed_time": "8:05:13", "remaining_time": "7:35:42", "throughput": 2125.59, "total_tokens": 61884288} {"current_steps": 4015, "total_steps": 7776, "loss": 0.5, "learning_rate": 1.4230695937545616e-06, "epoch": 16.47179487179487, "percentage": 51.63, "elapsed_time": "8:05:33", "remaining_time": "7:34:50", "throughput": 2126.73, "total_tokens": 61958944} {"current_steps": 4020, "total_steps": 7776, "loss": 0.4766, "learning_rate": 1.420043654984553e-06, "epoch": 16.49230769230769, "percentage": 51.7, "elapsed_time": "8:05:56", "remaining_time": "7:34:01", "throughput": 2127.76, "total_tokens": 62038016} {"current_steps": 4025, "total_steps": 7776, "loss": 0.4593, "learning_rate": 1.4170180424867176e-06, "epoch": 16.51282051282051, "percentage": 51.76, "elapsed_time": "8:06:12", "remaining_time": "7:33:06", "throughput": 2128.96, "total_tokens": 62107616} {"current_steps": 4030, "total_steps": 7776, "loss": 0.4446, "learning_rate": 1.4139927686074577e-06, "epoch": 16.533333333333335, "percentage": 51.83, "elapsed_time": "8:06:31", "remaining_time": "7:32:14", "throughput": 2130.37, "total_tokens": 62188352} {"current_steps": 4035, "total_steps": 7776, "loss": 0.4658, "learning_rate": 1.4109678456917926e-06, "epoch": 16.553846153846155, "percentage": 51.89, "elapsed_time": "8:07:10", "remaining_time": "7:31:41", "throughput": 2129.92, "total_tokens": 62259456} {"current_steps": 4040, "total_steps": 7776, "loss": 0.5363, "learning_rate": 1.4079432860833104e-06, "epoch": 16.574358974358976, "percentage": 51.95, "elapsed_time": "8:09:09", "remaining_time": "7:32:20", "throughput": 2124.62, "total_tokens": 62356448} {"current_steps": 4045, "total_steps": 7776, "loss": 0.5006, "learning_rate": 1.4049191021241176e-06, "epoch": 16.594871794871796, "percentage": 52.02, "elapsed_time": "8:09:52", "remaining_time": "7:31:51", "throughput": 2123.98, "total_tokens": 62429824} {"current_steps": 4050, "total_steps": 7776, "loss": 0.4638, "learning_rate": 1.4018953061547853e-06, "epoch": 16.615384615384617, "percentage": 52.08, "elapsed_time": "8:12:17", "remaining_time": "7:32:54", "throughput": 2116.46, "total_tokens": 62514528} {"current_steps": 4055, "total_steps": 7776, "loss": 0.4413, "learning_rate": 1.3988719105143038e-06, "epoch": 16.635897435897437, "percentage": 52.15, "elapsed_time": "8:13:13", "remaining_time": "7:32:35", "throughput": 2115.12, "total_tokens": 62593472} {"current_steps": 4060, "total_steps": 7776, "loss": 0.4506, "learning_rate": 1.395848927540028e-06, "epoch": 16.656410256410258, "percentage": 52.21, "elapsed_time": "8:14:13", "remaining_time": "7:32:21", "throughput": 2113.45, "total_tokens": 62671520} {"current_steps": 4065, "total_steps": 7776, "loss": 0.4616, "learning_rate": 1.39282636956763e-06, "epoch": 16.676923076923078, "percentage": 52.28, "elapsed_time": "8:15:14", "remaining_time": "7:32:07", "throughput": 2111.73, "total_tokens": 62749856} {"current_steps": 4070, "total_steps": 7776, "loss": 0.456, "learning_rate": 1.3898042489310471e-06, "epoch": 16.6974358974359, "percentage": 52.34, "elapsed_time": "8:15:56", "remaining_time": "7:31:35", "throughput": 2111.24, "total_tokens": 62823616} {"current_steps": 4075, "total_steps": 7776, "loss": 0.45, "learning_rate": 1.3867825779624325e-06, "epoch": 16.71794871794872, "percentage": 52.4, "elapsed_time": "8:17:00", "remaining_time": "7:31:23", "throughput": 2109.6, "total_tokens": 62908416} {"current_steps": 4080, "total_steps": 7776, "loss": 0.4563, "learning_rate": 1.3837613689921037e-06, "epoch": 16.73846153846154, "percentage": 52.47, "elapsed_time": "8:17:35", "remaining_time": "7:30:46", "throughput": 2109.39, "total_tokens": 62978016} {"current_steps": 4085, "total_steps": 7776, "loss": 0.4952, "learning_rate": 1.380740634348494e-06, "epoch": 16.75897435897436, "percentage": 52.53, "elapsed_time": "8:19:24", "remaining_time": "7:31:14", "throughput": 2104.71, "total_tokens": 63065952} {"current_steps": 4090, "total_steps": 7776, "loss": 0.4327, "learning_rate": 1.3777203863580993e-06, "epoch": 16.77948717948718, "percentage": 52.6, "elapsed_time": "8:20:03", "remaining_time": "7:30:40", "throughput": 2104.46, "total_tokens": 63141792} {"current_steps": 4095, "total_steps": 7776, "loss": 0.5152, "learning_rate": 1.3747006373454321e-06, "epoch": 16.8, "percentage": 52.66, "elapsed_time": "8:21:00", "remaining_time": "7:30:21", "throughput": 2103.23, "total_tokens": 63223520} {"current_steps": 4100, "total_steps": 7776, "loss": 0.4952, "learning_rate": 1.3716813996329669e-06, "epoch": 16.82051282051282, "percentage": 52.73, "elapsed_time": "8:21:36", "remaining_time": "7:29:43", "throughput": 2103.17, "total_tokens": 63297696} {"current_steps": 4105, "total_steps": 7776, "loss": 0.4873, "learning_rate": 1.3686626855410929e-06, "epoch": 16.84102564102564, "percentage": 52.79, "elapsed_time": "8:22:18", "remaining_time": "7:29:12", "throughput": 2102.88, "total_tokens": 63378304} {"current_steps": 4110, "total_steps": 7776, "loss": 0.4461, "learning_rate": 1.3656445073880615e-06, "epoch": 16.861538461538462, "percentage": 52.85, "elapsed_time": "8:22:56", "remaining_time": "7:28:36", "throughput": 2102.77, "total_tokens": 63454400} {"current_steps": 4115, "total_steps": 7776, "loss": 0.4612, "learning_rate": 1.3626268774899381e-06, "epoch": 16.882051282051282, "percentage": 52.92, "elapsed_time": "8:23:29", "remaining_time": "7:27:56", "throughput": 2102.85, "total_tokens": 63526400} {"current_steps": 4120, "total_steps": 7776, "loss": 0.5061, "learning_rate": 1.3596098081605505e-06, "epoch": 16.902564102564103, "percentage": 52.98, "elapsed_time": "8:24:25", "remaining_time": "7:27:36", "throughput": 2101.82, "total_tokens": 63612448} {"current_steps": 4125, "total_steps": 7776, "loss": 0.486, "learning_rate": 1.3565933117114385e-06, "epoch": 16.923076923076923, "percentage": 53.05, "elapsed_time": "8:25:04", "remaining_time": "7:27:02", "throughput": 2101.76, "total_tokens": 63693248} {"current_steps": 4130, "total_steps": 7776, "loss": 0.4772, "learning_rate": 1.3535774004518057e-06, "epoch": 16.943589743589744, "percentage": 53.11, "elapsed_time": "8:25:37", "remaining_time": "7:26:22", "throughput": 2101.88, "total_tokens": 63765504} {"current_steps": 4135, "total_steps": 7776, "loss": 0.457, "learning_rate": 1.3505620866884666e-06, "epoch": 16.964102564102564, "percentage": 53.18, "elapsed_time": "8:26:09", "remaining_time": "7:25:41", "throughput": 2102.11, "total_tokens": 63839616} {"current_steps": 4140, "total_steps": 7776, "loss": 0.4961, "learning_rate": 1.347547382725797e-06, "epoch": 16.984615384615385, "percentage": 53.24, "elapsed_time": "8:26:50", "remaining_time": "7:25:08", "throughput": 2102.05, "total_tokens": 63924736} {"current_steps": 4145, "total_steps": 7776, "loss": 0.5218, "learning_rate": 1.344533300865686e-06, "epoch": 17.005128205128205, "percentage": 53.31, "elapsed_time": "8:27:23", "remaining_time": "7:24:28", "throughput": 2102.24, "total_tokens": 64000256} {"current_steps": 4150, "total_steps": 7776, "loss": 0.4501, "learning_rate": 1.3415198534074823e-06, "epoch": 17.025641025641026, "percentage": 53.37, "elapsed_time": "8:27:58", "remaining_time": "7:23:50", "throughput": 2102.39, "total_tokens": 64077472} {"current_steps": 4155, "total_steps": 7776, "loss": 0.4704, "learning_rate": 1.3385070526479475e-06, "epoch": 17.046153846153846, "percentage": 53.43, "elapsed_time": "8:28:32", "remaining_time": "7:23:10", "throughput": 2102.65, "total_tokens": 64157024} {"current_steps": 4160, "total_steps": 7776, "loss": 0.485, "learning_rate": 1.3354949108812026e-06, "epoch": 17.066666666666666, "percentage": 53.5, "elapsed_time": "8:28:59", "remaining_time": "7:22:25", "throughput": 2103.06, "total_tokens": 64226656} {"current_steps": 4165, "total_steps": 7776, "loss": 0.4316, "learning_rate": 1.3324834403986815e-06, "epoch": 17.087179487179487, "percentage": 53.56, "elapsed_time": "8:29:29", "remaining_time": "7:21:43", "throughput": 2103.48, "total_tokens": 64302816} {"current_steps": 4170, "total_steps": 7776, "loss": 0.4781, "learning_rate": 1.3294726534890766e-06, "epoch": 17.107692307692307, "percentage": 53.63, "elapsed_time": "8:29:54", "remaining_time": "7:20:56", "throughput": 2104.03, "total_tokens": 64371840} {"current_steps": 4175, "total_steps": 7776, "loss": 0.4331, "learning_rate": 1.326462562438293e-06, "epoch": 17.128205128205128, "percentage": 53.69, "elapsed_time": "8:30:25", "remaining_time": "7:20:15", "throughput": 2104.48, "total_tokens": 64451776} {"current_steps": 4180, "total_steps": 7776, "loss": 0.4754, "learning_rate": 1.3234531795293945e-06, "epoch": 17.148717948717948, "percentage": 53.76, "elapsed_time": "8:30:51", "remaining_time": "7:19:29", "throughput": 2105.05, "total_tokens": 64523712} {"current_steps": 4185, "total_steps": 7776, "loss": 0.4983, "learning_rate": 1.3204445170425565e-06, "epoch": 17.16923076923077, "percentage": 53.82, "elapsed_time": "8:31:15", "remaining_time": "7:18:41", "throughput": 2105.72, "total_tokens": 64594272} {"current_steps": 4190, "total_steps": 7776, "loss": 0.4852, "learning_rate": 1.3174365872550138e-06, "epoch": 17.18974358974359, "percentage": 53.88, "elapsed_time": "8:31:45", "remaining_time": "7:17:59", "throughput": 2106.35, "total_tokens": 64677280} {"current_steps": 4195, "total_steps": 7776, "loss": 0.4843, "learning_rate": 1.3144294024410122e-06, "epoch": 17.21025641025641, "percentage": 53.95, "elapsed_time": "8:32:18", "remaining_time": "7:17:19", "throughput": 2106.71, "total_tokens": 64758080} {"current_steps": 4200, "total_steps": 7776, "loss": 0.4564, "learning_rate": 1.3114229748717563e-06, "epoch": 17.23076923076923, "percentage": 54.01, "elapsed_time": "8:32:42", "remaining_time": "7:16:32", "throughput": 2107.46, "total_tokens": 64830848} {"current_steps": 4205, "total_steps": 7776, "loss": 0.4432, "learning_rate": 1.308417316815362e-06, "epoch": 17.25128205128205, "percentage": 54.08, "elapsed_time": "8:33:11", "remaining_time": "7:15:48", "throughput": 2107.96, "total_tokens": 64907296} {"current_steps": 4210, "total_steps": 7776, "loss": 0.4901, "learning_rate": 1.3054124405368036e-06, "epoch": 17.27179487179487, "percentage": 54.14, "elapsed_time": "8:33:41", "remaining_time": "7:15:06", "throughput": 2108.52, "total_tokens": 64987392} {"current_steps": 4215, "total_steps": 7776, "loss": 0.5076, "learning_rate": 1.3024083582978668e-06, "epoch": 17.29230769230769, "percentage": 54.21, "elapsed_time": "8:34:28", "remaining_time": "7:14:39", "throughput": 2108.2, "total_tokens": 65077408} {"current_steps": 4220, "total_steps": 7776, "loss": 0.4818, "learning_rate": 1.2994050823570968e-06, "epoch": 17.31282051282051, "percentage": 54.27, "elapsed_time": "8:34:53", "remaining_time": "7:13:52", "throughput": 2109.12, "total_tokens": 65159104} {"current_steps": 4225, "total_steps": 7776, "loss": 0.4525, "learning_rate": 1.2964026249697475e-06, "epoch": 17.333333333333332, "percentage": 54.33, "elapsed_time": "8:35:19", "remaining_time": "7:13:06", "throughput": 2110.11, "total_tokens": 65242816} {"current_steps": 4230, "total_steps": 7776, "loss": 0.4444, "learning_rate": 1.293400998387734e-06, "epoch": 17.353846153846153, "percentage": 54.4, "elapsed_time": "8:35:39", "remaining_time": "7:12:16", "throughput": 2111.11, "total_tokens": 65317376} {"current_steps": 4235, "total_steps": 7776, "loss": 0.4897, "learning_rate": 1.2904002148595797e-06, "epoch": 17.374358974358973, "percentage": 54.46, "elapsed_time": "8:35:59", "remaining_time": "7:11:25", "throughput": 2112.18, "total_tokens": 65391264} {"current_steps": 4240, "total_steps": 7776, "loss": 0.5116, "learning_rate": 1.2874002866303695e-06, "epoch": 17.394871794871793, "percentage": 54.53, "elapsed_time": "8:36:17", "remaining_time": "7:10:34", "throughput": 2113.37, "total_tokens": 65467744} {"current_steps": 4245, "total_steps": 7776, "loss": 0.4498, "learning_rate": 1.2844012259416965e-06, "epoch": 17.415384615384614, "percentage": 54.59, "elapsed_time": "8:36:33", "remaining_time": "7:09:40", "throughput": 2114.47, "total_tokens": 65535680} {"current_steps": 4250, "total_steps": 7776, "loss": 0.4984, "learning_rate": 1.2814030450316151e-06, "epoch": 17.435897435897434, "percentage": 54.66, "elapsed_time": "8:36:52", "remaining_time": "7:08:49", "throughput": 2115.65, "total_tokens": 65611680} {"current_steps": 4255, "total_steps": 7776, "loss": 0.5276, "learning_rate": 1.2784057561345885e-06, "epoch": 17.456410256410255, "percentage": 54.72, "elapsed_time": "8:37:08", "remaining_time": "7:07:56", "throughput": 2116.89, "total_tokens": 65684160} {"current_steps": 4260, "total_steps": 7776, "loss": 0.4434, "learning_rate": 1.2754093714814407e-06, "epoch": 17.476923076923075, "percentage": 54.78, "elapsed_time": "8:37:51", "remaining_time": "7:07:24", "throughput": 2116.27, "total_tokens": 65755104} {"current_steps": 4265, "total_steps": 7776, "loss": 0.4743, "learning_rate": 1.2724139032993057e-06, "epoch": 17.4974358974359, "percentage": 54.85, "elapsed_time": "8:38:42", "remaining_time": "7:07:00", "throughput": 2115.38, "total_tokens": 65835072} {"current_steps": 4270, "total_steps": 7776, "loss": 0.4691, "learning_rate": 1.269419363811577e-06, "epoch": 17.51794871794872, "percentage": 54.91, "elapsed_time": "8:39:34", "remaining_time": "7:06:36", "throughput": 2114.44, "total_tokens": 65916704} {"current_steps": 4275, "total_steps": 7776, "loss": 0.5129, "learning_rate": 1.2664257652378598e-06, "epoch": 17.53846153846154, "percentage": 54.98, "elapsed_time": "8:40:23", "remaining_time": "7:06:10", "throughput": 2113.47, "total_tokens": 65989696} {"current_steps": 4280, "total_steps": 7776, "loss": 0.4868, "learning_rate": 1.2634331197939183e-06, "epoch": 17.55897435897436, "percentage": 55.04, "elapsed_time": "8:41:33", "remaining_time": "7:06:01", "throughput": 2111.37, "total_tokens": 66071744} {"current_steps": 4285, "total_steps": 7776, "loss": 0.489, "learning_rate": 1.2604414396916286e-06, "epoch": 17.57948717948718, "percentage": 55.11, "elapsed_time": "8:43:23", "remaining_time": "7:06:24", "throughput": 2106.52, "total_tokens": 66153024} {"current_steps": 4290, "total_steps": 7776, "loss": 0.4855, "learning_rate": 1.2574507371389267e-06, "epoch": 17.6, "percentage": 55.17, "elapsed_time": "8:43:59", "remaining_time": "7:05:47", "throughput": 2106.26, "total_tokens": 66220384} {"current_steps": 4295, "total_steps": 7776, "loss": 0.4791, "learning_rate": 1.25446102433976e-06, "epoch": 17.620512820512822, "percentage": 55.23, "elapsed_time": "8:45:01", "remaining_time": "7:05:31", "throughput": 2104.62, "total_tokens": 66298912} {"current_steps": 4300, "total_steps": 7776, "loss": 0.4563, "learning_rate": 1.2514723134940365e-06, "epoch": 17.641025641025642, "percentage": 55.3, "elapsed_time": "8:45:42", "remaining_time": "7:04:58", "throughput": 2104.24, "total_tokens": 66373120} {"current_steps": 4305, "total_steps": 7776, "loss": 0.4577, "learning_rate": 1.2484846167975767e-06, "epoch": 17.661538461538463, "percentage": 55.36, "elapsed_time": "8:46:27", "remaining_time": "7:04:27", "throughput": 2103.76, "total_tokens": 66452096} {"current_steps": 4310, "total_steps": 7776, "loss": 0.4875, "learning_rate": 1.2454979464420624e-06, "epoch": 17.682051282051283, "percentage": 55.43, "elapsed_time": "8:47:09", "remaining_time": "7:03:55", "throughput": 2103.44, "total_tokens": 66530784} {"current_steps": 4315, "total_steps": 7776, "loss": 0.4551, "learning_rate": 1.2425123146149863e-06, "epoch": 17.702564102564104, "percentage": 55.49, "elapsed_time": "8:47:50", "remaining_time": "7:03:22", "throughput": 2103.12, "total_tokens": 66607264} {"current_steps": 4320, "total_steps": 7776, "loss": 0.5378, "learning_rate": 1.2395277334996047e-06, "epoch": 17.723076923076924, "percentage": 55.56, "elapsed_time": "8:49:00", "remaining_time": "7:03:12", "throughput": 2101.17, "total_tokens": 66692608} {"current_steps": 4325, "total_steps": 7776, "loss": 0.4518, "learning_rate": 1.2365442152748846e-06, "epoch": 17.743589743589745, "percentage": 55.62, "elapsed_time": "8:49:42", "remaining_time": "7:02:40", "throughput": 2100.93, "total_tokens": 66773504} {"current_steps": 4330, "total_steps": 7776, "loss": 0.4412, "learning_rate": 1.2335617721154577e-06, "epoch": 17.764102564102565, "percentage": 55.68, "elapsed_time": "8:50:17", "remaining_time": "7:02:01", "throughput": 2100.9, "total_tokens": 66844928} {"current_steps": 4335, "total_steps": 7776, "loss": 0.5214, "learning_rate": 1.2305804161915671e-06, "epoch": 17.784615384615385, "percentage": 55.75, "elapsed_time": "8:51:03", "remaining_time": "7:01:32", "throughput": 2100.17, "total_tokens": 66918080} {"current_steps": 4340, "total_steps": 7776, "loss": 0.47, "learning_rate": 1.2276001596690205e-06, "epoch": 17.805128205128206, "percentage": 55.81, "elapsed_time": "8:51:36", "remaining_time": "7:00:52", "throughput": 2100.19, "total_tokens": 66988992} {"current_steps": 4345, "total_steps": 7776, "loss": 0.4545, "learning_rate": 1.2246210147091382e-06, "epoch": 17.825641025641026, "percentage": 55.88, "elapsed_time": "8:52:14", "remaining_time": "7:00:17", "throughput": 2100.15, "total_tokens": 67068288} {"current_steps": 4350, "total_steps": 7776, "loss": 0.4574, "learning_rate": 1.2216429934687062e-06, "epoch": 17.846153846153847, "percentage": 55.94, "elapsed_time": "8:52:49", "remaining_time": "6:59:38", "throughput": 2100.21, "total_tokens": 67142560} {"current_steps": 4355, "total_steps": 7776, "loss": 0.4717, "learning_rate": 1.2186661080999234e-06, "epoch": 17.866666666666667, "percentage": 56.01, "elapsed_time": "8:53:27", "remaining_time": "6:59:02", "throughput": 2100.24, "total_tokens": 67222560} {"current_steps": 4360, "total_steps": 7776, "loss": 0.4662, "learning_rate": 1.2156903707503544e-06, "epoch": 17.887179487179488, "percentage": 56.07, "elapsed_time": "8:54:09", "remaining_time": "6:58:30", "throughput": 2099.91, "total_tokens": 67301760} {"current_steps": 4365, "total_steps": 7776, "loss": 0.4958, "learning_rate": 1.2127157935628789e-06, "epoch": 17.907692307692308, "percentage": 56.13, "elapsed_time": "8:54:47", "remaining_time": "6:57:54", "throughput": 2099.93, "total_tokens": 67381856} {"current_steps": 4370, "total_steps": 7776, "loss": 0.5327, "learning_rate": 1.2097423886756433e-06, "epoch": 17.92820512820513, "percentage": 56.2, "elapsed_time": "8:55:27", "remaining_time": "6:57:20", "throughput": 2100.03, "total_tokens": 67467968} {"current_steps": 4375, "total_steps": 7776, "loss": 0.4606, "learning_rate": 1.2067701682220084e-06, "epoch": 17.94871794871795, "percentage": 56.26, "elapsed_time": "8:56:02", "remaining_time": "6:56:42", "throughput": 2100.22, "total_tokens": 67548672} {"current_steps": 4380, "total_steps": 7776, "loss": 0.4451, "learning_rate": 1.2037991443305043e-06, "epoch": 17.96923076923077, "percentage": 56.33, "elapsed_time": "8:56:33", "remaining_time": "6:56:01", "throughput": 2100.59, "total_tokens": 67625248} {"current_steps": 4385, "total_steps": 7776, "loss": 0.4416, "learning_rate": 1.2008293291247754e-06, "epoch": 17.98974358974359, "percentage": 56.39, "elapsed_time": "8:57:01", "remaining_time": "6:55:17", "throughput": 2100.98, "total_tokens": 67695808} {"current_steps": 4390, "total_steps": 7776, "loss": 0.4741, "learning_rate": 1.1978607347235367e-06, "epoch": 18.01025641025641, "percentage": 56.46, "elapsed_time": "8:57:51", "remaining_time": "6:54:50", "throughput": 2100.16, "total_tokens": 67774400} {"current_steps": 4395, "total_steps": 7776, "loss": 0.446, "learning_rate": 1.1948933732405205e-06, "epoch": 18.03076923076923, "percentage": 56.52, "elapsed_time": "8:58:17", "remaining_time": "6:54:05", "throughput": 2100.69, "total_tokens": 67846848} {"current_steps": 4400, "total_steps": 7776, "loss": 0.4315, "learning_rate": 1.191927256784427e-06, "epoch": 18.05128205128205, "percentage": 56.58, "elapsed_time": "8:58:43", "remaining_time": "6:53:20", "throughput": 2101.21, "total_tokens": 67917440} {"current_steps": 4405, "total_steps": 7776, "loss": 0.4055, "learning_rate": 1.1889623974588772e-06, "epoch": 18.07179487179487, "percentage": 56.65, "elapsed_time": "8:59:09", "remaining_time": "6:52:35", "throughput": 2101.78, "total_tokens": 67990656} {"current_steps": 4410, "total_steps": 7776, "loss": 0.499, "learning_rate": 1.185998807362362e-06, "epoch": 18.092307692307692, "percentage": 56.71, "elapsed_time": "8:59:39", "remaining_time": "6:51:54", "throughput": 2102.16, "total_tokens": 68067872} {"current_steps": 4415, "total_steps": 7776, "loss": 0.481, "learning_rate": 1.1830364985881924e-06, "epoch": 18.112820512820512, "percentage": 56.78, "elapsed_time": "9:00:07", "remaining_time": "6:51:10", "throughput": 2102.77, "total_tokens": 68145632} {"current_steps": 4420, "total_steps": 7776, "loss": 0.4931, "learning_rate": 1.1800754832244515e-06, "epoch": 18.133333333333333, "percentage": 56.84, "elapsed_time": "9:00:33", "remaining_time": "6:50:25", "throughput": 2103.43, "total_tokens": 68221472} {"current_steps": 4425, "total_steps": 7776, "loss": 0.4377, "learning_rate": 1.1771157733539442e-06, "epoch": 18.153846153846153, "percentage": 56.91, "elapsed_time": "9:00:56", "remaining_time": "6:49:38", "throughput": 2104.14, "total_tokens": 68292352} {"current_steps": 4430, "total_steps": 7776, "loss": 0.5265, "learning_rate": 1.174157381054148e-06, "epoch": 18.174358974358974, "percentage": 56.97, "elapsed_time": "9:01:23", "remaining_time": "6:48:55", "throughput": 2104.9, "total_tokens": 68374880} {"current_steps": 4435, "total_steps": 7776, "loss": 0.5103, "learning_rate": 1.1712003183971644e-06, "epoch": 18.194871794871794, "percentage": 57.03, "elapsed_time": "9:01:49", "remaining_time": "6:48:10", "throughput": 2105.73, "total_tokens": 68457280} {"current_steps": 4440, "total_steps": 7776, "loss": 0.5133, "learning_rate": 1.1682445974496686e-06, "epoch": 18.215384615384615, "percentage": 57.1, "elapsed_time": "9:02:16", "remaining_time": "6:47:26", "throughput": 2106.56, "total_tokens": 68540224} {"current_steps": 4445, "total_steps": 7776, "loss": 0.4805, "learning_rate": 1.1652902302728607e-06, "epoch": 18.235897435897435, "percentage": 57.16, "elapsed_time": "9:02:41", "remaining_time": "6:46:40", "throughput": 2107.43, "total_tokens": 68621056} {"current_steps": 4450, "total_steps": 7776, "loss": 0.4863, "learning_rate": 1.1623372289224172e-06, "epoch": 18.256410256410255, "percentage": 57.23, "elapsed_time": "9:03:02", "remaining_time": "6:45:52", "throughput": 2108.43, "total_tokens": 68697440} {"current_steps": 4455, "total_steps": 7776, "loss": 0.4685, "learning_rate": 1.1593856054484403e-06, "epoch": 18.276923076923076, "percentage": 57.29, "elapsed_time": "9:03:25", "remaining_time": "6:45:06", "throughput": 2109.41, "total_tokens": 68778944} {"current_steps": 4460, "total_steps": 7776, "loss": 0.4934, "learning_rate": 1.156435371895411e-06, "epoch": 18.297435897435896, "percentage": 57.36, "elapsed_time": "9:03:48", "remaining_time": "6:44:18", "throughput": 2110.45, "total_tokens": 68859712} {"current_steps": 4465, "total_steps": 7776, "loss": 0.4439, "learning_rate": 1.1534865403021366e-06, "epoch": 18.317948717948717, "percentage": 57.42, "elapsed_time": "9:04:05", "remaining_time": "6:43:28", "throughput": 2111.54, "total_tokens": 68932512} {"current_steps": 4470, "total_steps": 7776, "loss": 0.4295, "learning_rate": 1.1505391227017046e-06, "epoch": 18.338461538461537, "percentage": 57.48, "elapsed_time": "9:04:22", "remaining_time": "6:42:37", "throughput": 2112.69, "total_tokens": 69006080} {"current_steps": 4475, "total_steps": 7776, "loss": 0.4644, "learning_rate": 1.1475931311214338e-06, "epoch": 18.358974358974358, "percentage": 57.55, "elapsed_time": "9:04:40", "remaining_time": "6:41:46", "throughput": 2113.87, "total_tokens": 69081984} {"current_steps": 4480, "total_steps": 7776, "loss": 0.4899, "learning_rate": 1.144648577582821e-06, "epoch": 18.379487179487178, "percentage": 57.61, "elapsed_time": "9:05:03", "remaining_time": "6:41:00", "throughput": 2114.69, "total_tokens": 69158240} {"current_steps": 4485, "total_steps": 7776, "loss": 0.4763, "learning_rate": 1.141705474101498e-06, "epoch": 18.4, "percentage": 57.68, "elapsed_time": "9:06:02", "remaining_time": "6:40:40", "throughput": 2113.43, "total_tokens": 69241184} {"current_steps": 4490, "total_steps": 7776, "loss": 0.4784, "learning_rate": 1.138763832687177e-06, "epoch": 18.42051282051282, "percentage": 57.74, "elapsed_time": "9:06:57", "remaining_time": "6:40:17", "throughput": 2112.44, "total_tokens": 69326112} {"current_steps": 4495, "total_steps": 7776, "loss": 0.4624, "learning_rate": 1.1358236653436052e-06, "epoch": 18.44102564102564, "percentage": 57.81, "elapsed_time": "9:07:42", "remaining_time": "6:39:46", "throughput": 2111.87, "total_tokens": 69400832} {"current_steps": 4500, "total_steps": 7776, "loss": 0.4523, "learning_rate": 1.1328849840685143e-06, "epoch": 18.46153846153846, "percentage": 57.87, "elapsed_time": "9:08:28", "remaining_time": "6:39:17", "throughput": 2111.27, "total_tokens": 69478464} {"current_steps": 4505, "total_steps": 7776, "loss": 0.5372, "learning_rate": 1.1299478008535726e-06, "epoch": 18.48205128205128, "percentage": 57.93, "elapsed_time": "9:09:30", "remaining_time": "6:38:59", "throughput": 2109.76, "total_tokens": 69559712} {"current_steps": 4510, "total_steps": 7776, "loss": 0.4224, "learning_rate": 1.1270121276843342e-06, "epoch": 18.5025641025641, "percentage": 58.0, "elapsed_time": "9:10:28", "remaining_time": "6:38:37", "throughput": 2108.46, "total_tokens": 69638528} {"current_steps": 4515, "total_steps": 7776, "loss": 0.4726, "learning_rate": 1.1240779765401926e-06, "epoch": 18.523076923076925, "percentage": 58.06, "elapsed_time": "9:11:15", "remaining_time": "6:38:08", "throughput": 2107.91, "total_tokens": 69719264} {"current_steps": 4520, "total_steps": 7776, "loss": 0.4407, "learning_rate": 1.1211453593943293e-06, "epoch": 18.543589743589745, "percentage": 58.13, "elapsed_time": "9:11:59", "remaining_time": "6:37:37", "throughput": 2107.46, "total_tokens": 69798432} {"current_steps": 4525, "total_steps": 7776, "loss": 0.4594, "learning_rate": 1.118214288213667e-06, "epoch": 18.564102564102566, "percentage": 58.19, "elapsed_time": "9:12:38", "remaining_time": "6:37:02", "throughput": 2107.15, "total_tokens": 69869984} {"current_steps": 4530, "total_steps": 7776, "loss": 0.5029, "learning_rate": 1.1152847749588186e-06, "epoch": 18.584615384615386, "percentage": 58.26, "elapsed_time": "9:13:22", "remaining_time": "6:36:31", "throughput": 2106.72, "total_tokens": 69949088} {"current_steps": 4535, "total_steps": 7776, "loss": 0.4386, "learning_rate": 1.1123568315840419e-06, "epoch": 18.605128205128207, "percentage": 58.32, "elapsed_time": "9:14:01", "remaining_time": "6:35:56", "throughput": 2106.49, "total_tokens": 70023904} {"current_steps": 4540, "total_steps": 7776, "loss": 0.5118, "learning_rate": 1.1094304700371863e-06, "epoch": 18.625641025641027, "percentage": 58.38, "elapsed_time": "9:14:45", "remaining_time": "6:35:24", "throughput": 2105.99, "total_tokens": 70098400} {"current_steps": 4545, "total_steps": 7776, "loss": 0.4559, "learning_rate": 1.1065057022596483e-06, "epoch": 18.646153846153847, "percentage": 58.45, "elapsed_time": "9:15:28", "remaining_time": "6:34:53", "throughput": 2105.6, "total_tokens": 70176576} {"current_steps": 4550, "total_steps": 7776, "loss": 0.4418, "learning_rate": 1.1035825401863185e-06, "epoch": 18.666666666666668, "percentage": 58.51, "elapsed_time": "9:16:12", "remaining_time": "6:34:21", "throughput": 2105.16, "total_tokens": 70255264} {"current_steps": 4555, "total_steps": 7776, "loss": 0.435, "learning_rate": 1.100660995745538e-06, "epoch": 18.68717948717949, "percentage": 58.58, "elapsed_time": "9:16:45", "remaining_time": "6:33:41", "throughput": 2105.19, "total_tokens": 70324160} {"current_steps": 4560, "total_steps": 7776, "loss": 0.5499, "learning_rate": 1.0977410808590437e-06, "epoch": 18.70769230769231, "percentage": 58.64, "elapsed_time": "9:18:09", "remaining_time": "6:33:38", "throughput": 2102.51, "total_tokens": 70411616} {"current_steps": 4565, "total_steps": 7776, "loss": 0.4705, "learning_rate": 1.0948228074419269e-06, "epoch": 18.72820512820513, "percentage": 58.71, "elapsed_time": "9:18:43", "remaining_time": "6:33:00", "throughput": 2102.47, "total_tokens": 70482592} {"current_steps": 4570, "total_steps": 7776, "loss": 0.4466, "learning_rate": 1.0919061874025774e-06, "epoch": 18.74871794871795, "percentage": 58.77, "elapsed_time": "9:19:31", "remaining_time": "6:32:31", "throughput": 2101.93, "total_tokens": 70565120} {"current_steps": 4575, "total_steps": 7776, "loss": 0.4323, "learning_rate": 1.0889912326426393e-06, "epoch": 18.76923076923077, "percentage": 58.83, "elapsed_time": "9:20:02", "remaining_time": "6:31:50", "throughput": 2102.07, "total_tokens": 70635168} {"current_steps": 4580, "total_steps": 7776, "loss": 0.5235, "learning_rate": 1.0860779550569609e-06, "epoch": 18.78974358974359, "percentage": 58.9, "elapsed_time": "9:20:51", "remaining_time": "6:31:22", "throughput": 2101.54, "total_tokens": 70720096} {"current_steps": 4585, "total_steps": 7776, "loss": 0.4659, "learning_rate": 1.083166366533548e-06, "epoch": 18.81025641025641, "percentage": 58.96, "elapsed_time": "9:21:36", "remaining_time": "6:30:51", "throughput": 2101.31, "total_tokens": 70807648} {"current_steps": 4590, "total_steps": 7776, "loss": 0.4968, "learning_rate": 1.080256478953512e-06, "epoch": 18.83076923076923, "percentage": 59.03, "elapsed_time": "9:22:12", "remaining_time": "6:30:14", "throughput": 2101.48, "total_tokens": 70888832} {"current_steps": 4595, "total_steps": 7776, "loss": 0.5112, "learning_rate": 1.0773483041910247e-06, "epoch": 18.851282051282052, "percentage": 59.09, "elapsed_time": "9:22:50", "remaining_time": "6:29:38", "throughput": 2101.6, "total_tokens": 70971136} {"current_steps": 4600, "total_steps": 7776, "loss": 0.4414, "learning_rate": 1.0744418541132676e-06, "epoch": 18.871794871794872, "percentage": 59.16, "elapsed_time": "9:23:17", "remaining_time": "6:28:54", "throughput": 2101.9, "total_tokens": 71038816} {"current_steps": 4605, "total_steps": 7776, "loss": 0.4874, "learning_rate": 1.0715371405803858e-06, "epoch": 18.892307692307693, "percentage": 59.22, "elapsed_time": "9:23:48", "remaining_time": "6:28:14", "throughput": 2102.23, "total_tokens": 71114720} {"current_steps": 4610, "total_steps": 7776, "loss": 0.4571, "learning_rate": 1.0686341754454364e-06, "epoch": 18.912820512820513, "percentage": 59.28, "elapsed_time": "9:24:17", "remaining_time": "6:27:32", "throughput": 2102.62, "total_tokens": 71189856} {"current_steps": 4615, "total_steps": 7776, "loss": 0.4661, "learning_rate": 1.0657329705543439e-06, "epoch": 18.933333333333334, "percentage": 59.35, "elapsed_time": "9:24:50", "remaining_time": "6:26:52", "throughput": 2102.98, "total_tokens": 71271136} {"current_steps": 4620, "total_steps": 7776, "loss": 0.435, "learning_rate": 1.0628335377458477e-06, "epoch": 18.953846153846154, "percentage": 59.41, "elapsed_time": "9:25:17", "remaining_time": "6:26:09", "throughput": 2103.44, "total_tokens": 71343488} {"current_steps": 4625, "total_steps": 7776, "loss": 0.4845, "learning_rate": 1.0599358888514582e-06, "epoch": 18.974358974358974, "percentage": 59.48, "elapsed_time": "9:25:52", "remaining_time": "6:25:31", "throughput": 2103.48, "total_tokens": 71419104} {"current_steps": 4630, "total_steps": 7776, "loss": 0.5111, "learning_rate": 1.0570400356954044e-06, "epoch": 18.994871794871795, "percentage": 59.54, "elapsed_time": "9:26:24", "remaining_time": "6:24:51", "throughput": 2103.65, "total_tokens": 71491776} {"current_steps": 4635, "total_steps": 7776, "loss": 0.5006, "learning_rate": 1.0541459900945892e-06, "epoch": 19.015384615384615, "percentage": 59.61, "elapsed_time": "9:26:54", "remaining_time": "6:24:10", "throughput": 2104.19, "total_tokens": 71573184} {"current_steps": 4640, "total_steps": 7776, "loss": 0.4828, "learning_rate": 1.0512537638585379e-06, "epoch": 19.035897435897436, "percentage": 59.67, "elapsed_time": "9:27:23", "remaining_time": "6:23:28", "throughput": 2104.6, "total_tokens": 71648768} {"current_steps": 4645, "total_steps": 7776, "loss": 0.4607, "learning_rate": 1.0483633687893526e-06, "epoch": 19.056410256410256, "percentage": 59.74, "elapsed_time": "9:27:46", "remaining_time": "6:22:43", "throughput": 2105.32, "total_tokens": 71721824} {"current_steps": 4650, "total_steps": 7776, "loss": 0.497, "learning_rate": 1.0454748166816645e-06, "epoch": 19.076923076923077, "percentage": 59.8, "elapsed_time": "9:28:11", "remaining_time": "6:21:58", "throughput": 2106.01, "total_tokens": 71797568} {"current_steps": 4655, "total_steps": 7776, "loss": 0.4607, "learning_rate": 1.0425881193225808e-06, "epoch": 19.097435897435897, "percentage": 59.86, "elapsed_time": "9:28:34", "remaining_time": "6:21:12", "throughput": 2106.77, "total_tokens": 71871136} {"current_steps": 4660, "total_steps": 7776, "loss": 0.4232, "learning_rate": 1.0397032884916438e-06, "epoch": 19.117948717948718, "percentage": 59.93, "elapsed_time": "9:28:54", "remaining_time": "6:20:24", "throughput": 2107.58, "total_tokens": 71941984} {"current_steps": 4665, "total_steps": 7776, "loss": 0.5216, "learning_rate": 1.0368203359607767e-06, "epoch": 19.138461538461538, "percentage": 59.99, "elapsed_time": "9:29:23", "remaining_time": "6:19:43", "throughput": 2108.21, "total_tokens": 72024736} {"current_steps": 4670, "total_steps": 7776, "loss": 0.4565, "learning_rate": 1.0339392734942393e-06, "epoch": 19.15897435897436, "percentage": 60.06, "elapsed_time": "9:29:43", "remaining_time": "6:18:55", "throughput": 2109.08, "total_tokens": 72096064} {"current_steps": 4675, "total_steps": 7776, "loss": 0.4488, "learning_rate": 1.031060112848578e-06, "epoch": 19.17948717948718, "percentage": 60.12, "elapsed_time": "9:30:03", "remaining_time": "6:18:07", "throughput": 2110.04, "total_tokens": 72171168} {"current_steps": 4680, "total_steps": 7776, "loss": 0.4567, "learning_rate": 1.0281828657725798e-06, "epoch": 19.2, "percentage": 60.19, "elapsed_time": "9:30:24", "remaining_time": "6:17:21", "throughput": 2111.01, "total_tokens": 72249056} {"current_steps": 4685, "total_steps": 7776, "loss": 0.4556, "learning_rate": 1.0253075440072212e-06, "epoch": 19.22051282051282, "percentage": 60.25, "elapsed_time": "9:30:51", "remaining_time": "6:16:38", "throughput": 2111.99, "total_tokens": 72338944} {"current_steps": 4690, "total_steps": 7776, "loss": 0.4686, "learning_rate": 1.0224341592856245e-06, "epoch": 19.24102564102564, "percentage": 60.31, "elapsed_time": "9:31:09", "remaining_time": "6:15:48", "throughput": 2113.05, "total_tokens": 72412032} {"current_steps": 4695, "total_steps": 7776, "loss": 0.4087, "learning_rate": 1.0195627233330052e-06, "epoch": 19.26153846153846, "percentage": 60.38, "elapsed_time": "9:31:25", "remaining_time": "6:14:59", "throughput": 2114.17, "total_tokens": 72485760} {"current_steps": 4700, "total_steps": 7776, "loss": 0.4634, "learning_rate": 1.0166932478666292e-06, "epoch": 19.28205128205128, "percentage": 60.44, "elapsed_time": "9:31:44", "remaining_time": "6:14:10", "throughput": 2115.35, "total_tokens": 72565344} {"current_steps": 4705, "total_steps": 7776, "loss": 0.5316, "learning_rate": 1.0138257445957601e-06, "epoch": 19.3025641025641, "percentage": 60.51, "elapsed_time": "9:32:18", "remaining_time": "6:13:32", "throughput": 2115.57, "total_tokens": 72644800} {"current_steps": 4710, "total_steps": 7776, "loss": 0.4929, "learning_rate": 1.0109602252216153e-06, "epoch": 19.323076923076922, "percentage": 60.57, "elapsed_time": "9:33:12", "remaining_time": "6:13:08", "throughput": 2114.54, "total_tokens": 72725440} {"current_steps": 4715, "total_steps": 7776, "loss": 0.442, "learning_rate": 1.0080967014373152e-06, "epoch": 19.343589743589742, "percentage": 60.64, "elapsed_time": "9:33:55", "remaining_time": "6:12:35", "throughput": 2113.96, "total_tokens": 72796064} {"current_steps": 4720, "total_steps": 7776, "loss": 0.4442, "learning_rate": 1.0052351849278385e-06, "epoch": 19.364102564102563, "percentage": 60.7, "elapsed_time": "9:34:41", "remaining_time": "6:12:05", "throughput": 2113.3, "total_tokens": 72870080} {"current_steps": 4725, "total_steps": 7776, "loss": 0.4751, "learning_rate": 1.0023756873699723e-06, "epoch": 19.384615384615383, "percentage": 60.76, "elapsed_time": "9:35:27", "remaining_time": "6:11:34", "throughput": 2112.66, "total_tokens": 72944288} {"current_steps": 4730, "total_steps": 7776, "loss": 0.5129, "learning_rate": 9.995182204322637e-07, "epoch": 19.405128205128204, "percentage": 60.83, "elapsed_time": "9:36:18", "remaining_time": "6:11:07", "throughput": 2111.76, "total_tokens": 73021664} {"current_steps": 4735, "total_steps": 7776, "loss": 0.4796, "learning_rate": 9.966627957749767e-07, "epoch": 19.425641025641024, "percentage": 60.89, "elapsed_time": "9:37:01", "remaining_time": "6:10:35", "throughput": 2111.33, "total_tokens": 73097920} {"current_steps": 4740, "total_steps": 7776, "loss": 0.4785, "learning_rate": 9.93809425050039e-07, "epoch": 19.446153846153845, "percentage": 60.96, "elapsed_time": "9:37:41", "remaining_time": "6:10:00", "throughput": 2111.01, "total_tokens": 73170112} {"current_steps": 4745, "total_steps": 7776, "loss": 0.4379, "learning_rate": 9.909581199009971e-07, "epoch": 19.466666666666665, "percentage": 61.02, "elapsed_time": "9:38:19", "remaining_time": "6:09:25", "throughput": 2110.74, "total_tokens": 73241312} {"current_steps": 4750, "total_steps": 7776, "loss": 0.5408, "learning_rate": 9.8810889196297e-07, "epoch": 19.487179487179485, "percentage": 61.09, "elapsed_time": "9:39:06", "remaining_time": "6:08:55", "throughput": 2110.14, "total_tokens": 73319936} {"current_steps": 4755, "total_steps": 7776, "loss": 0.4878, "learning_rate": 9.852617528625992e-07, "epoch": 19.50769230769231, "percentage": 61.15, "elapsed_time": "9:39:51", "remaining_time": "6:08:23", "throughput": 2109.67, "total_tokens": 73397824} {"current_steps": 4760, "total_steps": 7776, "loss": 0.4627, "learning_rate": 9.824167142180032e-07, "epoch": 19.52820512820513, "percentage": 61.21, "elapsed_time": "9:40:29", "remaining_time": "6:07:48", "throughput": 2109.44, "total_tokens": 73470688} {"current_steps": 4765, "total_steps": 7776, "loss": 0.4799, "learning_rate": 9.795737876387285e-07, "epoch": 19.54871794871795, "percentage": 61.28, "elapsed_time": "9:41:08", "remaining_time": "6:07:13", "throughput": 2109.23, "total_tokens": 73545792} {"current_steps": 4770, "total_steps": 7776, "loss": 0.428, "learning_rate": 9.76732984725704e-07, "epoch": 19.56923076923077, "percentage": 61.34, "elapsed_time": "9:41:44", "remaining_time": "6:06:36", "throughput": 2109.13, "total_tokens": 73617760} {"current_steps": 4775, "total_steps": 7776, "loss": 0.4608, "learning_rate": 9.738943170711916e-07, "epoch": 19.58974358974359, "percentage": 61.41, "elapsed_time": "9:43:27", "remaining_time": "6:06:41", "throughput": 2105.47, "total_tokens": 73707328} {"current_steps": 4780, "total_steps": 7776, "loss": 0.4951, "learning_rate": 9.710577962587412e-07, "epoch": 19.61025641025641, "percentage": 61.47, "elapsed_time": "9:44:17", "remaining_time": "6:06:13", "throughput": 2104.64, "total_tokens": 73782976} {"current_steps": 4785, "total_steps": 7776, "loss": 0.53, "learning_rate": 9.68223433863141e-07, "epoch": 19.630769230769232, "percentage": 61.54, "elapsed_time": "9:45:36", "remaining_time": "6:06:02", "throughput": 2102.44, "total_tokens": 73872256} {"current_steps": 4790, "total_steps": 7776, "loss": 0.45, "learning_rate": 9.653912414503731e-07, "epoch": 19.651282051282053, "percentage": 61.6, "elapsed_time": "9:46:13", "remaining_time": "6:05:26", "throughput": 2102.39, "total_tokens": 73947520} {"current_steps": 4795, "total_steps": 7776, "loss": 0.4218, "learning_rate": 9.625612305775626e-07, "epoch": 19.671794871794873, "percentage": 61.66, "elapsed_time": "9:46:49", "remaining_time": "6:04:49", "throughput": 2102.36, "total_tokens": 74023104} {"current_steps": 4800, "total_steps": 7776, "loss": 0.4531, "learning_rate": 9.597334127929346e-07, "epoch": 19.692307692307693, "percentage": 61.73, "elapsed_time": "9:47:39", "remaining_time": "6:04:20", "throughput": 2101.74, "total_tokens": 74105920} {"current_steps": 4805, "total_steps": 7776, "loss": 0.4142, "learning_rate": 9.569077996357638e-07, "epoch": 19.712820512820514, "percentage": 61.79, "elapsed_time": "9:48:13", "remaining_time": "6:03:42", "throughput": 2101.9, "total_tokens": 74182752} {"current_steps": 4810, "total_steps": 7776, "loss": 0.5121, "learning_rate": 9.54084402636329e-07, "epoch": 19.733333333333334, "percentage": 61.86, "elapsed_time": "9:49:26", "remaining_time": "6:03:28", "throughput": 2099.85, "total_tokens": 74265248} {"current_steps": 4815, "total_steps": 7776, "loss": 0.523, "learning_rate": 9.512632333158653e-07, "epoch": 19.753846153846155, "percentage": 61.92, "elapsed_time": "9:50:15", "remaining_time": "6:02:58", "throughput": 2099.75, "total_tokens": 74363232} {"current_steps": 4820, "total_steps": 7776, "loss": 0.5103, "learning_rate": 9.484443031865176e-07, "epoch": 19.774358974358975, "percentage": 61.99, "elapsed_time": "9:50:49", "remaining_time": "6:02:20", "throughput": 2099.97, "total_tokens": 74442848} {"current_steps": 4825, "total_steps": 7776, "loss": 0.4725, "learning_rate": 9.456276237512949e-07, "epoch": 19.794871794871796, "percentage": 62.05, "elapsed_time": "9:51:16", "remaining_time": "6:01:37", "throughput": 2100.33, "total_tokens": 74513376} {"current_steps": 4830, "total_steps": 7776, "loss": 0.4921, "learning_rate": 9.428132065040198e-07, "epoch": 19.815384615384616, "percentage": 62.11, "elapsed_time": "9:51:47", "remaining_time": "6:00:57", "throughput": 2100.63, "total_tokens": 74588928} {"current_steps": 4835, "total_steps": 7776, "loss": 0.4331, "learning_rate": 9.40001062929285e-07, "epoch": 19.835897435897436, "percentage": 62.18, "elapsed_time": "9:52:13", "remaining_time": "6:00:14", "throughput": 2101.08, "total_tokens": 74659040} {"current_steps": 4840, "total_steps": 7776, "loss": 0.44, "learning_rate": 9.371912045024046e-07, "epoch": 19.856410256410257, "percentage": 62.24, "elapsed_time": "9:52:43", "remaining_time": "5:59:32", "throughput": 2101.55, "total_tokens": 74737472} {"current_steps": 4845, "total_steps": 7776, "loss": 0.4831, "learning_rate": 9.343836426893687e-07, "epoch": 19.876923076923077, "percentage": 62.31, "elapsed_time": "9:53:09", "remaining_time": "5:58:50", "throughput": 2102.02, "total_tokens": 74810592} {"current_steps": 4850, "total_steps": 7776, "loss": 0.4494, "learning_rate": 9.315783889467943e-07, "epoch": 19.897435897435898, "percentage": 62.37, "elapsed_time": "9:53:34", "remaining_time": "5:58:06", "throughput": 2102.53, "total_tokens": 74880096} {"current_steps": 4855, "total_steps": 7776, "loss": 0.5063, "learning_rate": 9.287754547218821e-07, "epoch": 19.91794871794872, "percentage": 62.44, "elapsed_time": "9:53:58", "remaining_time": "5:57:21", "throughput": 2103.11, "total_tokens": 74951168} {"current_steps": 4860, "total_steps": 7776, "loss": 0.4975, "learning_rate": 9.259748514523654e-07, "epoch": 19.93846153846154, "percentage": 62.5, "elapsed_time": "9:54:35", "remaining_time": "5:56:45", "throughput": 2103.25, "total_tokens": 75034592} {"current_steps": 4865, "total_steps": 7776, "loss": 0.4802, "learning_rate": 9.231765905664677e-07, "epoch": 19.95897435897436, "percentage": 62.56, "elapsed_time": "9:55:00", "remaining_time": "5:56:01", "throughput": 2103.88, "total_tokens": 75108992} {"current_steps": 4870, "total_steps": 7776, "loss": 0.4473, "learning_rate": 9.20380683482853e-07, "epoch": 19.97948717948718, "percentage": 62.63, "elapsed_time": "9:55:26", "remaining_time": "5:55:18", "throughput": 2104.46, "total_tokens": 75185824} {"current_steps": 4875, "total_steps": 7776, "loss": 0.4971, "learning_rate": 9.175871416105802e-07, "epoch": 20.0, "percentage": 62.69, "elapsed_time": "9:55:52", "remaining_time": "5:54:35", "throughput": 2105.14, "total_tokens": 75263936} {"current_steps": 4880, "total_steps": 7776, "loss": 0.493, "learning_rate": 9.147959763490578e-07, "epoch": 20.02051282051282, "percentage": 62.76, "elapsed_time": "9:56:19", "remaining_time": "5:53:52", "throughput": 2105.76, "total_tokens": 75342752} {"current_steps": 4885, "total_steps": 7776, "loss": 0.4709, "learning_rate": 9.120071990879949e-07, "epoch": 20.04102564102564, "percentage": 62.82, "elapsed_time": "9:56:45", "remaining_time": "5:53:10", "throughput": 2106.37, "total_tokens": 75420704} {"current_steps": 4890, "total_steps": 7776, "loss": 0.5248, "learning_rate": 9.092208212073569e-07, "epoch": 20.06153846153846, "percentage": 62.89, "elapsed_time": "9:57:07", "remaining_time": "5:52:24", "throughput": 2107.21, "total_tokens": 75496128} {"current_steps": 4895, "total_steps": 7776, "loss": 0.525, "learning_rate": 9.064368540773177e-07, "epoch": 20.08205128205128, "percentage": 62.95, "elapsed_time": "9:57:34", "remaining_time": "5:51:42", "throughput": 2108.11, "total_tokens": 75585984} {"current_steps": 4900, "total_steps": 7776, "loss": 0.5186, "learning_rate": 9.036553090582145e-07, "epoch": 20.102564102564102, "percentage": 63.01, "elapsed_time": "9:58:01", "remaining_time": "5:51:00", "throughput": 2108.84, "total_tokens": 75668416} {"current_steps": 4905, "total_steps": 7776, "loss": 0.456, "learning_rate": 9.008761975004994e-07, "epoch": 20.123076923076923, "percentage": 63.08, "elapsed_time": "9:58:21", "remaining_time": "5:50:13", "throughput": 2109.83, "total_tokens": 75744960} {"current_steps": 4910, "total_steps": 7776, "loss": 0.4507, "learning_rate": 8.98099530744696e-07, "epoch": 20.143589743589743, "percentage": 63.14, "elapsed_time": "9:58:39", "remaining_time": "5:49:26", "throughput": 2110.82, "total_tokens": 75818688} {"current_steps": 4915, "total_steps": 7776, "loss": 0.4552, "learning_rate": 8.953253201213517e-07, "epoch": 20.164102564102564, "percentage": 63.21, "elapsed_time": "9:59:00", "remaining_time": "5:48:40", "throughput": 2111.9, "total_tokens": 75901824} {"current_steps": 4920, "total_steps": 7776, "loss": 0.4153, "learning_rate": 8.925535769509895e-07, "epoch": 20.184615384615384, "percentage": 63.27, "elapsed_time": "9:59:16", "remaining_time": "5:47:52", "throughput": 2112.92, "total_tokens": 75973248} {"current_steps": 4925, "total_steps": 7776, "loss": 0.4452, "learning_rate": 8.897843125440653e-07, "epoch": 20.205128205128204, "percentage": 63.34, "elapsed_time": "9:59:31", "remaining_time": "5:47:03", "throughput": 2113.98, "total_tokens": 76043840} {"current_steps": 4928, "total_steps": 7776, "epoch": 20.217435897435898, "percentage": 63.37, "elapsed_time": "10:00:17", "remaining_time": "5:46:55", "throughput": 2113.04, "total_tokens": 76105440}