{"current_steps": 1, "total_steps": 40, "loss": 1.4129, "learning_rate": 0.0001996917333733128, "epoch": 0.17391304347826086, "percentage": 2.5, "elapsed_time": "0:00:12", "remaining_time": "0:08:15", "throughput": "1290.60", "total_tokens": 16384} {"current_steps": 2, "total_steps": 40, "loss": 1.3486, "learning_rate": 0.00019876883405951377, "epoch": 0.34782608695652173, "percentage": 5.0, "elapsed_time": "0:00:24", "remaining_time": "0:07:49", "throughput": "1327.07", "total_tokens": 32768} {"current_steps": 3, "total_steps": 40, "loss": 1.394, "learning_rate": 0.00019723699203976766, "epoch": 0.5217391304347826, "percentage": 7.5, "elapsed_time": "0:00:36", "remaining_time": "0:07:32", "throughput": "1338.81", "total_tokens": 49152} {"current_steps": 4, "total_steps": 40, "loss": 1.3051, "learning_rate": 0.00019510565162951537, "epoch": 0.6956521739130435, "percentage": 10.0, "elapsed_time": "0:00:48", "remaining_time": "0:07:18", "throughput": "1343.63", "total_tokens": 65536} {"current_steps": 5, "total_steps": 40, "loss": 1.3236, "learning_rate": 0.0001923879532511287, "epoch": 0.8695652173913043, "percentage": 12.5, "elapsed_time": "0:01:01", "remaining_time": "0:07:10", "throughput": "1332.49", "total_tokens": 81920} {"current_steps": 6, "total_steps": 40, "loss": 1.4556, "learning_rate": 0.0001891006524188368, "epoch": 1.0434782608695652, "percentage": 15.0, "elapsed_time": "0:01:14", "remaining_time": "0:07:01", "throughput": "1321.22", "total_tokens": 98304} {"current_steps": 7, "total_steps": 40, "loss": 1.3086, "learning_rate": 0.00018526401643540922, "epoch": 1.2173913043478262, "percentage": 17.5, "elapsed_time": "0:01:26", "remaining_time": "0:06:49", "throughput": "1318.95", "total_tokens": 114688} {"current_steps": 8, "total_steps": 40, "loss": 1.1029, "learning_rate": 0.00018090169943749476, "epoch": 1.391304347826087, "percentage": 20.0, "elapsed_time": "0:01:39", "remaining_time": "0:06:39", "throughput": "1313.23", "total_tokens": 131072} {"current_steps": 9, "total_steps": 40, "loss": 1.2992, "learning_rate": 0.0001760405965600031, "epoch": 1.5652173913043477, "percentage": 22.5, "elapsed_time": "0:01:52", "remaining_time": "0:06:28", "throughput": "1307.87", "total_tokens": 147456} {"current_steps": 10, "total_steps": 40, "loss": 1.1914, "learning_rate": 0.00017071067811865476, "epoch": 1.7391304347826086, "percentage": 25.0, "elapsed_time": "0:02:05", "remaining_time": "0:06:16", "throughput": "1306.85", "total_tokens": 163840} {"current_steps": 11, "total_steps": 40, "loss": 1.2417, "learning_rate": 0.00016494480483301836, "epoch": 1.9130434782608696, "percentage": 27.5, "elapsed_time": "0:02:18", "remaining_time": "0:06:04", "throughput": "1303.78", "total_tokens": 180224} {"current_steps": 12, "total_steps": 40, "loss": 1.3909, "learning_rate": 0.00015877852522924732, "epoch": 2.0869565217391304, "percentage": 30.0, "elapsed_time": "0:02:31", "remaining_time": "0:05:52", "throughput": "1301.25", "total_tokens": 196608} {"current_steps": 13, "total_steps": 40, "loss": 1.1383, "learning_rate": 0.0001522498564715949, "epoch": 2.260869565217391, "percentage": 32.5, "elapsed_time": "0:02:43", "remaining_time": "0:05:40", "throughput": "1300.97", "total_tokens": 212992} {"current_steps": 14, "total_steps": 40, "loss": 1.2009, "learning_rate": 0.00014539904997395468, "epoch": 2.4347826086956523, "percentage": 35.0, "elapsed_time": "0:02:56", "remaining_time": "0:05:28", "throughput": "1298.29", "total_tokens": 229376} {"current_steps": 15, "total_steps": 40, "loss": 1.1918, "learning_rate": 0.000138268343236509, "epoch": 2.608695652173913, "percentage": 37.5, "elapsed_time": "0:03:09", "remaining_time": "0:05:15", "throughput": "1296.23", "total_tokens": 245760} {"current_steps": 16, "total_steps": 40, "loss": 1.0642, "learning_rate": 0.00013090169943749476, "epoch": 2.782608695652174, "percentage": 40.0, "elapsed_time": "0:03:22", "remaining_time": "0:05:03", "throughput": "1296.29", "total_tokens": 262144} {"current_steps": 17, "total_steps": 40, "loss": 1.2661, "learning_rate": 0.00012334453638559057, "epoch": 2.9565217391304346, "percentage": 42.5, "elapsed_time": "0:03:35", "remaining_time": "0:04:51", "throughput": "1294.50", "total_tokens": 278528} {"current_steps": 18, "total_steps": 40, "loss": 1.0416, "learning_rate": 0.0001156434465040231, "epoch": 3.130434782608696, "percentage": 45.0, "elapsed_time": "0:03:48", "remaining_time": "0:04:38", "throughput": "1293.00", "total_tokens": 294912} {"current_steps": 19, "total_steps": 40, "loss": 1.0564, "learning_rate": 0.0001078459095727845, "epoch": 3.3043478260869565, "percentage": 47.5, "elapsed_time": "0:04:00", "remaining_time": "0:04:26", "throughput": "1293.37", "total_tokens": 311296} {"current_steps": 20, "total_steps": 40, "loss": 0.9894, "learning_rate": 0.0001, "epoch": 3.4782608695652173, "percentage": 50.0, "elapsed_time": "0:04:13", "remaining_time": "0:04:13", "throughput": "1292.09", "total_tokens": 327680} {"current_steps": 21, "total_steps": 40, "loss": 1.0994, "learning_rate": 9.215409042721552e-05, "epoch": 3.6521739130434785, "percentage": 52.5, "elapsed_time": "0:04:26", "remaining_time": "0:04:01", "throughput": "1291.15", "total_tokens": 344064} {"current_steps": 22, "total_steps": 40, "loss": 1.3105, "learning_rate": 8.435655349597689e-05, "epoch": 3.8260869565217392, "percentage": 55.0, "elapsed_time": "0:04:39", "remaining_time": "0:03:48", "throughput": "1291.31", "total_tokens": 360448} {"current_steps": 23, "total_steps": 40, "loss": 1.0337, "learning_rate": 7.66554636144095e-05, "epoch": 4.0, "percentage": 57.5, "elapsed_time": "0:04:52", "remaining_time": "0:03:35", "throughput": "1290.40", "total_tokens": 376832} {"current_steps": 24, "total_steps": 40, "loss": 1.0329, "learning_rate": 6.909830056250527e-05, "epoch": 4.173913043478261, "percentage": 60.0, "elapsed_time": "0:05:04", "remaining_time": "0:03:23", "throughput": "1289.52", "total_tokens": 393216} {"current_steps": 25, "total_steps": 40, "loss": 0.9724, "learning_rate": 6.173165676349103e-05, "epoch": 4.3478260869565215, "percentage": 62.5, "elapsed_time": "0:05:17", "remaining_time": "0:03:10", "throughput": "1289.76", "total_tokens": 409600} {"current_steps": 26, "total_steps": 40, "loss": 1.1225, "learning_rate": 5.4600950026045326e-05, "epoch": 4.521739130434782, "percentage": 65.0, "elapsed_time": "0:05:30", "remaining_time": "0:02:57", "throughput": "1288.92", "total_tokens": 425984} {"current_steps": 27, "total_steps": 40, "loss": 0.95, "learning_rate": 4.7750143528405126e-05, "epoch": 4.695652173913043, "percentage": 67.5, "elapsed_time": "0:05:43", "remaining_time": "0:02:45", "throughput": "1288.18", "total_tokens": 442368} {"current_steps": 28, "total_steps": 40, "loss": 1.0672, "learning_rate": 4.12214747707527e-05, "epoch": 4.869565217391305, "percentage": 70.0, "elapsed_time": "0:05:56", "remaining_time": "0:02:32", "throughput": "1288.47", "total_tokens": 458752} {"current_steps": 29, "total_steps": 40, "loss": 0.997, "learning_rate": 3.5055195166981645e-05, "epoch": 5.043478260869565, "percentage": 72.5, "elapsed_time": "0:06:08", "remaining_time": "0:02:19", "throughput": "1287.83", "total_tokens": 475136} {"current_steps": 30, "total_steps": 40, "loss": 0.8303, "learning_rate": 2.9289321881345254e-05, "epoch": 5.217391304347826, "percentage": 75.0, "elapsed_time": "0:06:21", "remaining_time": "0:02:07", "throughput": "1287.20", "total_tokens": 491520} {"current_steps": 31, "total_steps": 40, "loss": 0.8613, "learning_rate": 2.3959403439996907e-05, "epoch": 5.391304347826087, "percentage": 77.5, "elapsed_time": "0:06:34", "remaining_time": "0:01:54", "throughput": "1287.49", "total_tokens": 507904} {"current_steps": 32, "total_steps": 40, "loss": 0.8735, "learning_rate": 1.9098300562505266e-05, "epoch": 5.565217391304348, "percentage": 80.0, "elapsed_time": "0:06:47", "remaining_time": "0:01:41", "throughput": "1286.95", "total_tokens": 524288} {"current_steps": 33, "total_steps": 40, "loss": 1.1102, "learning_rate": 1.4735983564590783e-05, "epoch": 5.739130434782608, "percentage": 82.5, "elapsed_time": "0:07:00", "remaining_time": "0:01:29", "throughput": "1286.34", "total_tokens": 540672} {"current_steps": 34, "total_steps": 40, "loss": 1.2143, "learning_rate": 1.0899347581163221e-05, "epoch": 5.913043478260869, "percentage": 85.0, "elapsed_time": "0:07:12", "remaining_time": "0:01:16", "throughput": "1286.56", "total_tokens": 557056} {"current_steps": 35, "total_steps": 40, "loss": 1.1449, "learning_rate": 7.612046748871327e-06, "epoch": 6.086956521739131, "percentage": 87.5, "elapsed_time": "0:07:25", "remaining_time": "0:01:03", "throughput": "1286.09", "total_tokens": 573440} {"current_steps": 36, "total_steps": 40, "loss": 1.0676, "learning_rate": 4.8943483704846475e-06, "epoch": 6.260869565217392, "percentage": 90.0, "elapsed_time": "0:07:38", "remaining_time": "0:00:50", "throughput": "1285.62", "total_tokens": 589824} {"current_steps": 37, "total_steps": 40, "loss": 0.981, "learning_rate": 2.7630079602323442e-06, "epoch": 6.434782608695652, "percentage": 92.5, "elapsed_time": "0:07:51", "remaining_time": "0:00:38", "throughput": "1285.96", "total_tokens": 606208} {"current_steps": 38, "total_steps": 40, "loss": 0.8797, "learning_rate": 1.231165940486234e-06, "epoch": 6.608695652173913, "percentage": 95.0, "elapsed_time": "0:08:04", "remaining_time": "0:00:25", "throughput": "1285.52", "total_tokens": 622592} {"current_steps": 39, "total_steps": 40, "loss": 0.8676, "learning_rate": 3.0826662668720364e-07, "epoch": 6.782608695652174, "percentage": 97.5, "elapsed_time": "0:08:17", "remaining_time": "0:00:12", "throughput": "1285.12", "total_tokens": 638976} {"current_steps": 40, "total_steps": 40, "loss": 1.0274, "learning_rate": 0.0, "epoch": 6.956521739130435, "percentage": 100.0, "elapsed_time": "0:08:29", "remaining_time": "0:00:00", "throughput": "1285.35", "total_tokens": 655360} {"current_steps": 40, "total_steps": 40, "epoch": 6.956521739130435, "percentage": 100.0, "elapsed_time": "0:08:29", "remaining_time": "0:00:00", "throughput": "1285.34", "total_tokens": 655360}