{"current_steps": 5, "total_steps": 350, "loss": 1.887, "learning_rate": 1.4285714285714285e-05, "epoch": 0.028429282160625444, "percentage": 1.43, "elapsed_time": "0:11:18", "remaining_time": "12:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 350, "loss": 1.5936, "learning_rate": 2.857142857142857e-05, "epoch": 0.05685856432125089, "percentage": 2.86, "elapsed_time": "0:22:39", "remaining_time": "12:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 350, "loss": 0.5385, "learning_rate": 4.2857142857142856e-05, "epoch": 0.08528784648187633, "percentage": 4.29, "elapsed_time": "0:34:01", "remaining_time": "12:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 350, "loss": 0.4072, "learning_rate": 5.714285714285714e-05, "epoch": 0.11371712864250177, "percentage": 5.71, "elapsed_time": "0:45:24", "remaining_time": "12:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 350, "loss": 0.3629, "learning_rate": 7.142857142857143e-05, "epoch": 0.14214641080312723, "percentage": 7.14, "elapsed_time": "0:56:47", "remaining_time": "12:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 350, "loss": 0.3385, "learning_rate": 8.571428571428571e-05, "epoch": 0.17057569296375266, "percentage": 8.57, "elapsed_time": "1:08:12", "remaining_time": "12:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "loss": 0.3051, "learning_rate": 0.0001, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "1:19:31", "remaining_time": "11:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "eval_loss": 0.25876832008361816, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "1:46:13", "remaining_time": "15:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 350, "loss": 0.2997, "learning_rate": 9.993784606094612e-05, "epoch": 0.22743425728500355, "percentage": 11.43, "elapsed_time": "1:57:39", "remaining_time": "15:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 350, "loss": 0.2794, "learning_rate": 9.975153876827008e-05, "epoch": 0.255863539445629, "percentage": 12.86, "elapsed_time": "2:09:01", "remaining_time": "14:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 350, "loss": 0.2777, "learning_rate": 9.944154131125642e-05, "epoch": 0.28429282160625446, "percentage": 14.29, "elapsed_time": "2:20:25", "remaining_time": "14:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 350, "loss": 0.2866, "learning_rate": 9.900862439242719e-05, "epoch": 0.31272210376687987, "percentage": 15.71, "elapsed_time": "2:31:49", "remaining_time": "13:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 350, "loss": 0.2993, "learning_rate": 9.84538643114539e-05, "epoch": 0.3411513859275053, "percentage": 17.14, "elapsed_time": "2:43:17", "remaining_time": "13:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 350, "loss": 0.2459, "learning_rate": 9.777864028930705e-05, "epoch": 0.3695806680881308, "percentage": 18.57, "elapsed_time": "2:54:37", "remaining_time": "12:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "loss": 0.2726, "learning_rate": 9.698463103929542e-05, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "3:05:57", "remaining_time": "12:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "eval_loss": 0.24190224707126617, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "3:32:38", "remaining_time": "14:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 350, "loss": 0.2722, "learning_rate": 9.607381059352038e-05, "epoch": 0.42643923240938164, "percentage": 21.43, "elapsed_time": "3:44:05", "remaining_time": "13:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 350, "loss": 0.2427, "learning_rate": 9.504844339512095e-05, "epoch": 0.4548685145700071, "percentage": 22.86, "elapsed_time": "3:55:32", "remaining_time": "13:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 350, "loss": 0.2672, "learning_rate": 9.391107866851143e-05, "epoch": 0.48329779673063256, "percentage": 24.29, "elapsed_time": "4:06:54", "remaining_time": "12:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 350, "loss": 0.2195, "learning_rate": 9.266454408160779e-05, "epoch": 0.511727078891258, "percentage": 25.71, "elapsed_time": "4:18:16", "remaining_time": "12:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 350, "loss": 0.2454, "learning_rate": 9.131193871579975e-05, "epoch": 0.5401563610518835, "percentage": 27.14, "elapsed_time": "4:29:36", "remaining_time": "12:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 350, "loss": 0.3725, "learning_rate": 8.985662536114613e-05, "epoch": 0.5685856432125089, "percentage": 28.57, "elapsed_time": "4:40:59", "remaining_time": "11:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "loss": 0.2387, "learning_rate": 8.83022221559489e-05, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "4:52:18", "remaining_time": "11:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "eval_loss": 0.23953676223754883, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "5:18:59", "remaining_time": "12:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 350, "loss": 0.2324, "learning_rate": 8.665259359149132e-05, "epoch": 0.6254442075337597, "percentage": 31.43, "elapsed_time": "5:30:28", "remaining_time": "12:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 350, "loss": 0.2409, "learning_rate": 8.491184090430364e-05, "epoch": 0.6538734896943852, "percentage": 32.86, "elapsed_time": "5:41:50", "remaining_time": "11:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 350, "loss": 0.2512, "learning_rate": 8.308429187984297e-05, "epoch": 0.6823027718550106, "percentage": 34.29, "elapsed_time": "5:53:15", "remaining_time": "11:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 350, "loss": 0.2347, "learning_rate": 8.117449009293668e-05, "epoch": 0.7107320540156361, "percentage": 35.71, "elapsed_time": "6:04:36", "remaining_time": "10:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 350, "loss": 0.2357, "learning_rate": 7.91871836117395e-05, "epoch": 0.7391613361762616, "percentage": 37.14, "elapsed_time": "6:16:03", "remaining_time": "10:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 350, "loss": 0.2607, "learning_rate": 7.712731319328798e-05, "epoch": 0.767590618336887, "percentage": 38.57, "elapsed_time": "6:27:28", "remaining_time": "10:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "loss": 0.2508, "learning_rate": 7.500000000000001e-05, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "6:38:57", "remaining_time": "9:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "eval_loss": 0.22614409029483795, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "7:05:38", "remaining_time": "10:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 350, "loss": 0.2338, "learning_rate": 7.281053286765815e-05, "epoch": 0.8244491826581379, "percentage": 41.43, "elapsed_time": "7:17:07", "remaining_time": "10:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 350, "loss": 0.2547, "learning_rate": 7.056435515653059e-05, "epoch": 0.8528784648187633, "percentage": 42.86, "elapsed_time": "7:28:28", "remaining_time": "9:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 350, "loss": 0.2481, "learning_rate": 6.826705121831976e-05, "epoch": 0.8813077469793887, "percentage": 44.29, "elapsed_time": "7:39:56", "remaining_time": "9:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 350, "loss": 0.2431, "learning_rate": 6.592433251258423e-05, "epoch": 0.9097370291400142, "percentage": 45.71, "elapsed_time": "7:51:18", "remaining_time": "9:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 350, "loss": 0.228, "learning_rate": 6.354202340715026e-05, "epoch": 0.9381663113006397, "percentage": 47.14, "elapsed_time": "8:02:39", "remaining_time": "9:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 350, "loss": 0.2229, "learning_rate": 6.112604669781572e-05, "epoch": 0.9665955934612651, "percentage": 48.57, "elapsed_time": "8:14:06", "remaining_time": "8:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "loss": 0.2356, "learning_rate": 5.868240888334653e-05, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "8:25:33", "remaining_time": "8:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "eval_loss": 0.21728534996509552, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "8:52:16", "remaining_time": "8:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 350, "loss": 0.2172, "learning_rate": 5.621718523237427e-05, "epoch": 1.023454157782516, "percentage": 51.43, "elapsed_time": "9:03:32", "remaining_time": "8:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 350, "loss": 0.2047, "learning_rate": 5.373650467932122e-05, "epoch": 1.0518834399431414, "percentage": 52.86, "elapsed_time": "9:14:59", "remaining_time": "8:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 350, "loss": 0.2212, "learning_rate": 5.124653458690365e-05, "epoch": 1.080312722103767, "percentage": 54.29, "elapsed_time": "9:26:29", "remaining_time": "7:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 350, "loss": 0.211, "learning_rate": 4.875346541309637e-05, "epoch": 1.1087420042643923, "percentage": 55.71, "elapsed_time": "9:37:51", "remaining_time": "7:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 350, "loss": 0.2332, "learning_rate": 4.626349532067879e-05, "epoch": 1.1371712864250179, "percentage": 57.14, "elapsed_time": "9:49:13", "remaining_time": "7:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 350, "loss": 0.2216, "learning_rate": 4.378281476762576e-05, "epoch": 1.1656005685856432, "percentage": 58.57, "elapsed_time": "10:00:34", "remaining_time": "7:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "loss": 0.2079, "learning_rate": 4.131759111665349e-05, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "10:11:55", "remaining_time": "6:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "eval_loss": 0.22092726826667786, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "10:38:36", "remaining_time": "7:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 350, "loss": 0.2088, "learning_rate": 3.887395330218429e-05, "epoch": 1.2224591329068941, "percentage": 61.43, "elapsed_time": "10:50:03", "remaining_time": "6:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 350, "loss": 0.1963, "learning_rate": 3.6457976592849754e-05, "epoch": 1.2508884150675195, "percentage": 62.86, "elapsed_time": "11:01:27", "remaining_time": "6:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 350, "loss": 0.2277, "learning_rate": 3.4075667487415785e-05, "epoch": 1.279317697228145, "percentage": 64.29, "elapsed_time": "11:12:49", "remaining_time": "6:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 350, "loss": 0.2113, "learning_rate": 3.173294878168025e-05, "epoch": 1.3077469793887704, "percentage": 65.71, "elapsed_time": "11:24:11", "remaining_time": "5:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 350, "loss": 0.2135, "learning_rate": 2.9435644843469436e-05, "epoch": 1.336176261549396, "percentage": 67.14, "elapsed_time": "11:35:36", "remaining_time": "5:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 350, "loss": 0.2165, "learning_rate": 2.718946713234185e-05, "epoch": 1.3646055437100213, "percentage": 68.57, "elapsed_time": "11:46:59", "remaining_time": "5:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "loss": 0.2293, "learning_rate": 2.500000000000001e-05, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "11:58:21", "remaining_time": "5:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "eval_loss": 0.21432924270629883, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "12:25:04", "remaining_time": "5:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 350, "loss": 0.2125, "learning_rate": 2.2872686806712035e-05, "epoch": 1.4214641080312722, "percentage": 71.43, "elapsed_time": "12:36:33", "remaining_time": "5:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 350, "loss": 0.2045, "learning_rate": 2.0812816388260518e-05, "epoch": 1.4498933901918978, "percentage": 72.86, "elapsed_time": "12:47:54", "remaining_time": "4:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 350, "loss": 0.1835, "learning_rate": 1.8825509907063327e-05, "epoch": 1.4783226723525231, "percentage": 74.29, "elapsed_time": "12:59:16", "remaining_time": "4:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 350, "loss": 0.2045, "learning_rate": 1.691570812015704e-05, "epoch": 1.5067519545131485, "percentage": 75.71, "elapsed_time": "13:10:45", "remaining_time": "4:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 350, "loss": 0.2137, "learning_rate": 1.5088159095696363e-05, "epoch": 1.535181236673774, "percentage": 77.14, "elapsed_time": "13:22:08", "remaining_time": "3:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 350, "loss": 0.1994, "learning_rate": 1.3347406408508695e-05, "epoch": 1.5636105188343994, "percentage": 78.57, "elapsed_time": "13:33:30", "remaining_time": "3:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "loss": 0.2129, "learning_rate": 1.1697777844051105e-05, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "13:44:53", "remaining_time": "3:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "eval_loss": 0.2167833000421524, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "14:11:37", "remaining_time": "3:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 350, "loss": 0.2216, "learning_rate": 1.0143374638853891e-05, "epoch": 1.6204690831556503, "percentage": 81.43, "elapsed_time": "14:23:09", "remaining_time": "3:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 350, "loss": 0.2125, "learning_rate": 8.688061284200266e-06, "epoch": 1.6488983653162759, "percentage": 82.86, "elapsed_time": "14:34:30", "remaining_time": "3:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 350, "loss": 0.1947, "learning_rate": 7.33545591839222e-06, "epoch": 1.6773276474769012, "percentage": 84.29, "elapsed_time": "14:45:53", "remaining_time": "2:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 350, "loss": 0.2093, "learning_rate": 6.088921331488568e-06, "epoch": 1.7057569296375266, "percentage": 85.71, "elapsed_time": "14:57:18", "remaining_time": "2:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 350, "loss": 0.2002, "learning_rate": 4.951556604879048e-06, "epoch": 1.7341862117981521, "percentage": 87.14, "elapsed_time": "15:08:39", "remaining_time": "2:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 350, "loss": 0.1749, "learning_rate": 3.9261894064796135e-06, "epoch": 1.7626154939587777, "percentage": 88.57, "elapsed_time": "15:20:06", "remaining_time": "1:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "loss": 0.1974, "learning_rate": 3.0153689607045845e-06, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "15:31:29", "remaining_time": "1:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "eval_loss": 0.21316008269786835, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "15:58:13", "remaining_time": "1:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 350, "loss": 0.2004, "learning_rate": 2.221359710692961e-06, "epoch": 1.8194740582800284, "percentage": 91.43, "elapsed_time": "16:09:42", "remaining_time": "1:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 350, "loss": 0.207, "learning_rate": 1.5461356885461075e-06, "epoch": 1.847903340440654, "percentage": 92.86, "elapsed_time": "16:21:03", "remaining_time": "1:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 350, "loss": 0.1933, "learning_rate": 9.913756075728087e-07, "epoch": 1.8763326226012793, "percentage": 94.29, "elapsed_time": "16:32:25", "remaining_time": "1:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 350, "loss": 0.2096, "learning_rate": 5.584586887435739e-07, "epoch": 1.9047619047619047, "percentage": 95.71, "elapsed_time": "16:43:51", "remaining_time": "0:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 350, "loss": 0.1997, "learning_rate": 2.4846123172992954e-07, "epoch": 1.9331911869225302, "percentage": 97.14, "elapsed_time": "16:55:17", "remaining_time": "0:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 350, "loss": 0.2084, "learning_rate": 6.215393905388278e-08, "epoch": 1.9616204690831558, "percentage": 98.57, "elapsed_time": "17:06:40", "remaining_time": "0:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "loss": 0.2068, "learning_rate": 0.0, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "17:18:06", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "eval_loss": 0.2134595662355423, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "17:44:51", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "17:44:54", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}