open-lilm / trainer_log.jsonl
0xtaipoian's picture
Upload folder using huggingface_hub
b9a0edf verified
raw
history blame contribute delete
No virus
248 kB
{"current_steps": 5, "total_steps": 5309, "loss": 4.0168, "learning_rate": 1e-05, "epoch": 0.0009416306689108865, "percentage": 0.09, "elapsed_time": "0:01:02", "remaining_time": "18:33:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 10, "total_steps": 5309, "loss": 3.4972, "learning_rate": 1e-05, "epoch": 0.001883261337821773, "percentage": 0.19, "elapsed_time": "0:01:56", "remaining_time": "17:10:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 15, "total_steps": 5309, "loss": 3.5447, "learning_rate": 1e-05, "epoch": 0.0028248920067326594, "percentage": 0.28, "elapsed_time": "0:02:48", "remaining_time": "16:30:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 5309, "loss": 3.4348, "learning_rate": 1e-05, "epoch": 0.003766522675643546, "percentage": 0.38, "elapsed_time": "0:03:48", "remaining_time": "16:47:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 25, "total_steps": 5309, "loss": 3.4288, "learning_rate": 1e-05, "epoch": 0.004708153344554432, "percentage": 0.47, "elapsed_time": "0:04:51", "remaining_time": "17:06:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 5309, "loss": 3.4199, "learning_rate": 1e-05, "epoch": 0.005649784013465319, "percentage": 0.57, "elapsed_time": "0:05:53", "remaining_time": "17:16:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 35, "total_steps": 5309, "loss": 3.4564, "learning_rate": 1e-05, "epoch": 0.006591414682376205, "percentage": 0.66, "elapsed_time": "0:06:56", "remaining_time": "17:26:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 5309, "loss": 3.4071, "learning_rate": 1e-05, "epoch": 0.007533045351287092, "percentage": 0.75, "elapsed_time": "0:07:53", "remaining_time": "17:20:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 45, "total_steps": 5309, "loss": 3.3169, "learning_rate": 1e-05, "epoch": 0.008474676020197977, "percentage": 0.85, "elapsed_time": "0:08:48", "remaining_time": "17:09:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 5309, "loss": 3.4083, "learning_rate": 1e-05, "epoch": 0.009416306689108865, "percentage": 0.94, "elapsed_time": "0:09:41", "remaining_time": "16:59:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 55, "total_steps": 5309, "loss": 3.3384, "learning_rate": 1e-05, "epoch": 0.01035793735801975, "percentage": 1.04, "elapsed_time": "0:10:36", "remaining_time": "16:53:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 5309, "loss": 3.2959, "learning_rate": 1e-05, "epoch": 0.011299568026930638, "percentage": 1.13, "elapsed_time": "0:11:31", "remaining_time": "16:48:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 65, "total_steps": 5309, "loss": 3.3513, "learning_rate": 1e-05, "epoch": 0.012241198695841523, "percentage": 1.22, "elapsed_time": "0:12:25", "remaining_time": "16:42:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 5309, "loss": 3.1843, "learning_rate": 1e-05, "epoch": 0.01318282936475241, "percentage": 1.32, "elapsed_time": "0:13:16", "remaining_time": "16:33:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 75, "total_steps": 5309, "loss": 3.2907, "learning_rate": 1e-05, "epoch": 0.014124460033663296, "percentage": 1.41, "elapsed_time": "0:14:09", "remaining_time": "16:28:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 5309, "loss": 3.3033, "learning_rate": 1e-05, "epoch": 0.015066090702574184, "percentage": 1.51, "elapsed_time": "0:15:02", "remaining_time": "16:23:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 85, "total_steps": 5309, "loss": 3.402, "learning_rate": 1e-05, "epoch": 0.01600772137148507, "percentage": 1.6, "elapsed_time": "0:15:56", "remaining_time": "16:19:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 5309, "loss": 3.3137, "learning_rate": 1e-05, "epoch": 0.016949352040395955, "percentage": 1.7, "elapsed_time": "0:16:49", "remaining_time": "16:15:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 95, "total_steps": 5309, "loss": 3.3074, "learning_rate": 1e-05, "epoch": 0.017890982709306842, "percentage": 1.79, "elapsed_time": "0:17:41", "remaining_time": "16:11:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 5309, "loss": 3.3329, "learning_rate": 1e-05, "epoch": 0.01883261337821773, "percentage": 1.88, "elapsed_time": "0:18:35", "remaining_time": "16:08:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 105, "total_steps": 5309, "loss": 3.3839, "learning_rate": 1e-05, "epoch": 0.019774244047128613, "percentage": 1.98, "elapsed_time": "0:19:25", "remaining_time": "16:02:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 5309, "loss": 3.3383, "learning_rate": 1e-05, "epoch": 0.0207158747160395, "percentage": 2.07, "elapsed_time": "0:20:18", "remaining_time": "15:59:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 115, "total_steps": 5309, "loss": 3.2845, "learning_rate": 1e-05, "epoch": 0.021657505384950388, "percentage": 2.17, "elapsed_time": "0:21:12", "remaining_time": "15:57:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 5309, "loss": 3.2918, "learning_rate": 1e-05, "epoch": 0.022599136053861275, "percentage": 2.26, "elapsed_time": "0:22:06", "remaining_time": "15:55:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 125, "total_steps": 5309, "loss": 3.3509, "learning_rate": 1e-05, "epoch": 0.02354076672277216, "percentage": 2.35, "elapsed_time": "0:22:58", "remaining_time": "15:52:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 5309, "loss": 3.3196, "learning_rate": 1e-05, "epoch": 0.024482397391683047, "percentage": 2.45, "elapsed_time": "0:23:53", "remaining_time": "15:51:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 135, "total_steps": 5309, "loss": 3.2702, "learning_rate": 1e-05, "epoch": 0.025424028060593934, "percentage": 2.54, "elapsed_time": "0:24:44", "remaining_time": "15:48:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 5309, "loss": 3.3639, "learning_rate": 1e-05, "epoch": 0.02636565872950482, "percentage": 2.64, "elapsed_time": "0:25:37", "remaining_time": "15:46:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 145, "total_steps": 5309, "loss": 3.3693, "learning_rate": 1e-05, "epoch": 0.027307289398415705, "percentage": 2.73, "elapsed_time": "0:26:32", "remaining_time": "15:45:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 5309, "loss": 3.2754, "learning_rate": 1e-05, "epoch": 0.028248920067326592, "percentage": 2.83, "elapsed_time": "0:27:26", "remaining_time": "15:43:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 155, "total_steps": 5309, "loss": 3.2058, "learning_rate": 1e-05, "epoch": 0.02919055073623748, "percentage": 2.92, "elapsed_time": "0:28:19", "remaining_time": "15:41:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 5309, "loss": 3.216, "learning_rate": 1e-05, "epoch": 0.030132181405148367, "percentage": 3.01, "elapsed_time": "0:29:13", "remaining_time": "15:40:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 165, "total_steps": 5309, "loss": 3.3169, "learning_rate": 1e-05, "epoch": 0.03107381207405925, "percentage": 3.11, "elapsed_time": "0:30:05", "remaining_time": "15:38:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 5309, "loss": 3.3579, "learning_rate": 1e-05, "epoch": 0.03201544274297014, "percentage": 3.2, "elapsed_time": "0:30:57", "remaining_time": "15:35:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 175, "total_steps": 5309, "loss": 3.3376, "learning_rate": 1e-05, "epoch": 0.032957073411881026, "percentage": 3.3, "elapsed_time": "0:31:48", "remaining_time": "15:33:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 5309, "loss": 3.2441, "learning_rate": 1e-05, "epoch": 0.03389870408079191, "percentage": 3.39, "elapsed_time": "0:32:41", "remaining_time": "15:31:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 185, "total_steps": 5309, "loss": 3.3118, "learning_rate": 1e-05, "epoch": 0.0348403347497028, "percentage": 3.48, "elapsed_time": "0:33:35", "remaining_time": "15:30:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 5309, "loss": 3.2795, "learning_rate": 1e-05, "epoch": 0.035781965418613684, "percentage": 3.58, "elapsed_time": "0:34:30", "remaining_time": "15:29:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 195, "total_steps": 5309, "loss": 3.1868, "learning_rate": 1e-05, "epoch": 0.03672359608752457, "percentage": 3.67, "elapsed_time": "0:35:22", "remaining_time": "15:27:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 5309, "loss": 3.2716, "learning_rate": 1e-05, "epoch": 0.03766522675643546, "percentage": 3.77, "elapsed_time": "0:36:16", "remaining_time": "15:26:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 205, "total_steps": 5309, "loss": 3.2368, "learning_rate": 1e-05, "epoch": 0.03860685742534634, "percentage": 3.86, "elapsed_time": "0:38:29", "remaining_time": "15:58:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 5309, "loss": 3.237, "learning_rate": 1e-05, "epoch": 0.03954848809425723, "percentage": 3.96, "elapsed_time": "0:39:22", "remaining_time": "15:55:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 215, "total_steps": 5309, "loss": 3.2724, "learning_rate": 1e-05, "epoch": 0.04049011876316812, "percentage": 4.05, "elapsed_time": "0:40:16", "remaining_time": "15:54:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 5309, "loss": 3.2741, "learning_rate": 1e-05, "epoch": 0.041431749432079, "percentage": 4.14, "elapsed_time": "0:41:08", "remaining_time": "15:51:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 225, "total_steps": 5309, "loss": 3.2725, "learning_rate": 1e-05, "epoch": 0.04237338010098989, "percentage": 4.24, "elapsed_time": "0:42:03", "remaining_time": "15:50:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 5309, "loss": 3.2604, "learning_rate": 1e-05, "epoch": 0.043315010769900776, "percentage": 4.33, "elapsed_time": "0:42:56", "remaining_time": "15:48:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 235, "total_steps": 5309, "loss": 3.3685, "learning_rate": 1e-05, "epoch": 0.04425664143881166, "percentage": 4.43, "elapsed_time": "0:43:48", "remaining_time": "15:45:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 5309, "loss": 3.3883, "learning_rate": 1e-05, "epoch": 0.04519827210772255, "percentage": 4.52, "elapsed_time": "0:44:42", "remaining_time": "15:44:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 245, "total_steps": 5309, "loss": 3.2377, "learning_rate": 1e-05, "epoch": 0.046139902776633435, "percentage": 4.61, "elapsed_time": "0:45:32", "remaining_time": "15:41:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 5309, "loss": 3.1805, "learning_rate": 1e-05, "epoch": 0.04708153344554432, "percentage": 4.71, "elapsed_time": "0:46:25", "remaining_time": "15:39:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 255, "total_steps": 5309, "loss": 3.1641, "learning_rate": 1e-05, "epoch": 0.04802316411445521, "percentage": 4.8, "elapsed_time": "0:47:19", "remaining_time": "15:38:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 5309, "loss": 3.2127, "learning_rate": 1e-05, "epoch": 0.04896479478336609, "percentage": 4.9, "elapsed_time": "0:48:13", "remaining_time": "15:36:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 265, "total_steps": 5309, "loss": 3.2503, "learning_rate": 1e-05, "epoch": 0.049906425452276984, "percentage": 4.99, "elapsed_time": "0:49:07", "remaining_time": "15:35:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 5309, "loss": 3.2276, "learning_rate": 1e-05, "epoch": 0.05084805612118787, "percentage": 5.09, "elapsed_time": "0:50:01", "remaining_time": "15:33:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 275, "total_steps": 5309, "loss": 3.2853, "learning_rate": 1e-05, "epoch": 0.05178968679009875, "percentage": 5.18, "elapsed_time": "0:50:52", "remaining_time": "15:31:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 5309, "loss": 3.3613, "learning_rate": 1e-05, "epoch": 0.05273131745900964, "percentage": 5.27, "elapsed_time": "0:51:46", "remaining_time": "15:29:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 285, "total_steps": 5309, "loss": 3.1688, "learning_rate": 1e-05, "epoch": 0.053672948127920526, "percentage": 5.37, "elapsed_time": "0:52:38", "remaining_time": "15:27:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 5309, "loss": 3.2417, "learning_rate": 1e-05, "epoch": 0.05461457879683141, "percentage": 5.46, "elapsed_time": "0:53:29", "remaining_time": "15:25:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 295, "total_steps": 5309, "loss": 3.3112, "learning_rate": 1e-05, "epoch": 0.0555562094657423, "percentage": 5.56, "elapsed_time": "0:54:21", "remaining_time": "15:23:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 5309, "loss": 3.2811, "learning_rate": 1e-05, "epoch": 0.056497840134653185, "percentage": 5.65, "elapsed_time": "0:55:13", "remaining_time": "15:21:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 305, "total_steps": 5309, "loss": 3.2543, "learning_rate": 1e-05, "epoch": 0.05743947080356407, "percentage": 5.74, "elapsed_time": "0:56:05", "remaining_time": "15:20:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 5309, "loss": 3.3047, "learning_rate": 1e-05, "epoch": 0.05838110147247496, "percentage": 5.84, "elapsed_time": "0:56:58", "remaining_time": "15:18:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 315, "total_steps": 5309, "loss": 3.2744, "learning_rate": 1e-05, "epoch": 0.059322732141385844, "percentage": 5.93, "elapsed_time": "0:57:51", "remaining_time": "15:17:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 5309, "loss": 3.3184, "learning_rate": 1e-05, "epoch": 0.060264362810296734, "percentage": 6.03, "elapsed_time": "0:58:45", "remaining_time": "15:16:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 325, "total_steps": 5309, "loss": 3.3169, "learning_rate": 1e-05, "epoch": 0.06120599347920762, "percentage": 6.12, "elapsed_time": "0:59:52", "remaining_time": "15:18:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 5309, "loss": 3.3267, "learning_rate": 1e-05, "epoch": 0.0621476241481185, "percentage": 6.22, "elapsed_time": "1:00:54", "remaining_time": "15:18:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 335, "total_steps": 5309, "loss": 3.1593, "learning_rate": 1e-05, "epoch": 0.06308925481702939, "percentage": 6.31, "elapsed_time": "1:01:55", "remaining_time": "15:19:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 5309, "loss": 3.252, "learning_rate": 1e-05, "epoch": 0.06403088548594028, "percentage": 6.4, "elapsed_time": "1:02:56", "remaining_time": "15:19:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 345, "total_steps": 5309, "loss": 3.3233, "learning_rate": 1e-05, "epoch": 0.06497251615485117, "percentage": 6.5, "elapsed_time": "1:03:55", "remaining_time": "15:19:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 5309, "loss": 3.1951, "learning_rate": 1e-05, "epoch": 0.06591414682376205, "percentage": 6.59, "elapsed_time": "1:04:51", "remaining_time": "15:18:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 355, "total_steps": 5309, "loss": 3.3024, "learning_rate": 1e-05, "epoch": 0.06685577749267294, "percentage": 6.69, "elapsed_time": "1:05:53", "remaining_time": "15:19:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 5309, "loss": 3.2833, "learning_rate": 1e-05, "epoch": 0.06779740816158382, "percentage": 6.78, "elapsed_time": "1:06:51", "remaining_time": "15:19:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 365, "total_steps": 5309, "loss": 3.3022, "learning_rate": 1e-05, "epoch": 0.0687390388304947, "percentage": 6.88, "elapsed_time": "1:07:48", "remaining_time": "15:18:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 5309, "loss": 3.1566, "learning_rate": 1e-05, "epoch": 0.0696806694994056, "percentage": 6.97, "elapsed_time": "1:08:43", "remaining_time": "15:17:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 375, "total_steps": 5309, "loss": 3.2279, "learning_rate": 1e-05, "epoch": 0.07062230016831648, "percentage": 7.06, "elapsed_time": "1:09:39", "remaining_time": "15:16:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 5309, "loss": 3.1227, "learning_rate": 1e-05, "epoch": 0.07156393083722737, "percentage": 7.16, "elapsed_time": "1:10:36", "remaining_time": "15:15:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 385, "total_steps": 5309, "loss": 3.2537, "learning_rate": 1e-05, "epoch": 0.07250556150613825, "percentage": 7.25, "elapsed_time": "1:11:32", "remaining_time": "15:15:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 5309, "loss": 3.335, "learning_rate": 1e-05, "epoch": 0.07344719217504914, "percentage": 7.35, "elapsed_time": "1:12:30", "remaining_time": "15:14:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 395, "total_steps": 5309, "loss": 3.2609, "learning_rate": 1e-05, "epoch": 0.07438882284396003, "percentage": 7.44, "elapsed_time": "1:13:28", "remaining_time": "15:14:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 5309, "loss": 3.1916, "learning_rate": 1e-05, "epoch": 0.07533045351287092, "percentage": 7.53, "elapsed_time": "1:14:23", "remaining_time": "15:13:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 405, "total_steps": 5309, "loss": 3.2404, "learning_rate": 1e-05, "epoch": 0.0762720841817818, "percentage": 7.63, "elapsed_time": "1:16:39", "remaining_time": "15:28:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 5309, "loss": 3.1984, "learning_rate": 1e-05, "epoch": 0.07721371485069269, "percentage": 7.72, "elapsed_time": "1:17:36", "remaining_time": "15:27:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 415, "total_steps": 5309, "loss": 3.2435, "learning_rate": 1e-05, "epoch": 0.07815534551960357, "percentage": 7.82, "elapsed_time": "1:18:32", "remaining_time": "15:26:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 5309, "loss": 3.271, "learning_rate": 1e-05, "epoch": 0.07909697618851445, "percentage": 7.91, "elapsed_time": "1:19:29", "remaining_time": "15:25:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 425, "total_steps": 5309, "loss": 3.2629, "learning_rate": 1e-05, "epoch": 0.08003860685742535, "percentage": 8.01, "elapsed_time": "1:20:24", "remaining_time": "15:24:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 430, "total_steps": 5309, "loss": 3.2466, "learning_rate": 1e-05, "epoch": 0.08098023752633624, "percentage": 8.1, "elapsed_time": "1:21:19", "remaining_time": "15:22:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 435, "total_steps": 5309, "loss": 3.303, "learning_rate": 1e-05, "epoch": 0.08192186819524712, "percentage": 8.19, "elapsed_time": "1:22:14", "remaining_time": "15:21:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 440, "total_steps": 5309, "loss": 3.1332, "learning_rate": 1e-05, "epoch": 0.082863498864158, "percentage": 8.29, "elapsed_time": "1:23:10", "remaining_time": "15:20:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 445, "total_steps": 5309, "loss": 3.2161, "learning_rate": 1e-05, "epoch": 0.08380512953306889, "percentage": 8.38, "elapsed_time": "1:24:04", "remaining_time": "15:19:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 450, "total_steps": 5309, "loss": 3.2558, "learning_rate": 1e-05, "epoch": 0.08474676020197978, "percentage": 8.48, "elapsed_time": "1:24:59", "remaining_time": "15:17:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 455, "total_steps": 5309, "loss": 3.1148, "learning_rate": 1e-05, "epoch": 0.08568839087089067, "percentage": 8.57, "elapsed_time": "1:25:54", "remaining_time": "15:16:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 460, "total_steps": 5309, "loss": 3.2366, "learning_rate": 1e-05, "epoch": 0.08663002153980155, "percentage": 8.66, "elapsed_time": "1:26:49", "remaining_time": "15:15:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 465, "total_steps": 5309, "loss": 3.3596, "learning_rate": 1e-05, "epoch": 0.08757165220871244, "percentage": 8.76, "elapsed_time": "1:27:43", "remaining_time": "15:13:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 470, "total_steps": 5309, "loss": 3.2823, "learning_rate": 1e-05, "epoch": 0.08851328287762332, "percentage": 8.85, "elapsed_time": "1:28:38", "remaining_time": "15:12:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 475, "total_steps": 5309, "loss": 3.2593, "learning_rate": 1e-05, "epoch": 0.0894549135465342, "percentage": 8.95, "elapsed_time": "1:29:34", "remaining_time": "15:11:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 480, "total_steps": 5309, "loss": 3.1761, "learning_rate": 1e-05, "epoch": 0.0903965442154451, "percentage": 9.04, "elapsed_time": "1:30:29", "remaining_time": "15:10:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 485, "total_steps": 5309, "loss": 3.2005, "learning_rate": 1e-05, "epoch": 0.09133817488435599, "percentage": 9.14, "elapsed_time": "1:31:22", "remaining_time": "15:08:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 490, "total_steps": 5309, "loss": 3.2414, "learning_rate": 1e-05, "epoch": 0.09227980555326687, "percentage": 9.23, "elapsed_time": "1:32:18", "remaining_time": "15:07:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 495, "total_steps": 5309, "loss": 3.2309, "learning_rate": 1e-05, "epoch": 0.09322143622217775, "percentage": 9.32, "elapsed_time": "1:33:13", "remaining_time": "15:06:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 500, "total_steps": 5309, "loss": 3.2978, "learning_rate": 1e-05, "epoch": 0.09416306689108864, "percentage": 9.42, "elapsed_time": "1:34:08", "remaining_time": "15:05:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 505, "total_steps": 5309, "loss": 3.2522, "learning_rate": 1e-05, "epoch": 0.09510469755999953, "percentage": 9.51, "elapsed_time": "1:35:02", "remaining_time": "15:04:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 510, "total_steps": 5309, "loss": 3.1128, "learning_rate": 1e-05, "epoch": 0.09604632822891042, "percentage": 9.61, "elapsed_time": "1:35:57", "remaining_time": "15:02:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 515, "total_steps": 5309, "loss": 3.2469, "learning_rate": 1e-05, "epoch": 0.0969879588978213, "percentage": 9.7, "elapsed_time": "1:36:50", "remaining_time": "15:01:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 520, "total_steps": 5309, "loss": 3.1663, "learning_rate": 1e-05, "epoch": 0.09792958956673219, "percentage": 9.79, "elapsed_time": "1:37:45", "remaining_time": "15:00:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 525, "total_steps": 5309, "loss": 3.2616, "learning_rate": 1e-05, "epoch": 0.09887122023564307, "percentage": 9.89, "elapsed_time": "1:38:38", "remaining_time": "14:58:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 530, "total_steps": 5309, "loss": 3.2367, "learning_rate": 1e-05, "epoch": 0.09981285090455397, "percentage": 9.98, "elapsed_time": "1:39:31", "remaining_time": "14:57:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 535, "total_steps": 5309, "loss": 3.1932, "learning_rate": 1e-05, "epoch": 0.10075448157346485, "percentage": 10.08, "elapsed_time": "1:40:26", "remaining_time": "14:56:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 540, "total_steps": 5309, "loss": 3.1863, "learning_rate": 1e-05, "epoch": 0.10169611224237574, "percentage": 10.17, "elapsed_time": "1:41:22", "remaining_time": "14:55:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 545, "total_steps": 5309, "loss": 3.3411, "learning_rate": 1e-05, "epoch": 0.10263774291128662, "percentage": 10.27, "elapsed_time": "1:42:16", "remaining_time": "14:53:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 550, "total_steps": 5309, "loss": 3.2209, "learning_rate": 1e-05, "epoch": 0.1035793735801975, "percentage": 10.36, "elapsed_time": "1:43:13", "remaining_time": "14:53:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 555, "total_steps": 5309, "loss": 3.1653, "learning_rate": 1e-05, "epoch": 0.10452100424910839, "percentage": 10.45, "elapsed_time": "1:44:07", "remaining_time": "14:51:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 560, "total_steps": 5309, "loss": 3.2451, "learning_rate": 1e-05, "epoch": 0.10546263491801929, "percentage": 10.55, "elapsed_time": "1:45:03", "remaining_time": "14:50:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 565, "total_steps": 5309, "loss": 3.2327, "learning_rate": 1e-05, "epoch": 0.10640426558693017, "percentage": 10.64, "elapsed_time": "1:45:59", "remaining_time": "14:49:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 570, "total_steps": 5309, "loss": 3.177, "learning_rate": 1e-05, "epoch": 0.10734589625584105, "percentage": 10.74, "elapsed_time": "1:46:55", "remaining_time": "14:48:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 575, "total_steps": 5309, "loss": 3.2389, "learning_rate": 1e-05, "epoch": 0.10828752692475194, "percentage": 10.83, "elapsed_time": "1:47:52", "remaining_time": "14:48:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 580, "total_steps": 5309, "loss": 3.2133, "learning_rate": 1e-05, "epoch": 0.10922915759366282, "percentage": 10.92, "elapsed_time": "1:48:46", "remaining_time": "14:46:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 585, "total_steps": 5309, "loss": 3.1059, "learning_rate": 1e-05, "epoch": 0.11017078826257372, "percentage": 11.02, "elapsed_time": "1:49:40", "remaining_time": "14:45:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 590, "total_steps": 5309, "loss": 3.2737, "learning_rate": 1e-05, "epoch": 0.1111124189314846, "percentage": 11.11, "elapsed_time": "1:50:36", "remaining_time": "14:44:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 595, "total_steps": 5309, "loss": 3.181, "learning_rate": 1e-05, "epoch": 0.11205404960039549, "percentage": 11.21, "elapsed_time": "1:51:30", "remaining_time": "14:43:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 600, "total_steps": 5309, "loss": 3.1989, "learning_rate": 1e-05, "epoch": 0.11299568026930637, "percentage": 11.3, "elapsed_time": "1:52:24", "remaining_time": "14:42:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 605, "total_steps": 5309, "loss": 3.165, "learning_rate": 1e-05, "epoch": 0.11393731093821725, "percentage": 11.4, "elapsed_time": "1:54:36", "remaining_time": "14:51:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 610, "total_steps": 5309, "loss": 3.2167, "learning_rate": 1e-05, "epoch": 0.11487894160712814, "percentage": 11.49, "elapsed_time": "1:55:29", "remaining_time": "14:49:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 615, "total_steps": 5309, "loss": 3.1573, "learning_rate": 1e-05, "epoch": 0.11582057227603904, "percentage": 11.58, "elapsed_time": "1:56:22", "remaining_time": "14:48:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 620, "total_steps": 5309, "loss": 3.2069, "learning_rate": 1e-05, "epoch": 0.11676220294494992, "percentage": 11.68, "elapsed_time": "1:57:17", "remaining_time": "14:47:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 625, "total_steps": 5309, "loss": 3.184, "learning_rate": 1e-05, "epoch": 0.1177038336138608, "percentage": 11.77, "elapsed_time": "1:58:11", "remaining_time": "14:45:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 630, "total_steps": 5309, "loss": 3.2377, "learning_rate": 1e-05, "epoch": 0.11864546428277169, "percentage": 11.87, "elapsed_time": "1:59:06", "remaining_time": "14:44:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 635, "total_steps": 5309, "loss": 3.2338, "learning_rate": 1e-05, "epoch": 0.11958709495168257, "percentage": 11.96, "elapsed_time": "1:59:58", "remaining_time": "14:43:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 640, "total_steps": 5309, "loss": 3.3123, "learning_rate": 1e-05, "epoch": 0.12052872562059347, "percentage": 12.06, "elapsed_time": "2:00:51", "remaining_time": "14:41:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 645, "total_steps": 5309, "loss": 3.1506, "learning_rate": 1e-05, "epoch": 0.12147035628950435, "percentage": 12.15, "elapsed_time": "2:01:44", "remaining_time": "14:40:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 650, "total_steps": 5309, "loss": 3.1423, "learning_rate": 1e-05, "epoch": 0.12241198695841524, "percentage": 12.24, "elapsed_time": "2:02:37", "remaining_time": "14:38:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 655, "total_steps": 5309, "loss": 3.0779, "learning_rate": 1e-05, "epoch": 0.12335361762732612, "percentage": 12.34, "elapsed_time": "2:03:31", "remaining_time": "14:37:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 660, "total_steps": 5309, "loss": 3.1623, "learning_rate": 1e-05, "epoch": 0.124295248296237, "percentage": 12.43, "elapsed_time": "2:04:24", "remaining_time": "14:36:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 665, "total_steps": 5309, "loss": 3.2047, "learning_rate": 1e-05, "epoch": 0.1252368789651479, "percentage": 12.53, "elapsed_time": "2:05:17", "remaining_time": "14:34:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 670, "total_steps": 5309, "loss": 3.1688, "learning_rate": 1e-05, "epoch": 0.12617850963405877, "percentage": 12.62, "elapsed_time": "2:06:11", "remaining_time": "14:33:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 675, "total_steps": 5309, "loss": 3.2182, "learning_rate": 1e-05, "epoch": 0.12712014030296967, "percentage": 12.71, "elapsed_time": "2:07:05", "remaining_time": "14:32:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 680, "total_steps": 5309, "loss": 3.2553, "learning_rate": 1e-05, "epoch": 0.12806177097188057, "percentage": 12.81, "elapsed_time": "2:07:58", "remaining_time": "14:31:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 685, "total_steps": 5309, "loss": 3.1702, "learning_rate": 1e-05, "epoch": 0.12900340164079144, "percentage": 12.9, "elapsed_time": "2:08:54", "remaining_time": "14:30:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 690, "total_steps": 5309, "loss": 3.1752, "learning_rate": 1e-05, "epoch": 0.12994503230970234, "percentage": 13.0, "elapsed_time": "2:09:48", "remaining_time": "14:28:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 695, "total_steps": 5309, "loss": 3.2211, "learning_rate": 1e-05, "epoch": 0.1308866629786132, "percentage": 13.09, "elapsed_time": "2:10:47", "remaining_time": "14:28:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 700, "total_steps": 5309, "loss": 3.1846, "learning_rate": 1e-05, "epoch": 0.1318282936475241, "percentage": 13.19, "elapsed_time": "2:11:41", "remaining_time": "14:27:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 705, "total_steps": 5309, "loss": 3.2351, "learning_rate": 1e-05, "epoch": 0.13276992431643497, "percentage": 13.28, "elapsed_time": "2:12:39", "remaining_time": "14:26:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 710, "total_steps": 5309, "loss": 3.2312, "learning_rate": 1e-05, "epoch": 0.13371155498534587, "percentage": 13.37, "elapsed_time": "2:13:34", "remaining_time": "14:25:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 715, "total_steps": 5309, "loss": 3.218, "learning_rate": 1e-05, "epoch": 0.13465318565425677, "percentage": 13.47, "elapsed_time": "2:14:31", "remaining_time": "14:24:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 720, "total_steps": 5309, "loss": 3.279, "learning_rate": 1e-05, "epoch": 0.13559481632316764, "percentage": 13.56, "elapsed_time": "2:15:24", "remaining_time": "14:23:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 725, "total_steps": 5309, "loss": 3.2876, "learning_rate": 1e-05, "epoch": 0.13653644699207854, "percentage": 13.66, "elapsed_time": "2:16:20", "remaining_time": "14:22:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 730, "total_steps": 5309, "loss": 3.2547, "learning_rate": 1e-05, "epoch": 0.1374780776609894, "percentage": 13.75, "elapsed_time": "2:17:16", "remaining_time": "14:21:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 735, "total_steps": 5309, "loss": 3.2795, "learning_rate": 1e-05, "epoch": 0.1384197083299003, "percentage": 13.84, "elapsed_time": "2:18:09", "remaining_time": "14:19:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 740, "total_steps": 5309, "loss": 3.0988, "learning_rate": 1e-05, "epoch": 0.1393613389988112, "percentage": 13.94, "elapsed_time": "2:19:04", "remaining_time": "14:18:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 745, "total_steps": 5309, "loss": 3.1612, "learning_rate": 1e-05, "epoch": 0.14030296966772207, "percentage": 14.03, "elapsed_time": "2:19:56", "remaining_time": "14:17:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 750, "total_steps": 5309, "loss": 3.1921, "learning_rate": 1e-05, "epoch": 0.14124460033663297, "percentage": 14.13, "elapsed_time": "2:20:51", "remaining_time": "14:16:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 755, "total_steps": 5309, "loss": 3.2371, "learning_rate": 1e-05, "epoch": 0.14218623100554384, "percentage": 14.22, "elapsed_time": "2:21:44", "remaining_time": "14:14:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 760, "total_steps": 5309, "loss": 3.2239, "learning_rate": 1e-05, "epoch": 0.14312786167445474, "percentage": 14.32, "elapsed_time": "2:22:39", "remaining_time": "14:13:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 765, "total_steps": 5309, "loss": 3.267, "learning_rate": 1e-05, "epoch": 0.14406949234336563, "percentage": 14.41, "elapsed_time": "2:23:33", "remaining_time": "14:12:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 770, "total_steps": 5309, "loss": 3.2387, "learning_rate": 1e-05, "epoch": 0.1450111230122765, "percentage": 14.5, "elapsed_time": "2:24:28", "remaining_time": "14:11:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 775, "total_steps": 5309, "loss": 3.1542, "learning_rate": 1e-05, "epoch": 0.1459527536811874, "percentage": 14.6, "elapsed_time": "2:25:25", "remaining_time": "14:10:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 780, "total_steps": 5309, "loss": 3.1742, "learning_rate": 1e-05, "epoch": 0.14689438435009827, "percentage": 14.69, "elapsed_time": "2:26:18", "remaining_time": "14:09:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 785, "total_steps": 5309, "loss": 3.2441, "learning_rate": 1e-05, "epoch": 0.14783601501900917, "percentage": 14.79, "elapsed_time": "2:27:14", "remaining_time": "14:08:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 790, "total_steps": 5309, "loss": 3.133, "learning_rate": 1e-05, "epoch": 0.14877764568792007, "percentage": 14.88, "elapsed_time": "2:28:08", "remaining_time": "14:07:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 795, "total_steps": 5309, "loss": 3.1822, "learning_rate": 1e-05, "epoch": 0.14971927635683094, "percentage": 14.97, "elapsed_time": "2:29:02", "remaining_time": "14:06:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 800, "total_steps": 5309, "loss": 3.2068, "learning_rate": 1e-05, "epoch": 0.15066090702574184, "percentage": 15.07, "elapsed_time": "2:29:59", "remaining_time": "14:05:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 805, "total_steps": 5309, "loss": 3.2194, "learning_rate": 1e-05, "epoch": 0.1516025376946527, "percentage": 15.16, "elapsed_time": "2:32:18", "remaining_time": "14:12:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 810, "total_steps": 5309, "loss": 3.1456, "learning_rate": 1e-05, "epoch": 0.1525441683635636, "percentage": 15.26, "elapsed_time": "2:33:16", "remaining_time": "14:11:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 815, "total_steps": 5309, "loss": 3.1675, "learning_rate": 1e-05, "epoch": 0.1534857990324745, "percentage": 15.35, "elapsed_time": "2:34:16", "remaining_time": "14:10:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 820, "total_steps": 5309, "loss": 3.1728, "learning_rate": 1e-05, "epoch": 0.15442742970138537, "percentage": 15.45, "elapsed_time": "2:35:15", "remaining_time": "14:09:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 825, "total_steps": 5309, "loss": 3.2012, "learning_rate": 1e-05, "epoch": 0.15536906037029627, "percentage": 15.54, "elapsed_time": "2:36:15", "remaining_time": "14:09:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 830, "total_steps": 5309, "loss": 3.1008, "learning_rate": 1e-05, "epoch": 0.15631069103920714, "percentage": 15.63, "elapsed_time": "2:37:14", "remaining_time": "14:08:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 835, "total_steps": 5309, "loss": 3.0711, "learning_rate": 1e-05, "epoch": 0.15725232170811804, "percentage": 15.73, "elapsed_time": "2:38:14", "remaining_time": "14:07:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 840, "total_steps": 5309, "loss": 3.1625, "learning_rate": 1e-05, "epoch": 0.1581939523770289, "percentage": 15.82, "elapsed_time": "2:39:12", "remaining_time": "14:07:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 845, "total_steps": 5309, "loss": 3.066, "learning_rate": 1e-05, "epoch": 0.1591355830459398, "percentage": 15.92, "elapsed_time": "2:40:14", "remaining_time": "14:06:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 850, "total_steps": 5309, "loss": 3.2498, "learning_rate": 1e-05, "epoch": 0.1600772137148507, "percentage": 16.01, "elapsed_time": "2:41:15", "remaining_time": "14:05:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 855, "total_steps": 5309, "loss": 3.2414, "learning_rate": 1e-05, "epoch": 0.16101884438376157, "percentage": 16.1, "elapsed_time": "2:42:16", "remaining_time": "14:05:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 860, "total_steps": 5309, "loss": 3.1307, "learning_rate": 1e-05, "epoch": 0.16196047505267247, "percentage": 16.2, "elapsed_time": "2:43:18", "remaining_time": "14:04:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 865, "total_steps": 5309, "loss": 3.1473, "learning_rate": 1e-05, "epoch": 0.16290210572158334, "percentage": 16.29, "elapsed_time": "2:44:19", "remaining_time": "14:04:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 870, "total_steps": 5309, "loss": 3.1971, "learning_rate": 1e-05, "epoch": 0.16384373639049424, "percentage": 16.39, "elapsed_time": "2:45:20", "remaining_time": "14:03:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 875, "total_steps": 5309, "loss": 3.1617, "learning_rate": 1e-05, "epoch": 0.16478536705940514, "percentage": 16.48, "elapsed_time": "2:46:19", "remaining_time": "14:02:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 880, "total_steps": 5309, "loss": 3.1806, "learning_rate": 1e-05, "epoch": 0.165726997728316, "percentage": 16.58, "elapsed_time": "2:47:20", "remaining_time": "14:02:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 885, "total_steps": 5309, "loss": 3.2673, "learning_rate": 1e-05, "epoch": 0.1666686283972269, "percentage": 16.67, "elapsed_time": "2:48:21", "remaining_time": "14:01:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 890, "total_steps": 5309, "loss": 3.273, "learning_rate": 1e-05, "epoch": 0.16761025906613777, "percentage": 16.76, "elapsed_time": "2:49:21", "remaining_time": "14:00:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 895, "total_steps": 5309, "loss": 3.1663, "learning_rate": 1e-05, "epoch": 0.16855188973504867, "percentage": 16.86, "elapsed_time": "2:50:21", "remaining_time": "14:00:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 900, "total_steps": 5309, "loss": 3.1979, "learning_rate": 1e-05, "epoch": 0.16949352040395957, "percentage": 16.95, "elapsed_time": "2:51:21", "remaining_time": "13:59:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 905, "total_steps": 5309, "loss": 3.2013, "learning_rate": 1e-05, "epoch": 0.17043515107287044, "percentage": 17.05, "elapsed_time": "2:52:22", "remaining_time": "13:58:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 910, "total_steps": 5309, "loss": 3.1721, "learning_rate": 1e-05, "epoch": 0.17137678174178134, "percentage": 17.14, "elapsed_time": "2:53:22", "remaining_time": "13:58:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 915, "total_steps": 5309, "loss": 3.1774, "learning_rate": 1e-05, "epoch": 0.1723184124106922, "percentage": 17.23, "elapsed_time": "2:54:20", "remaining_time": "13:57:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 920, "total_steps": 5309, "loss": 3.095, "learning_rate": 1e-05, "epoch": 0.1732600430796031, "percentage": 17.33, "elapsed_time": "2:55:21", "remaining_time": "13:56:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 925, "total_steps": 5309, "loss": 3.1806, "learning_rate": 1e-05, "epoch": 0.174201673748514, "percentage": 17.42, "elapsed_time": "2:56:21", "remaining_time": "13:55:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 930, "total_steps": 5309, "loss": 3.2352, "learning_rate": 1e-05, "epoch": 0.17514330441742487, "percentage": 17.52, "elapsed_time": "2:57:20", "remaining_time": "13:55:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 935, "total_steps": 5309, "loss": 3.2167, "learning_rate": 1e-05, "epoch": 0.17608493508633577, "percentage": 17.61, "elapsed_time": "2:58:16", "remaining_time": "13:53:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 940, "total_steps": 5309, "loss": 3.12, "learning_rate": 1e-05, "epoch": 0.17702656575524664, "percentage": 17.71, "elapsed_time": "2:59:10", "remaining_time": "13:52:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 945, "total_steps": 5309, "loss": 3.1027, "learning_rate": 1e-05, "epoch": 0.17796819642415754, "percentage": 17.8, "elapsed_time": "3:00:06", "remaining_time": "13:51:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 950, "total_steps": 5309, "loss": 2.9981, "learning_rate": 1e-05, "epoch": 0.1789098270930684, "percentage": 17.89, "elapsed_time": "3:01:00", "remaining_time": "13:50:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 955, "total_steps": 5309, "loss": 3.0539, "learning_rate": 1e-05, "epoch": 0.1798514577619793, "percentage": 17.99, "elapsed_time": "3:01:57", "remaining_time": "13:49:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 960, "total_steps": 5309, "loss": 3.1362, "learning_rate": 1e-05, "epoch": 0.1807930884308902, "percentage": 18.08, "elapsed_time": "3:02:53", "remaining_time": "13:48:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 965, "total_steps": 5309, "loss": 3.1821, "learning_rate": 1e-05, "epoch": 0.18173471909980107, "percentage": 18.18, "elapsed_time": "3:03:47", "remaining_time": "13:47:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 970, "total_steps": 5309, "loss": 3.1523, "learning_rate": 1e-05, "epoch": 0.18267634976871197, "percentage": 18.27, "elapsed_time": "3:04:41", "remaining_time": "13:46:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 975, "total_steps": 5309, "loss": 3.2531, "learning_rate": 1e-05, "epoch": 0.18361798043762284, "percentage": 18.37, "elapsed_time": "3:05:33", "remaining_time": "13:44:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 980, "total_steps": 5309, "loss": 3.1006, "learning_rate": 1e-05, "epoch": 0.18455961110653374, "percentage": 18.46, "elapsed_time": "3:06:28", "remaining_time": "13:43:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 985, "total_steps": 5309, "loss": 3.1259, "learning_rate": 1e-05, "epoch": 0.18550124177544464, "percentage": 18.55, "elapsed_time": "3:07:23", "remaining_time": "13:42:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 990, "total_steps": 5309, "loss": 3.1813, "learning_rate": 1e-05, "epoch": 0.1864428724443555, "percentage": 18.65, "elapsed_time": "3:08:16", "remaining_time": "13:41:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 995, "total_steps": 5309, "loss": 3.1389, "learning_rate": 1e-05, "epoch": 0.1873845031132664, "percentage": 18.74, "elapsed_time": "3:09:10", "remaining_time": "13:40:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1000, "total_steps": 5309, "loss": 3.1203, "learning_rate": 1e-05, "epoch": 0.18832613378217727, "percentage": 18.84, "elapsed_time": "3:10:04", "remaining_time": "13:39:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1000, "total_steps": 5309, "eval_loss": 3.179180860519409, "epoch": 0.18832613378217727, "percentage": 18.84, "elapsed_time": "3:28:34", "remaining_time": "14:58:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1005, "total_steps": 5309, "loss": 3.2909, "learning_rate": 1e-05, "epoch": 0.18926776445108817, "percentage": 18.93, "elapsed_time": "3:30:47", "remaining_time": "15:02:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1010, "total_steps": 5309, "loss": 3.1388, "learning_rate": 1e-05, "epoch": 0.19020939511999907, "percentage": 19.02, "elapsed_time": "3:31:40", "remaining_time": "15:00:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1015, "total_steps": 5309, "loss": 3.1176, "learning_rate": 1e-05, "epoch": 0.19115102578890994, "percentage": 19.12, "elapsed_time": "3:32:33", "remaining_time": "14:59:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1020, "total_steps": 5309, "loss": 3.1302, "learning_rate": 1e-05, "epoch": 0.19209265645782084, "percentage": 19.21, "elapsed_time": "3:33:26", "remaining_time": "14:57:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1025, "total_steps": 5309, "loss": 3.1978, "learning_rate": 1e-05, "epoch": 0.1930342871267317, "percentage": 19.31, "elapsed_time": "3:34:23", "remaining_time": "14:56:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1030, "total_steps": 5309, "loss": 3.2441, "learning_rate": 1e-05, "epoch": 0.1939759177956426, "percentage": 19.4, "elapsed_time": "3:35:17", "remaining_time": "14:54:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1035, "total_steps": 5309, "loss": 3.209, "learning_rate": 1e-05, "epoch": 0.1949175484645535, "percentage": 19.5, "elapsed_time": "3:36:14", "remaining_time": "14:52:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1040, "total_steps": 5309, "loss": 3.0915, "learning_rate": 1e-05, "epoch": 0.19585917913346437, "percentage": 19.59, "elapsed_time": "3:37:09", "remaining_time": "14:51:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1045, "total_steps": 5309, "loss": 3.2262, "learning_rate": 1e-05, "epoch": 0.19680080980237527, "percentage": 19.68, "elapsed_time": "3:37:59", "remaining_time": "14:49:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1050, "total_steps": 5309, "loss": 3.1164, "learning_rate": 1e-05, "epoch": 0.19774244047128614, "percentage": 19.78, "elapsed_time": "3:38:55", "remaining_time": "14:48:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1055, "total_steps": 5309, "loss": 3.2323, "learning_rate": 1e-05, "epoch": 0.19868407114019704, "percentage": 19.87, "elapsed_time": "3:39:49", "remaining_time": "14:46:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1060, "total_steps": 5309, "loss": 3.1852, "learning_rate": 1e-05, "epoch": 0.19962570180910794, "percentage": 19.97, "elapsed_time": "3:40:43", "remaining_time": "14:44:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1065, "total_steps": 5309, "loss": 3.2516, "learning_rate": 1e-05, "epoch": 0.2005673324780188, "percentage": 20.06, "elapsed_time": "3:41:37", "remaining_time": "14:43:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1070, "total_steps": 5309, "loss": 3.1669, "learning_rate": 1e-05, "epoch": 0.2015089631469297, "percentage": 20.15, "elapsed_time": "3:42:32", "remaining_time": "14:41:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1075, "total_steps": 5309, "loss": 3.1575, "learning_rate": 1e-05, "epoch": 0.20245059381584057, "percentage": 20.25, "elapsed_time": "3:43:26", "remaining_time": "14:40:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1080, "total_steps": 5309, "loss": 3.182, "learning_rate": 1e-05, "epoch": 0.20339222448475147, "percentage": 20.34, "elapsed_time": "3:44:21", "remaining_time": "14:38:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1085, "total_steps": 5309, "loss": 3.1049, "learning_rate": 1e-05, "epoch": 0.20433385515366234, "percentage": 20.44, "elapsed_time": "3:45:16", "remaining_time": "14:37:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1090, "total_steps": 5309, "loss": 3.0769, "learning_rate": 1e-05, "epoch": 0.20527548582257324, "percentage": 20.53, "elapsed_time": "3:46:10", "remaining_time": "14:35:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1095, "total_steps": 5309, "loss": 3.0977, "learning_rate": 1e-05, "epoch": 0.20621711649148414, "percentage": 20.63, "elapsed_time": "3:47:04", "remaining_time": "14:33:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1100, "total_steps": 5309, "loss": 3.1317, "learning_rate": 1e-05, "epoch": 0.207158747160395, "percentage": 20.72, "elapsed_time": "3:47:59", "remaining_time": "14:32:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1105, "total_steps": 5309, "loss": 3.2471, "learning_rate": 1e-05, "epoch": 0.2081003778293059, "percentage": 20.81, "elapsed_time": "3:48:54", "remaining_time": "14:30:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1110, "total_steps": 5309, "loss": 3.183, "learning_rate": 1e-05, "epoch": 0.20904200849821677, "percentage": 20.91, "elapsed_time": "3:49:49", "remaining_time": "14:29:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1115, "total_steps": 5309, "loss": 3.2104, "learning_rate": 1e-05, "epoch": 0.20998363916712767, "percentage": 21.0, "elapsed_time": "3:50:43", "remaining_time": "14:27:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1120, "total_steps": 5309, "loss": 3.0842, "learning_rate": 1e-05, "epoch": 0.21092526983603857, "percentage": 21.1, "elapsed_time": "3:51:37", "remaining_time": "14:26:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1125, "total_steps": 5309, "loss": 3.2527, "learning_rate": 1e-05, "epoch": 0.21186690050494944, "percentage": 21.19, "elapsed_time": "3:52:30", "remaining_time": "14:24:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1130, "total_steps": 5309, "loss": 3.2335, "learning_rate": 1e-05, "epoch": 0.21280853117386034, "percentage": 21.28, "elapsed_time": "3:53:26", "remaining_time": "14:23:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1135, "total_steps": 5309, "loss": 3.1974, "learning_rate": 1e-05, "epoch": 0.2137501618427712, "percentage": 21.38, "elapsed_time": "3:54:21", "remaining_time": "14:21:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1140, "total_steps": 5309, "loss": 3.0964, "learning_rate": 1e-05, "epoch": 0.2146917925116821, "percentage": 21.47, "elapsed_time": "3:55:14", "remaining_time": "14:20:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1145, "total_steps": 5309, "loss": 3.1731, "learning_rate": 1e-05, "epoch": 0.215633423180593, "percentage": 21.57, "elapsed_time": "3:56:07", "remaining_time": "14:18:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1150, "total_steps": 5309, "loss": 3.203, "learning_rate": 1e-05, "epoch": 0.21657505384950387, "percentage": 21.66, "elapsed_time": "3:57:01", "remaining_time": "14:17:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1155, "total_steps": 5309, "loss": 3.0797, "learning_rate": 1e-05, "epoch": 0.21751668451841477, "percentage": 21.76, "elapsed_time": "3:57:56", "remaining_time": "14:15:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1160, "total_steps": 5309, "loss": 3.1964, "learning_rate": 1e-05, "epoch": 0.21845831518732564, "percentage": 21.85, "elapsed_time": "3:58:50", "remaining_time": "14:14:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1165, "total_steps": 5309, "loss": 3.0157, "learning_rate": 1e-05, "epoch": 0.21939994585623654, "percentage": 21.94, "elapsed_time": "3:59:42", "remaining_time": "14:12:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1170, "total_steps": 5309, "loss": 3.1937, "learning_rate": 1e-05, "epoch": 0.22034157652514744, "percentage": 22.04, "elapsed_time": "4:00:35", "remaining_time": "14:11:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1175, "total_steps": 5309, "loss": 3.1185, "learning_rate": 1e-05, "epoch": 0.2212832071940583, "percentage": 22.13, "elapsed_time": "4:01:31", "remaining_time": "14:09:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1180, "total_steps": 5309, "loss": 3.0673, "learning_rate": 1e-05, "epoch": 0.2222248378629692, "percentage": 22.23, "elapsed_time": "4:02:25", "remaining_time": "14:08:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1185, "total_steps": 5309, "loss": 3.1101, "learning_rate": 1e-05, "epoch": 0.22316646853188007, "percentage": 22.32, "elapsed_time": "4:03:19", "remaining_time": "14:06:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1190, "total_steps": 5309, "loss": 3.2017, "learning_rate": 1e-05, "epoch": 0.22410809920079097, "percentage": 22.41, "elapsed_time": "4:04:15", "remaining_time": "14:05:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1195, "total_steps": 5309, "loss": 3.1853, "learning_rate": 1e-05, "epoch": 0.22504972986970187, "percentage": 22.51, "elapsed_time": "4:05:09", "remaining_time": "14:04:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1200, "total_steps": 5309, "loss": 3.0598, "learning_rate": 1e-05, "epoch": 0.22599136053861274, "percentage": 22.6, "elapsed_time": "4:06:02", "remaining_time": "14:02:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1205, "total_steps": 5309, "loss": 3.2231, "learning_rate": 1e-05, "epoch": 0.22693299120752364, "percentage": 22.7, "elapsed_time": "4:08:13", "remaining_time": "14:05:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1210, "total_steps": 5309, "loss": 3.0795, "learning_rate": 1e-05, "epoch": 0.2278746218764345, "percentage": 22.79, "elapsed_time": "4:09:06", "remaining_time": "14:03:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1215, "total_steps": 5309, "loss": 3.1155, "learning_rate": 1e-05, "epoch": 0.2288162525453454, "percentage": 22.89, "elapsed_time": "4:10:01", "remaining_time": "14:02:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1220, "total_steps": 5309, "loss": 3.1393, "learning_rate": 1e-05, "epoch": 0.22975788321425628, "percentage": 22.98, "elapsed_time": "4:10:56", "remaining_time": "14:01:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1225, "total_steps": 5309, "loss": 3.1817, "learning_rate": 1e-05, "epoch": 0.23069951388316717, "percentage": 23.07, "elapsed_time": "4:11:50", "remaining_time": "13:59:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1230, "total_steps": 5309, "loss": 3.1628, "learning_rate": 1e-05, "epoch": 0.23164114455207807, "percentage": 23.17, "elapsed_time": "4:12:45", "remaining_time": "13:58:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1235, "total_steps": 5309, "loss": 3.1317, "learning_rate": 1e-05, "epoch": 0.23258277522098894, "percentage": 23.26, "elapsed_time": "4:13:41", "remaining_time": "13:56:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1240, "total_steps": 5309, "loss": 3.1783, "learning_rate": 1e-05, "epoch": 0.23352440588989984, "percentage": 23.36, "elapsed_time": "4:14:35", "remaining_time": "13:55:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1245, "total_steps": 5309, "loss": 3.1752, "learning_rate": 1e-05, "epoch": 0.2344660365588107, "percentage": 23.45, "elapsed_time": "4:15:31", "remaining_time": "13:54:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1250, "total_steps": 5309, "loss": 3.2413, "learning_rate": 1e-05, "epoch": 0.2354076672277216, "percentage": 23.54, "elapsed_time": "4:16:27", "remaining_time": "13:52:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1255, "total_steps": 5309, "loss": 3.1678, "learning_rate": 1e-05, "epoch": 0.2363492978966325, "percentage": 23.64, "elapsed_time": "4:17:22", "remaining_time": "13:51:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1260, "total_steps": 5309, "loss": 3.1669, "learning_rate": 1e-05, "epoch": 0.23729092856554337, "percentage": 23.73, "elapsed_time": "4:18:16", "remaining_time": "13:49:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1265, "total_steps": 5309, "loss": 3.1201, "learning_rate": 1e-05, "epoch": 0.23823255923445427, "percentage": 23.83, "elapsed_time": "4:19:11", "remaining_time": "13:48:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1270, "total_steps": 5309, "loss": 3.1909, "learning_rate": 1e-05, "epoch": 0.23917418990336514, "percentage": 23.92, "elapsed_time": "4:20:03", "remaining_time": "13:47:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1275, "total_steps": 5309, "loss": 3.2572, "learning_rate": 1e-05, "epoch": 0.24011582057227604, "percentage": 24.02, "elapsed_time": "4:20:57", "remaining_time": "13:45:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1280, "total_steps": 5309, "loss": 3.1206, "learning_rate": 1e-05, "epoch": 0.24105745124118694, "percentage": 24.11, "elapsed_time": "4:21:51", "remaining_time": "13:44:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1285, "total_steps": 5309, "loss": 3.2485, "learning_rate": 1e-05, "epoch": 0.2419990819100978, "percentage": 24.2, "elapsed_time": "4:22:45", "remaining_time": "13:42:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1290, "total_steps": 5309, "loss": 3.1398, "learning_rate": 1e-05, "epoch": 0.2429407125790087, "percentage": 24.3, "elapsed_time": "4:23:41", "remaining_time": "13:41:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1295, "total_steps": 5309, "loss": 3.0652, "learning_rate": 1e-05, "epoch": 0.24388234324791958, "percentage": 24.39, "elapsed_time": "4:24:35", "remaining_time": "13:40:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1300, "total_steps": 5309, "loss": 3.0686, "learning_rate": 1e-05, "epoch": 0.24482397391683047, "percentage": 24.49, "elapsed_time": "4:25:29", "remaining_time": "13:38:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1305, "total_steps": 5309, "loss": 3.2359, "learning_rate": 1e-05, "epoch": 0.24576560458574137, "percentage": 24.58, "elapsed_time": "4:26:23", "remaining_time": "13:37:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1310, "total_steps": 5309, "loss": 3.0857, "learning_rate": 1e-05, "epoch": 0.24670723525465224, "percentage": 24.68, "elapsed_time": "4:27:17", "remaining_time": "13:35:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1315, "total_steps": 5309, "loss": 3.244, "learning_rate": 1e-05, "epoch": 0.24764886592356314, "percentage": 24.77, "elapsed_time": "4:28:11", "remaining_time": "13:34:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1320, "total_steps": 5309, "loss": 3.1444, "learning_rate": 1e-05, "epoch": 0.248590496592474, "percentage": 24.86, "elapsed_time": "4:29:06", "remaining_time": "13:33:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1325, "total_steps": 5309, "loss": 3.2096, "learning_rate": 1e-05, "epoch": 0.2495321272613849, "percentage": 24.96, "elapsed_time": "4:30:00", "remaining_time": "13:31:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1330, "total_steps": 5309, "loss": 3.139, "learning_rate": 1e-05, "epoch": 0.2504737579302958, "percentage": 25.05, "elapsed_time": "4:30:54", "remaining_time": "13:30:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1335, "total_steps": 5309, "loss": 3.1436, "learning_rate": 1e-05, "epoch": 0.2514153885992067, "percentage": 25.15, "elapsed_time": "4:31:48", "remaining_time": "13:29:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1340, "total_steps": 5309, "loss": 3.1479, "learning_rate": 1e-05, "epoch": 0.25235701926811754, "percentage": 25.24, "elapsed_time": "4:32:40", "remaining_time": "13:27:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1345, "total_steps": 5309, "loss": 3.0753, "learning_rate": 1e-05, "epoch": 0.25329864993702844, "percentage": 25.33, "elapsed_time": "4:33:33", "remaining_time": "13:26:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1350, "total_steps": 5309, "loss": 3.0703, "learning_rate": 1e-05, "epoch": 0.25424028060593934, "percentage": 25.43, "elapsed_time": "4:34:27", "remaining_time": "13:24:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1355, "total_steps": 5309, "loss": 3.0837, "learning_rate": 1e-05, "epoch": 0.25518191127485024, "percentage": 25.52, "elapsed_time": "4:35:25", "remaining_time": "13:23:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1360, "total_steps": 5309, "loss": 3.121, "learning_rate": 1e-05, "epoch": 0.25612354194376113, "percentage": 25.62, "elapsed_time": "4:36:17", "remaining_time": "13:22:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1365, "total_steps": 5309, "loss": 3.122, "learning_rate": 1e-05, "epoch": 0.257065172612672, "percentage": 25.71, "elapsed_time": "4:37:10", "remaining_time": "13:20:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1370, "total_steps": 5309, "loss": 3.1381, "learning_rate": 1e-05, "epoch": 0.2580068032815829, "percentage": 25.81, "elapsed_time": "4:38:04", "remaining_time": "13:19:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1375, "total_steps": 5309, "loss": 3.1744, "learning_rate": 1e-05, "epoch": 0.2589484339504938, "percentage": 25.9, "elapsed_time": "4:38:56", "remaining_time": "13:18:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1380, "total_steps": 5309, "loss": 3.1222, "learning_rate": 1e-05, "epoch": 0.25989006461940467, "percentage": 25.99, "elapsed_time": "4:39:51", "remaining_time": "13:16:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1385, "total_steps": 5309, "loss": 3.1122, "learning_rate": 1e-05, "epoch": 0.26083169528831557, "percentage": 26.09, "elapsed_time": "4:40:44", "remaining_time": "13:15:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1390, "total_steps": 5309, "loss": 3.0969, "learning_rate": 1e-05, "epoch": 0.2617733259572264, "percentage": 26.18, "elapsed_time": "4:41:37", "remaining_time": "13:14:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1395, "total_steps": 5309, "loss": 3.0817, "learning_rate": 1e-05, "epoch": 0.2627149566261373, "percentage": 26.28, "elapsed_time": "4:42:30", "remaining_time": "13:12:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1400, "total_steps": 5309, "loss": 3.105, "learning_rate": 1e-05, "epoch": 0.2636565872950482, "percentage": 26.37, "elapsed_time": "4:43:23", "remaining_time": "13:11:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1405, "total_steps": 5309, "loss": 3.2028, "learning_rate": 1e-05, "epoch": 0.2645982179639591, "percentage": 26.46, "elapsed_time": "4:45:39", "remaining_time": "13:13:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1410, "total_steps": 5309, "loss": 3.014, "learning_rate": 1e-05, "epoch": 0.26553984863286995, "percentage": 26.56, "elapsed_time": "4:46:33", "remaining_time": "13:12:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1415, "total_steps": 5309, "loss": 3.143, "learning_rate": 1e-05, "epoch": 0.26648147930178084, "percentage": 26.65, "elapsed_time": "4:47:26", "remaining_time": "13:11:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1420, "total_steps": 5309, "loss": 3.1865, "learning_rate": 1e-05, "epoch": 0.26742310997069174, "percentage": 26.75, "elapsed_time": "4:48:20", "remaining_time": "13:09:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1425, "total_steps": 5309, "loss": 3.0858, "learning_rate": 1e-05, "epoch": 0.26836474063960264, "percentage": 26.84, "elapsed_time": "4:49:15", "remaining_time": "13:08:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1430, "total_steps": 5309, "loss": 2.9854, "learning_rate": 1e-05, "epoch": 0.26930637130851354, "percentage": 26.94, "elapsed_time": "4:50:09", "remaining_time": "13:07:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1435, "total_steps": 5309, "loss": 3.0504, "learning_rate": 1e-05, "epoch": 0.2702480019774244, "percentage": 27.03, "elapsed_time": "4:51:02", "remaining_time": "13:05:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1440, "total_steps": 5309, "loss": 3.0354, "learning_rate": 1e-05, "epoch": 0.2711896326463353, "percentage": 27.12, "elapsed_time": "4:51:59", "remaining_time": "13:04:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1445, "total_steps": 5309, "loss": 3.067, "learning_rate": 1e-05, "epoch": 0.2721312633152462, "percentage": 27.22, "elapsed_time": "4:52:53", "remaining_time": "13:03:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1450, "total_steps": 5309, "loss": 3.1172, "learning_rate": 1e-05, "epoch": 0.2730728939841571, "percentage": 27.31, "elapsed_time": "4:53:48", "remaining_time": "13:01:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1455, "total_steps": 5309, "loss": 3.139, "learning_rate": 1e-05, "epoch": 0.27401452465306797, "percentage": 27.41, "elapsed_time": "4:54:41", "remaining_time": "13:00:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1460, "total_steps": 5309, "loss": 3.1805, "learning_rate": 1e-05, "epoch": 0.2749561553219788, "percentage": 27.5, "elapsed_time": "4:55:35", "remaining_time": "12:59:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1465, "total_steps": 5309, "loss": 3.1389, "learning_rate": 1e-05, "epoch": 0.2758977859908897, "percentage": 27.59, "elapsed_time": "4:56:29", "remaining_time": "12:57:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1470, "total_steps": 5309, "loss": 3.0739, "learning_rate": 1e-05, "epoch": 0.2768394166598006, "percentage": 27.69, "elapsed_time": "4:57:23", "remaining_time": "12:56:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1475, "total_steps": 5309, "loss": 3.043, "learning_rate": 1e-05, "epoch": 0.2777810473287115, "percentage": 27.78, "elapsed_time": "4:58:17", "remaining_time": "12:55:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1480, "total_steps": 5309, "loss": 3.2218, "learning_rate": 1e-05, "epoch": 0.2787226779976224, "percentage": 27.88, "elapsed_time": "4:59:10", "remaining_time": "12:54:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1485, "total_steps": 5309, "loss": 3.1249, "learning_rate": 1e-05, "epoch": 0.27966430866653325, "percentage": 27.97, "elapsed_time": "5:00:03", "remaining_time": "12:52:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1490, "total_steps": 5309, "loss": 3.0944, "learning_rate": 1e-05, "epoch": 0.28060593933544414, "percentage": 28.07, "elapsed_time": "5:00:57", "remaining_time": "12:51:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1495, "total_steps": 5309, "loss": 3.0844, "learning_rate": 1e-05, "epoch": 0.28154757000435504, "percentage": 28.16, "elapsed_time": "5:01:50", "remaining_time": "12:50:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1500, "total_steps": 5309, "loss": 3.2153, "learning_rate": 1e-05, "epoch": 0.28248920067326594, "percentage": 28.25, "elapsed_time": "5:02:43", "remaining_time": "12:48:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1505, "total_steps": 5309, "loss": 3.0676, "learning_rate": 1e-05, "epoch": 0.28343083134217684, "percentage": 28.35, "elapsed_time": "5:03:37", "remaining_time": "12:47:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1510, "total_steps": 5309, "loss": 3.0716, "learning_rate": 1e-05, "epoch": 0.2843724620110877, "percentage": 28.44, "elapsed_time": "5:04:30", "remaining_time": "12:46:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1515, "total_steps": 5309, "loss": 3.142, "learning_rate": 1e-05, "epoch": 0.2853140926799986, "percentage": 28.54, "elapsed_time": "5:05:23", "remaining_time": "12:44:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1520, "total_steps": 5309, "loss": 3.2461, "learning_rate": 1e-05, "epoch": 0.2862557233489095, "percentage": 28.63, "elapsed_time": "5:06:16", "remaining_time": "12:43:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1525, "total_steps": 5309, "loss": 3.1051, "learning_rate": 1e-05, "epoch": 0.28719735401782037, "percentage": 28.72, "elapsed_time": "5:07:09", "remaining_time": "12:42:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1530, "total_steps": 5309, "loss": 3.1131, "learning_rate": 1e-05, "epoch": 0.28813898468673127, "percentage": 28.82, "elapsed_time": "5:08:04", "remaining_time": "12:40:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1535, "total_steps": 5309, "loss": 3.1323, "learning_rate": 1e-05, "epoch": 0.2890806153556421, "percentage": 28.91, "elapsed_time": "5:08:58", "remaining_time": "12:39:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1540, "total_steps": 5309, "loss": 3.1595, "learning_rate": 1e-05, "epoch": 0.290022246024553, "percentage": 29.01, "elapsed_time": "5:09:52", "remaining_time": "12:38:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1545, "total_steps": 5309, "loss": 3.0943, "learning_rate": 1e-05, "epoch": 0.2909638766934639, "percentage": 29.1, "elapsed_time": "5:10:47", "remaining_time": "12:37:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1550, "total_steps": 5309, "loss": 3.194, "learning_rate": 1e-05, "epoch": 0.2919055073623748, "percentage": 29.2, "elapsed_time": "5:11:41", "remaining_time": "12:35:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1555, "total_steps": 5309, "loss": 3.0033, "learning_rate": 1e-05, "epoch": 0.2928471380312857, "percentage": 29.29, "elapsed_time": "5:12:35", "remaining_time": "12:34:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1560, "total_steps": 5309, "loss": 3.1661, "learning_rate": 1e-05, "epoch": 0.29378876870019655, "percentage": 29.38, "elapsed_time": "5:13:29", "remaining_time": "12:33:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1565, "total_steps": 5309, "loss": 3.1411, "learning_rate": 1e-05, "epoch": 0.29473039936910744, "percentage": 29.48, "elapsed_time": "5:14:23", "remaining_time": "12:32:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1570, "total_steps": 5309, "loss": 3.0471, "learning_rate": 1e-05, "epoch": 0.29567203003801834, "percentage": 29.57, "elapsed_time": "5:15:17", "remaining_time": "12:30:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1575, "total_steps": 5309, "loss": 3.1417, "learning_rate": 1e-05, "epoch": 0.29661366070692924, "percentage": 29.67, "elapsed_time": "5:16:09", "remaining_time": "12:29:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1580, "total_steps": 5309, "loss": 3.13, "learning_rate": 1e-05, "epoch": 0.29755529137584014, "percentage": 29.76, "elapsed_time": "5:17:04", "remaining_time": "12:28:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1585, "total_steps": 5309, "loss": 3.1489, "learning_rate": 1e-05, "epoch": 0.298496922044751, "percentage": 29.85, "elapsed_time": "5:17:59", "remaining_time": "12:27:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1590, "total_steps": 5309, "loss": 3.1203, "learning_rate": 1e-05, "epoch": 0.2994385527136619, "percentage": 29.95, "elapsed_time": "5:18:52", "remaining_time": "12:25:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1595, "total_steps": 5309, "loss": 3.1018, "learning_rate": 1e-05, "epoch": 0.3003801833825728, "percentage": 30.04, "elapsed_time": "5:19:46", "remaining_time": "12:24:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1600, "total_steps": 5309, "loss": 3.209, "learning_rate": 1e-05, "epoch": 0.30132181405148367, "percentage": 30.14, "elapsed_time": "5:20:40", "remaining_time": "12:23:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1605, "total_steps": 5309, "loss": 3.2921, "learning_rate": 1e-05, "epoch": 0.30226344472039457, "percentage": 30.23, "elapsed_time": "5:22:55", "remaining_time": "12:25:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1610, "total_steps": 5309, "loss": 3.1812, "learning_rate": 1e-05, "epoch": 0.3032050753893054, "percentage": 30.33, "elapsed_time": "5:23:50", "remaining_time": "12:24:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1615, "total_steps": 5309, "loss": 3.0092, "learning_rate": 1e-05, "epoch": 0.3041467060582163, "percentage": 30.42, "elapsed_time": "5:24:43", "remaining_time": "12:22:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1620, "total_steps": 5309, "loss": 3.1616, "learning_rate": 1e-05, "epoch": 0.3050883367271272, "percentage": 30.51, "elapsed_time": "5:25:37", "remaining_time": "12:21:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1625, "total_steps": 5309, "loss": 3.1064, "learning_rate": 1e-05, "epoch": 0.3060299673960381, "percentage": 30.61, "elapsed_time": "5:26:32", "remaining_time": "12:20:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1630, "total_steps": 5309, "loss": 3.1486, "learning_rate": 1e-05, "epoch": 0.306971598064949, "percentage": 30.7, "elapsed_time": "5:27:26", "remaining_time": "12:19:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1635, "total_steps": 5309, "loss": 2.995, "learning_rate": 1e-05, "epoch": 0.30791322873385985, "percentage": 30.8, "elapsed_time": "5:28:20", "remaining_time": "12:17:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1640, "total_steps": 5309, "loss": 3.1971, "learning_rate": 1e-05, "epoch": 0.30885485940277074, "percentage": 30.89, "elapsed_time": "5:29:13", "remaining_time": "12:16:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1645, "total_steps": 5309, "loss": 3.1604, "learning_rate": 1e-05, "epoch": 0.30979649007168164, "percentage": 30.99, "elapsed_time": "5:30:07", "remaining_time": "12:15:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1650, "total_steps": 5309, "loss": 3.0831, "learning_rate": 1e-05, "epoch": 0.31073812074059254, "percentage": 31.08, "elapsed_time": "5:31:01", "remaining_time": "12:14:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1655, "total_steps": 5309, "loss": 3.1665, "learning_rate": 1e-05, "epoch": 0.3116797514095034, "percentage": 31.17, "elapsed_time": "5:31:56", "remaining_time": "12:12:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1660, "total_steps": 5309, "loss": 3.0876, "learning_rate": 1e-05, "epoch": 0.3126213820784143, "percentage": 31.27, "elapsed_time": "5:32:50", "remaining_time": "12:11:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1665, "total_steps": 5309, "loss": 3.1172, "learning_rate": 1e-05, "epoch": 0.3135630127473252, "percentage": 31.36, "elapsed_time": "5:33:43", "remaining_time": "12:10:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1670, "total_steps": 5309, "loss": 3.1627, "learning_rate": 1e-05, "epoch": 0.3145046434162361, "percentage": 31.46, "elapsed_time": "5:34:37", "remaining_time": "12:09:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1675, "total_steps": 5309, "loss": 3.0749, "learning_rate": 1e-05, "epoch": 0.31544627408514697, "percentage": 31.55, "elapsed_time": "5:35:30", "remaining_time": "12:07:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1680, "total_steps": 5309, "loss": 3.0414, "learning_rate": 1e-05, "epoch": 0.3163879047540578, "percentage": 31.64, "elapsed_time": "5:36:25", "remaining_time": "12:06:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1685, "total_steps": 5309, "loss": 3.1829, "learning_rate": 1e-05, "epoch": 0.3173295354229687, "percentage": 31.74, "elapsed_time": "5:37:18", "remaining_time": "12:05:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1690, "total_steps": 5309, "loss": 3.0745, "learning_rate": 1e-05, "epoch": 0.3182711660918796, "percentage": 31.83, "elapsed_time": "5:38:12", "remaining_time": "12:04:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1695, "total_steps": 5309, "loss": 3.1691, "learning_rate": 1e-05, "epoch": 0.3192127967607905, "percentage": 31.93, "elapsed_time": "5:39:05", "remaining_time": "12:02:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1700, "total_steps": 5309, "loss": 3.0937, "learning_rate": 1e-05, "epoch": 0.3201544274297014, "percentage": 32.02, "elapsed_time": "5:39:58", "remaining_time": "12:01:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1705, "total_steps": 5309, "loss": 3.0187, "learning_rate": 1e-05, "epoch": 0.32109605809861225, "percentage": 32.12, "elapsed_time": "5:40:53", "remaining_time": "12:00:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1710, "total_steps": 5309, "loss": 3.0608, "learning_rate": 1e-05, "epoch": 0.32203768876752314, "percentage": 32.21, "elapsed_time": "5:41:47", "remaining_time": "11:59:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1715, "total_steps": 5309, "loss": 3.1721, "learning_rate": 1e-05, "epoch": 0.32297931943643404, "percentage": 32.3, "elapsed_time": "5:42:40", "remaining_time": "11:58:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1720, "total_steps": 5309, "loss": 3.0493, "learning_rate": 1e-05, "epoch": 0.32392095010534494, "percentage": 32.4, "elapsed_time": "5:43:34", "remaining_time": "11:56:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1725, "total_steps": 5309, "loss": 3.0396, "learning_rate": 1e-05, "epoch": 0.32486258077425584, "percentage": 32.49, "elapsed_time": "5:44:28", "remaining_time": "11:55:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1730, "total_steps": 5309, "loss": 3.0956, "learning_rate": 1e-05, "epoch": 0.3258042114431667, "percentage": 32.59, "elapsed_time": "5:45:22", "remaining_time": "11:54:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1735, "total_steps": 5309, "loss": 3.1334, "learning_rate": 1e-05, "epoch": 0.3267458421120776, "percentage": 32.68, "elapsed_time": "5:46:13", "remaining_time": "11:53:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1740, "total_steps": 5309, "loss": 3.1312, "learning_rate": 1e-05, "epoch": 0.3276874727809885, "percentage": 32.77, "elapsed_time": "5:47:06", "remaining_time": "11:51:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1745, "total_steps": 5309, "loss": 2.9995, "learning_rate": 1e-05, "epoch": 0.3286291034498994, "percentage": 32.87, "elapsed_time": "5:48:00", "remaining_time": "11:50:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1750, "total_steps": 5309, "loss": 3.1386, "learning_rate": 1e-05, "epoch": 0.32957073411881027, "percentage": 32.96, "elapsed_time": "5:48:52", "remaining_time": "11:49:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1755, "total_steps": 5309, "loss": 3.0442, "learning_rate": 1e-05, "epoch": 0.3305123647877211, "percentage": 33.06, "elapsed_time": "5:49:47", "remaining_time": "11:48:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1760, "total_steps": 5309, "loss": 3.0377, "learning_rate": 1e-05, "epoch": 0.331453995456632, "percentage": 33.15, "elapsed_time": "5:50:46", "remaining_time": "11:47:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1765, "total_steps": 5309, "loss": 3.1311, "learning_rate": 1e-05, "epoch": 0.3323956261255429, "percentage": 33.25, "elapsed_time": "5:51:39", "remaining_time": "11:46:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1770, "total_steps": 5309, "loss": 3.0599, "learning_rate": 1e-05, "epoch": 0.3333372567944538, "percentage": 33.34, "elapsed_time": "5:52:32", "remaining_time": "11:44:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1775, "total_steps": 5309, "loss": 3.222, "learning_rate": 1e-05, "epoch": 0.3342788874633647, "percentage": 33.43, "elapsed_time": "5:53:25", "remaining_time": "11:43:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1780, "total_steps": 5309, "loss": 3.0587, "learning_rate": 1e-05, "epoch": 0.33522051813227555, "percentage": 33.53, "elapsed_time": "5:54:19", "remaining_time": "11:42:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1785, "total_steps": 5309, "loss": 3.2038, "learning_rate": 1e-05, "epoch": 0.33616214880118644, "percentage": 33.62, "elapsed_time": "5:55:12", "remaining_time": "11:41:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1790, "total_steps": 5309, "loss": 3.1324, "learning_rate": 1e-05, "epoch": 0.33710377947009734, "percentage": 33.72, "elapsed_time": "5:56:07", "remaining_time": "11:40:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1795, "total_steps": 5309, "loss": 3.1101, "learning_rate": 1e-05, "epoch": 0.33804541013900824, "percentage": 33.81, "elapsed_time": "5:57:01", "remaining_time": "11:38:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1800, "total_steps": 5309, "loss": 3.0915, "learning_rate": 1e-05, "epoch": 0.33898704080791914, "percentage": 33.9, "elapsed_time": "5:57:53", "remaining_time": "11:37:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1805, "total_steps": 5309, "loss": 3.2059, "learning_rate": 1e-05, "epoch": 0.33992867147683, "percentage": 34.0, "elapsed_time": "6:00:08", "remaining_time": "11:39:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1810, "total_steps": 5309, "loss": 3.1364, "learning_rate": 1e-05, "epoch": 0.3408703021457409, "percentage": 34.09, "elapsed_time": "6:01:02", "remaining_time": "11:37:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1815, "total_steps": 5309, "loss": 3.0507, "learning_rate": 1e-05, "epoch": 0.3418119328146518, "percentage": 34.19, "elapsed_time": "6:01:58", "remaining_time": "11:36:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1820, "total_steps": 5309, "loss": 3.0383, "learning_rate": 1e-05, "epoch": 0.3427535634835627, "percentage": 34.28, "elapsed_time": "6:02:51", "remaining_time": "11:35:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1825, "total_steps": 5309, "loss": 3.1888, "learning_rate": 1e-05, "epoch": 0.34369519415247357, "percentage": 34.38, "elapsed_time": "6:03:45", "remaining_time": "11:34:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1830, "total_steps": 5309, "loss": 3.089, "learning_rate": 1e-05, "epoch": 0.3446368248213844, "percentage": 34.47, "elapsed_time": "6:04:37", "remaining_time": "11:33:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1835, "total_steps": 5309, "loss": 3.1111, "learning_rate": 1e-05, "epoch": 0.3455784554902953, "percentage": 34.56, "elapsed_time": "6:05:30", "remaining_time": "11:31:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1840, "total_steps": 5309, "loss": 3.0944, "learning_rate": 1e-05, "epoch": 0.3465200861592062, "percentage": 34.66, "elapsed_time": "6:06:24", "remaining_time": "11:30:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1845, "total_steps": 5309, "loss": 3.1129, "learning_rate": 1e-05, "epoch": 0.3474617168281171, "percentage": 34.75, "elapsed_time": "6:07:19", "remaining_time": "11:29:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1850, "total_steps": 5309, "loss": 3.1843, "learning_rate": 1e-05, "epoch": 0.348403347497028, "percentage": 34.85, "elapsed_time": "6:08:13", "remaining_time": "11:28:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1855, "total_steps": 5309, "loss": 3.0514, "learning_rate": 1e-05, "epoch": 0.34934497816593885, "percentage": 34.94, "elapsed_time": "6:09:07", "remaining_time": "11:27:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1860, "total_steps": 5309, "loss": 3.1919, "learning_rate": 1e-05, "epoch": 0.35028660883484974, "percentage": 35.03, "elapsed_time": "6:09:59", "remaining_time": "11:26:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1865, "total_steps": 5309, "loss": 3.1084, "learning_rate": 1e-05, "epoch": 0.35122823950376064, "percentage": 35.13, "elapsed_time": "6:10:56", "remaining_time": "11:25:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1870, "total_steps": 5309, "loss": 3.0292, "learning_rate": 1e-05, "epoch": 0.35216987017267154, "percentage": 35.22, "elapsed_time": "6:11:51", "remaining_time": "11:23:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1875, "total_steps": 5309, "loss": 3.0266, "learning_rate": 1e-05, "epoch": 0.35311150084158244, "percentage": 35.32, "elapsed_time": "6:12:45", "remaining_time": "11:22:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1880, "total_steps": 5309, "loss": 3.1074, "learning_rate": 1e-05, "epoch": 0.3540531315104933, "percentage": 35.41, "elapsed_time": "6:13:39", "remaining_time": "11:21:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1885, "total_steps": 5309, "loss": 3.1157, "learning_rate": 1e-05, "epoch": 0.3549947621794042, "percentage": 35.51, "elapsed_time": "6:14:34", "remaining_time": "11:20:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1890, "total_steps": 5309, "loss": 3.0207, "learning_rate": 1e-05, "epoch": 0.3559363928483151, "percentage": 35.6, "elapsed_time": "6:15:27", "remaining_time": "11:19:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1895, "total_steps": 5309, "loss": 3.1247, "learning_rate": 1e-05, "epoch": 0.356878023517226, "percentage": 35.69, "elapsed_time": "6:16:19", "remaining_time": "11:17:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1900, "total_steps": 5309, "loss": 3.1562, "learning_rate": 1e-05, "epoch": 0.3578196541861368, "percentage": 35.79, "elapsed_time": "6:17:14", "remaining_time": "11:16:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1905, "total_steps": 5309, "loss": 3.0676, "learning_rate": 1e-05, "epoch": 0.3587612848550477, "percentage": 35.88, "elapsed_time": "6:18:09", "remaining_time": "11:15:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1910, "total_steps": 5309, "loss": 3.1094, "learning_rate": 1e-05, "epoch": 0.3597029155239586, "percentage": 35.98, "elapsed_time": "6:19:03", "remaining_time": "11:14:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1915, "total_steps": 5309, "loss": 3.12, "learning_rate": 1e-05, "epoch": 0.3606445461928695, "percentage": 36.07, "elapsed_time": "6:19:56", "remaining_time": "11:13:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1920, "total_steps": 5309, "loss": 3.189, "learning_rate": 1e-05, "epoch": 0.3615861768617804, "percentage": 36.17, "elapsed_time": "6:20:50", "remaining_time": "11:12:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1925, "total_steps": 5309, "loss": 3.1649, "learning_rate": 1e-05, "epoch": 0.36252780753069125, "percentage": 36.26, "elapsed_time": "6:21:45", "remaining_time": "11:11:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1930, "total_steps": 5309, "loss": 3.103, "learning_rate": 1e-05, "epoch": 0.36346943819960215, "percentage": 36.35, "elapsed_time": "6:22:41", "remaining_time": "11:10:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1935, "total_steps": 5309, "loss": 3.1464, "learning_rate": 1e-05, "epoch": 0.36441106886851304, "percentage": 36.45, "elapsed_time": "6:23:36", "remaining_time": "11:08:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1940, "total_steps": 5309, "loss": 3.0434, "learning_rate": 1e-05, "epoch": 0.36535269953742394, "percentage": 36.54, "elapsed_time": "6:24:29", "remaining_time": "11:07:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1945, "total_steps": 5309, "loss": 3.077, "learning_rate": 1e-05, "epoch": 0.36629433020633484, "percentage": 36.64, "elapsed_time": "6:25:23", "remaining_time": "11:06:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1950, "total_steps": 5309, "loss": 3.0714, "learning_rate": 1e-05, "epoch": 0.3672359608752457, "percentage": 36.73, "elapsed_time": "6:26:17", "remaining_time": "11:05:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1955, "total_steps": 5309, "loss": 3.1796, "learning_rate": 1e-05, "epoch": 0.3681775915441566, "percentage": 36.82, "elapsed_time": "6:27:17", "remaining_time": "11:04:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1960, "total_steps": 5309, "loss": 3.1673, "learning_rate": 1e-05, "epoch": 0.3691192222130675, "percentage": 36.92, "elapsed_time": "6:28:11", "remaining_time": "11:03:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1965, "total_steps": 5309, "loss": 2.955, "learning_rate": 1e-05, "epoch": 0.3700608528819784, "percentage": 37.01, "elapsed_time": "6:29:05", "remaining_time": "11:02:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1970, "total_steps": 5309, "loss": 2.9934, "learning_rate": 1e-05, "epoch": 0.3710024835508893, "percentage": 37.11, "elapsed_time": "6:29:58", "remaining_time": "11:00:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1975, "total_steps": 5309, "loss": 3.0656, "learning_rate": 1e-05, "epoch": 0.3719441142198001, "percentage": 37.2, "elapsed_time": "6:30:54", "remaining_time": "10:59:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1980, "total_steps": 5309, "loss": 3.2, "learning_rate": 1e-05, "epoch": 0.372885744888711, "percentage": 37.3, "elapsed_time": "6:31:45", "remaining_time": "10:58:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1985, "total_steps": 5309, "loss": 3.129, "learning_rate": 1e-05, "epoch": 0.3738273755576219, "percentage": 37.39, "elapsed_time": "6:32:39", "remaining_time": "10:57:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1990, "total_steps": 5309, "loss": 3.1392, "learning_rate": 1e-05, "epoch": 0.3747690062265328, "percentage": 37.48, "elapsed_time": "6:33:33", "remaining_time": "10:56:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1995, "total_steps": 5309, "loss": 3.1261, "learning_rate": 1e-05, "epoch": 0.3757106368954437, "percentage": 37.58, "elapsed_time": "6:34:29", "remaining_time": "10:55:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2000, "total_steps": 5309, "loss": 3.1165, "learning_rate": 1e-05, "epoch": 0.37665226756435455, "percentage": 37.67, "elapsed_time": "6:35:23", "remaining_time": "10:54:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2000, "total_steps": 5309, "eval_loss": 3.105938673019409, "epoch": 0.37665226756435455, "percentage": 37.67, "elapsed_time": "6:52:40", "remaining_time": "11:22:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2005, "total_steps": 5309, "loss": 3.0121, "learning_rate": 1e-05, "epoch": 0.37759389823326545, "percentage": 37.77, "elapsed_time": "6:54:54", "remaining_time": "11:23:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2010, "total_steps": 5309, "loss": 3.0836, "learning_rate": 1e-05, "epoch": 0.37853552890217634, "percentage": 37.86, "elapsed_time": "6:55:47", "remaining_time": "11:22:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2015, "total_steps": 5309, "loss": 3.0859, "learning_rate": 1e-05, "epoch": 0.37947715957108724, "percentage": 37.95, "elapsed_time": "6:56:40", "remaining_time": "11:21:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2020, "total_steps": 5309, "loss": 3.0992, "learning_rate": 1e-05, "epoch": 0.38041879023999814, "percentage": 38.05, "elapsed_time": "6:57:34", "remaining_time": "11:19:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2025, "total_steps": 5309, "loss": 3.0912, "learning_rate": 1e-05, "epoch": 0.381360420908909, "percentage": 38.14, "elapsed_time": "6:58:26", "remaining_time": "11:18:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2030, "total_steps": 5309, "loss": 3.0669, "learning_rate": 1e-05, "epoch": 0.3823020515778199, "percentage": 38.24, "elapsed_time": "6:59:20", "remaining_time": "11:17:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2035, "total_steps": 5309, "loss": 3.1704, "learning_rate": 1e-05, "epoch": 0.3832436822467308, "percentage": 38.33, "elapsed_time": "7:00:14", "remaining_time": "11:16:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2040, "total_steps": 5309, "loss": 3.0961, "learning_rate": 1e-05, "epoch": 0.3841853129156417, "percentage": 38.43, "elapsed_time": "7:01:08", "remaining_time": "11:14:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2045, "total_steps": 5309, "loss": 3.1942, "learning_rate": 1e-05, "epoch": 0.3851269435845526, "percentage": 38.52, "elapsed_time": "7:02:01", "remaining_time": "11:13:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2050, "total_steps": 5309, "loss": 3.0334, "learning_rate": 1e-05, "epoch": 0.3860685742534634, "percentage": 38.61, "elapsed_time": "7:02:55", "remaining_time": "11:12:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2055, "total_steps": 5309, "loss": 3.1301, "learning_rate": 1e-05, "epoch": 0.3870102049223743, "percentage": 38.71, "elapsed_time": "7:03:49", "remaining_time": "11:11:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2060, "total_steps": 5309, "loss": 3.0588, "learning_rate": 1e-05, "epoch": 0.3879518355912852, "percentage": 38.8, "elapsed_time": "7:04:43", "remaining_time": "11:09:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2065, "total_steps": 5309, "loss": 3.0914, "learning_rate": 1e-05, "epoch": 0.3888934662601961, "percentage": 38.9, "elapsed_time": "7:05:39", "remaining_time": "11:08:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2070, "total_steps": 5309, "loss": 3.1279, "learning_rate": 1e-05, "epoch": 0.389835096929107, "percentage": 38.99, "elapsed_time": "7:06:35", "remaining_time": "11:07:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2075, "total_steps": 5309, "loss": 3.0307, "learning_rate": 1e-05, "epoch": 0.39077672759801785, "percentage": 39.08, "elapsed_time": "7:07:29", "remaining_time": "11:06:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2080, "total_steps": 5309, "loss": 3.0223, "learning_rate": 1e-05, "epoch": 0.39171835826692875, "percentage": 39.18, "elapsed_time": "7:08:24", "remaining_time": "11:05:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2085, "total_steps": 5309, "loss": 3.107, "learning_rate": 1e-05, "epoch": 0.39265998893583964, "percentage": 39.27, "elapsed_time": "7:09:19", "remaining_time": "11:03:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2090, "total_steps": 5309, "loss": 3.1048, "learning_rate": 1e-05, "epoch": 0.39360161960475054, "percentage": 39.37, "elapsed_time": "7:10:11", "remaining_time": "11:02:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2095, "total_steps": 5309, "loss": 3.0824, "learning_rate": 1e-05, "epoch": 0.39454325027366144, "percentage": 39.46, "elapsed_time": "7:11:04", "remaining_time": "11:01:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2100, "total_steps": 5309, "loss": 3.0604, "learning_rate": 1e-05, "epoch": 0.3954848809425723, "percentage": 39.56, "elapsed_time": "7:11:59", "remaining_time": "11:00:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2105, "total_steps": 5309, "loss": 3.1625, "learning_rate": 1e-05, "epoch": 0.3964265116114832, "percentage": 39.65, "elapsed_time": "7:12:54", "remaining_time": "10:58:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2110, "total_steps": 5309, "loss": 3.0494, "learning_rate": 1e-05, "epoch": 0.3973681422803941, "percentage": 39.74, "elapsed_time": "7:13:47", "remaining_time": "10:57:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2115, "total_steps": 5309, "loss": 3.1758, "learning_rate": 1e-05, "epoch": 0.398309772949305, "percentage": 39.84, "elapsed_time": "7:14:42", "remaining_time": "10:56:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2120, "total_steps": 5309, "loss": 3.1234, "learning_rate": 1e-05, "epoch": 0.39925140361821587, "percentage": 39.93, "elapsed_time": "7:15:35", "remaining_time": "10:55:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2125, "total_steps": 5309, "loss": 3.013, "learning_rate": 1e-05, "epoch": 0.4001930342871267, "percentage": 40.03, "elapsed_time": "7:16:32", "remaining_time": "10:54:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2130, "total_steps": 5309, "loss": 3.1199, "learning_rate": 1e-05, "epoch": 0.4011346649560376, "percentage": 40.12, "elapsed_time": "7:17:25", "remaining_time": "10:52:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2135, "total_steps": 5309, "loss": 3.0762, "learning_rate": 1e-05, "epoch": 0.4020762956249485, "percentage": 40.21, "elapsed_time": "7:18:20", "remaining_time": "10:51:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2140, "total_steps": 5309, "loss": 3.053, "learning_rate": 1e-05, "epoch": 0.4030179262938594, "percentage": 40.31, "elapsed_time": "7:19:14", "remaining_time": "10:50:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2145, "total_steps": 5309, "loss": 3.1715, "learning_rate": 1e-05, "epoch": 0.40395955696277025, "percentage": 40.4, "elapsed_time": "7:20:10", "remaining_time": "10:49:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2150, "total_steps": 5309, "loss": 3.093, "learning_rate": 1e-05, "epoch": 0.40490118763168115, "percentage": 40.5, "elapsed_time": "7:21:03", "remaining_time": "10:48:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2155, "total_steps": 5309, "loss": 3.0454, "learning_rate": 1e-05, "epoch": 0.40584281830059205, "percentage": 40.59, "elapsed_time": "7:21:58", "remaining_time": "10:46:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2160, "total_steps": 5309, "loss": 3.1014, "learning_rate": 1e-05, "epoch": 0.40678444896950294, "percentage": 40.69, "elapsed_time": "7:22:49", "remaining_time": "10:45:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2165, "total_steps": 5309, "loss": 3.1274, "learning_rate": 1e-05, "epoch": 0.40772607963841384, "percentage": 40.78, "elapsed_time": "7:23:43", "remaining_time": "10:44:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2170, "total_steps": 5309, "loss": 3.0354, "learning_rate": 1e-05, "epoch": 0.4086677103073247, "percentage": 40.87, "elapsed_time": "7:24:39", "remaining_time": "10:43:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2175, "total_steps": 5309, "loss": 3.0585, "learning_rate": 1e-05, "epoch": 0.4096093409762356, "percentage": 40.97, "elapsed_time": "7:25:31", "remaining_time": "10:41:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2180, "total_steps": 5309, "loss": 3.0792, "learning_rate": 1e-05, "epoch": 0.4105509716451465, "percentage": 41.06, "elapsed_time": "7:26:26", "remaining_time": "10:40:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2185, "total_steps": 5309, "loss": 3.1141, "learning_rate": 1e-05, "epoch": 0.4114926023140574, "percentage": 41.16, "elapsed_time": "7:27:20", "remaining_time": "10:39:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2190, "total_steps": 5309, "loss": 3.0372, "learning_rate": 1e-05, "epoch": 0.4124342329829683, "percentage": 41.25, "elapsed_time": "7:28:16", "remaining_time": "10:38:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2195, "total_steps": 5309, "loss": 3.0653, "learning_rate": 1e-05, "epoch": 0.4133758636518791, "percentage": 41.34, "elapsed_time": "7:29:09", "remaining_time": "10:37:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2200, "total_steps": 5309, "loss": 3.1723, "learning_rate": 1e-05, "epoch": 0.41431749432079, "percentage": 41.44, "elapsed_time": "7:30:04", "remaining_time": "10:36:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2205, "total_steps": 5309, "loss": 3.1088, "learning_rate": 1e-05, "epoch": 0.4152591249897009, "percentage": 41.53, "elapsed_time": "7:32:17", "remaining_time": "10:36:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2210, "total_steps": 5309, "loss": 3.1864, "learning_rate": 1e-05, "epoch": 0.4162007556586118, "percentage": 41.63, "elapsed_time": "7:33:12", "remaining_time": "10:35:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2215, "total_steps": 5309, "loss": 3.1957, "learning_rate": 1e-05, "epoch": 0.4171423863275227, "percentage": 41.72, "elapsed_time": "7:34:05", "remaining_time": "10:34:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2220, "total_steps": 5309, "loss": 3.1946, "learning_rate": 1e-05, "epoch": 0.41808401699643355, "percentage": 41.82, "elapsed_time": "7:34:58", "remaining_time": "10:33:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2225, "total_steps": 5309, "loss": 3.0261, "learning_rate": 1e-05, "epoch": 0.41902564766534445, "percentage": 41.91, "elapsed_time": "7:35:53", "remaining_time": "10:31:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2230, "total_steps": 5309, "loss": 3.0848, "learning_rate": 1e-05, "epoch": 0.41996727833425535, "percentage": 42.0, "elapsed_time": "7:36:49", "remaining_time": "10:30:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2235, "total_steps": 5309, "loss": 3.0151, "learning_rate": 1e-05, "epoch": 0.42090890900316624, "percentage": 42.1, "elapsed_time": "7:37:43", "remaining_time": "10:29:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2240, "total_steps": 5309, "loss": 2.9477, "learning_rate": 1e-05, "epoch": 0.42185053967207714, "percentage": 42.19, "elapsed_time": "7:38:41", "remaining_time": "10:28:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2245, "total_steps": 5309, "loss": 3.0536, "learning_rate": 1e-05, "epoch": 0.422792170340988, "percentage": 42.29, "elapsed_time": "7:39:36", "remaining_time": "10:27:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2250, "total_steps": 5309, "loss": 3.0879, "learning_rate": 1e-05, "epoch": 0.4237338010098989, "percentage": 42.38, "elapsed_time": "7:40:30", "remaining_time": "10:26:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2255, "total_steps": 5309, "loss": 3.0493, "learning_rate": 1e-05, "epoch": 0.4246754316788098, "percentage": 42.48, "elapsed_time": "7:41:24", "remaining_time": "10:24:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2260, "total_steps": 5309, "loss": 2.9738, "learning_rate": 1e-05, "epoch": 0.4256170623477207, "percentage": 42.57, "elapsed_time": "7:42:17", "remaining_time": "10:23:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2265, "total_steps": 5309, "loss": 3.2125, "learning_rate": 1e-05, "epoch": 0.4265586930166316, "percentage": 42.66, "elapsed_time": "7:43:11", "remaining_time": "10:22:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2270, "total_steps": 5309, "loss": 3.1131, "learning_rate": 1e-05, "epoch": 0.4275003236855424, "percentage": 42.76, "elapsed_time": "7:44:06", "remaining_time": "10:21:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2275, "total_steps": 5309, "loss": 3.0646, "learning_rate": 1e-05, "epoch": 0.4284419543544533, "percentage": 42.85, "elapsed_time": "7:45:00", "remaining_time": "10:20:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2280, "total_steps": 5309, "loss": 3.1952, "learning_rate": 1e-05, "epoch": 0.4293835850233642, "percentage": 42.95, "elapsed_time": "7:45:51", "remaining_time": "10:18:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2285, "total_steps": 5309, "loss": 3.1168, "learning_rate": 1e-05, "epoch": 0.4303252156922751, "percentage": 43.04, "elapsed_time": "7:46:47", "remaining_time": "10:17:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2290, "total_steps": 5309, "loss": 3.126, "learning_rate": 1e-05, "epoch": 0.431266846361186, "percentage": 43.13, "elapsed_time": "7:47:40", "remaining_time": "10:16:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2295, "total_steps": 5309, "loss": 3.0791, "learning_rate": 1e-05, "epoch": 0.43220847703009685, "percentage": 43.23, "elapsed_time": "7:48:33", "remaining_time": "10:15:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2300, "total_steps": 5309, "loss": 3.1876, "learning_rate": 1e-05, "epoch": 0.43315010769900775, "percentage": 43.32, "elapsed_time": "7:49:26", "remaining_time": "10:14:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2305, "total_steps": 5309, "loss": 3.0427, "learning_rate": 1e-05, "epoch": 0.43409173836791864, "percentage": 43.42, "elapsed_time": "7:50:19", "remaining_time": "10:12:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2310, "total_steps": 5309, "loss": 3.1455, "learning_rate": 1e-05, "epoch": 0.43503336903682954, "percentage": 43.51, "elapsed_time": "7:51:12", "remaining_time": "10:11:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2315, "total_steps": 5309, "loss": 3.0863, "learning_rate": 1e-05, "epoch": 0.43597499970574044, "percentage": 43.61, "elapsed_time": "7:52:05", "remaining_time": "10:10:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2320, "total_steps": 5309, "loss": 3.1586, "learning_rate": 1e-05, "epoch": 0.4369166303746513, "percentage": 43.7, "elapsed_time": "7:52:58", "remaining_time": "10:09:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2325, "total_steps": 5309, "loss": 3.1336, "learning_rate": 1e-05, "epoch": 0.4378582610435622, "percentage": 43.79, "elapsed_time": "7:53:52", "remaining_time": "10:08:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2330, "total_steps": 5309, "loss": 3.05, "learning_rate": 1e-05, "epoch": 0.4387998917124731, "percentage": 43.89, "elapsed_time": "7:54:46", "remaining_time": "10:07:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2335, "total_steps": 5309, "loss": 3.0782, "learning_rate": 1e-05, "epoch": 0.439741522381384, "percentage": 43.98, "elapsed_time": "7:55:39", "remaining_time": "10:05:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2340, "total_steps": 5309, "loss": 3.113, "learning_rate": 1e-05, "epoch": 0.4406831530502949, "percentage": 44.08, "elapsed_time": "7:56:31", "remaining_time": "10:04:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2345, "total_steps": 5309, "loss": 3.0913, "learning_rate": 1e-05, "epoch": 0.4416247837192057, "percentage": 44.17, "elapsed_time": "7:57:25", "remaining_time": "10:03:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2350, "total_steps": 5309, "loss": 3.1279, "learning_rate": 1e-05, "epoch": 0.4425664143881166, "percentage": 44.26, "elapsed_time": "7:58:21", "remaining_time": "10:02:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2355, "total_steps": 5309, "loss": 3.1026, "learning_rate": 1e-05, "epoch": 0.4435080450570275, "percentage": 44.36, "elapsed_time": "7:59:13", "remaining_time": "10:01:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2360, "total_steps": 5309, "loss": 3.1523, "learning_rate": 1e-05, "epoch": 0.4444496757259384, "percentage": 44.45, "elapsed_time": "8:00:10", "remaining_time": "10:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2365, "total_steps": 5309, "loss": 3.0798, "learning_rate": 1e-05, "epoch": 0.4453913063948493, "percentage": 44.55, "elapsed_time": "8:01:04", "remaining_time": "9:58:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2370, "total_steps": 5309, "loss": 3.1813, "learning_rate": 1e-05, "epoch": 0.44633293706376015, "percentage": 44.64, "elapsed_time": "8:01:57", "remaining_time": "9:57:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2375, "total_steps": 5309, "loss": 3.0597, "learning_rate": 1e-05, "epoch": 0.44727456773267105, "percentage": 44.74, "elapsed_time": "8:02:50", "remaining_time": "9:56:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2380, "total_steps": 5309, "loss": 3.0837, "learning_rate": 1e-05, "epoch": 0.44821619840158194, "percentage": 44.83, "elapsed_time": "8:03:45", "remaining_time": "9:55:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2385, "total_steps": 5309, "loss": 2.9755, "learning_rate": 1e-05, "epoch": 0.44915782907049284, "percentage": 44.92, "elapsed_time": "8:04:40", "remaining_time": "9:54:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2390, "total_steps": 5309, "loss": 3.0906, "learning_rate": 1e-05, "epoch": 0.45009945973940374, "percentage": 45.02, "elapsed_time": "8:05:37", "remaining_time": "9:53:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2395, "total_steps": 5309, "loss": 3.0489, "learning_rate": 1e-05, "epoch": 0.4510410904083146, "percentage": 45.11, "elapsed_time": "8:06:30", "remaining_time": "9:51:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2400, "total_steps": 5309, "loss": 3.1248, "learning_rate": 1e-05, "epoch": 0.4519827210772255, "percentage": 45.21, "elapsed_time": "8:07:23", "remaining_time": "9:50:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2405, "total_steps": 5309, "loss": 3.1008, "learning_rate": 1e-05, "epoch": 0.4529243517461364, "percentage": 45.3, "elapsed_time": "8:09:38", "remaining_time": "9:51:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2410, "total_steps": 5309, "loss": 3.1117, "learning_rate": 1e-05, "epoch": 0.4538659824150473, "percentage": 45.39, "elapsed_time": "8:10:30", "remaining_time": "9:50:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2415, "total_steps": 5309, "loss": 3.1321, "learning_rate": 1e-05, "epoch": 0.4548076130839581, "percentage": 45.49, "elapsed_time": "8:11:25", "remaining_time": "9:48:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2420, "total_steps": 5309, "loss": 3.1185, "learning_rate": 1e-05, "epoch": 0.455749243752869, "percentage": 45.58, "elapsed_time": "8:12:21", "remaining_time": "9:47:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2425, "total_steps": 5309, "loss": 3.0592, "learning_rate": 1e-05, "epoch": 0.4566908744217799, "percentage": 45.68, "elapsed_time": "8:13:16", "remaining_time": "9:46:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2430, "total_steps": 5309, "loss": 3.1555, "learning_rate": 1e-05, "epoch": 0.4576325050906908, "percentage": 45.77, "elapsed_time": "8:14:08", "remaining_time": "9:45:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2435, "total_steps": 5309, "loss": 3.0891, "learning_rate": 1e-05, "epoch": 0.4585741357596017, "percentage": 45.87, "elapsed_time": "8:15:02", "remaining_time": "9:44:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2440, "total_steps": 5309, "loss": 2.9779, "learning_rate": 1e-05, "epoch": 0.45951576642851255, "percentage": 45.96, "elapsed_time": "8:15:57", "remaining_time": "9:43:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2445, "total_steps": 5309, "loss": 3.0613, "learning_rate": 1e-05, "epoch": 0.46045739709742345, "percentage": 46.05, "elapsed_time": "8:16:51", "remaining_time": "9:42:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2450, "total_steps": 5309, "loss": 2.9949, "learning_rate": 1e-05, "epoch": 0.46139902776633435, "percentage": 46.15, "elapsed_time": "8:17:45", "remaining_time": "9:40:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2455, "total_steps": 5309, "loss": 3.1089, "learning_rate": 1e-05, "epoch": 0.46234065843524524, "percentage": 46.24, "elapsed_time": "8:18:40", "remaining_time": "9:39:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2460, "total_steps": 5309, "loss": 2.9965, "learning_rate": 1e-05, "epoch": 0.46328228910415614, "percentage": 46.34, "elapsed_time": "8:19:34", "remaining_time": "9:38:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2465, "total_steps": 5309, "loss": 3.0439, "learning_rate": 1e-05, "epoch": 0.464223919773067, "percentage": 46.43, "elapsed_time": "8:20:27", "remaining_time": "9:37:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2470, "total_steps": 5309, "loss": 3.0025, "learning_rate": 1e-05, "epoch": 0.4651655504419779, "percentage": 46.52, "elapsed_time": "8:21:21", "remaining_time": "9:36:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2475, "total_steps": 5309, "loss": 3.0738, "learning_rate": 1e-05, "epoch": 0.4661071811108888, "percentage": 46.62, "elapsed_time": "8:22:15", "remaining_time": "9:35:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2480, "total_steps": 5309, "loss": 2.9749, "learning_rate": 1e-05, "epoch": 0.4670488117797997, "percentage": 46.71, "elapsed_time": "8:23:10", "remaining_time": "9:33:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2485, "total_steps": 5309, "loss": 3.0647, "learning_rate": 1e-05, "epoch": 0.4679904424487106, "percentage": 46.81, "elapsed_time": "8:24:03", "remaining_time": "9:32:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2490, "total_steps": 5309, "loss": 3.0231, "learning_rate": 1e-05, "epoch": 0.4689320731176214, "percentage": 46.9, "elapsed_time": "8:24:57", "remaining_time": "9:31:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2495, "total_steps": 5309, "loss": 3.0132, "learning_rate": 1e-05, "epoch": 0.4698737037865323, "percentage": 47.0, "elapsed_time": "8:25:50", "remaining_time": "9:30:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2500, "total_steps": 5309, "loss": 3.0343, "learning_rate": 1e-05, "epoch": 0.4708153344554432, "percentage": 47.09, "elapsed_time": "8:26:45", "remaining_time": "9:29:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2505, "total_steps": 5309, "loss": 3.0681, "learning_rate": 1e-05, "epoch": 0.4717569651243541, "percentage": 47.18, "elapsed_time": "8:27:39", "remaining_time": "9:28:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2510, "total_steps": 5309, "loss": 3.1242, "learning_rate": 1e-05, "epoch": 0.472698595793265, "percentage": 47.28, "elapsed_time": "8:28:33", "remaining_time": "9:27:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2515, "total_steps": 5309, "loss": 3.0638, "learning_rate": 1e-05, "epoch": 0.47364022646217585, "percentage": 47.37, "elapsed_time": "8:29:25", "remaining_time": "9:25:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2520, "total_steps": 5309, "loss": 3.0472, "learning_rate": 1e-05, "epoch": 0.47458185713108675, "percentage": 47.47, "elapsed_time": "8:30:18", "remaining_time": "9:24:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2525, "total_steps": 5309, "loss": 3.1256, "learning_rate": 1e-05, "epoch": 0.47552348779999765, "percentage": 47.56, "elapsed_time": "8:31:12", "remaining_time": "9:23:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2530, "total_steps": 5309, "loss": 3.0334, "learning_rate": 1e-05, "epoch": 0.47646511846890854, "percentage": 47.65, "elapsed_time": "8:32:06", "remaining_time": "9:22:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2535, "total_steps": 5309, "loss": 3.1666, "learning_rate": 1e-05, "epoch": 0.47740674913781944, "percentage": 47.75, "elapsed_time": "8:33:01", "remaining_time": "9:21:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2540, "total_steps": 5309, "loss": 3.1129, "learning_rate": 1e-05, "epoch": 0.4783483798067303, "percentage": 47.84, "elapsed_time": "8:33:55", "remaining_time": "9:20:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2545, "total_steps": 5309, "loss": 3.0084, "learning_rate": 1e-05, "epoch": 0.4792900104756412, "percentage": 47.94, "elapsed_time": "8:34:48", "remaining_time": "9:19:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2550, "total_steps": 5309, "loss": 3.0855, "learning_rate": 1e-05, "epoch": 0.4802316411445521, "percentage": 48.03, "elapsed_time": "8:35:42", "remaining_time": "9:17:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2555, "total_steps": 5309, "loss": 2.9989, "learning_rate": 1e-05, "epoch": 0.481173271813463, "percentage": 48.13, "elapsed_time": "8:36:36", "remaining_time": "9:16:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2560, "total_steps": 5309, "loss": 2.9992, "learning_rate": 1e-05, "epoch": 0.4821149024823739, "percentage": 48.22, "elapsed_time": "8:37:31", "remaining_time": "9:15:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2565, "total_steps": 5309, "loss": 2.996, "learning_rate": 1e-05, "epoch": 0.4830565331512847, "percentage": 48.31, "elapsed_time": "8:38:25", "remaining_time": "9:14:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2570, "total_steps": 5309, "loss": 3.0643, "learning_rate": 1e-05, "epoch": 0.4839981638201956, "percentage": 48.41, "elapsed_time": "8:39:19", "remaining_time": "9:13:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2575, "total_steps": 5309, "loss": 3.1647, "learning_rate": 1e-05, "epoch": 0.4849397944891065, "percentage": 48.5, "elapsed_time": "8:40:11", "remaining_time": "9:12:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2580, "total_steps": 5309, "loss": 3.0211, "learning_rate": 1e-05, "epoch": 0.4858814251580174, "percentage": 48.6, "elapsed_time": "8:41:04", "remaining_time": "9:11:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2585, "total_steps": 5309, "loss": 3.0319, "learning_rate": 1e-05, "epoch": 0.4868230558269283, "percentage": 48.69, "elapsed_time": "8:42:00", "remaining_time": "9:10:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2590, "total_steps": 5309, "loss": 3.0748, "learning_rate": 1e-05, "epoch": 0.48776468649583915, "percentage": 48.79, "elapsed_time": "8:42:53", "remaining_time": "9:08:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2595, "total_steps": 5309, "loss": 3.0973, "learning_rate": 1e-05, "epoch": 0.48870631716475005, "percentage": 48.88, "elapsed_time": "8:43:48", "remaining_time": "9:07:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2600, "total_steps": 5309, "loss": 3.0398, "learning_rate": 1e-05, "epoch": 0.48964794783366095, "percentage": 48.97, "elapsed_time": "8:44:41", "remaining_time": "9:06:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2605, "total_steps": 5309, "loss": 3.16, "learning_rate": 1e-05, "epoch": 0.49058957850257184, "percentage": 49.07, "elapsed_time": "8:46:56", "remaining_time": "9:06:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2610, "total_steps": 5309, "loss": 3.0305, "learning_rate": 1e-05, "epoch": 0.49153120917148274, "percentage": 49.16, "elapsed_time": "8:47:50", "remaining_time": "9:05:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2615, "total_steps": 5309, "loss": 3.0226, "learning_rate": 1e-05, "epoch": 0.4924728398403936, "percentage": 49.26, "elapsed_time": "8:48:44", "remaining_time": "9:04:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2620, "total_steps": 5309, "loss": 3.0626, "learning_rate": 1e-05, "epoch": 0.4934144705093045, "percentage": 49.35, "elapsed_time": "8:49:37", "remaining_time": "9:03:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2625, "total_steps": 5309, "loss": 3.1405, "learning_rate": 1e-05, "epoch": 0.4943561011782154, "percentage": 49.44, "elapsed_time": "8:50:30", "remaining_time": "9:02:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2630, "total_steps": 5309, "loss": 2.9996, "learning_rate": 1e-05, "epoch": 0.4952977318471263, "percentage": 49.54, "elapsed_time": "8:51:24", "remaining_time": "9:01:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2635, "total_steps": 5309, "loss": 3.0108, "learning_rate": 1e-05, "epoch": 0.4962393625160372, "percentage": 49.63, "elapsed_time": "8:52:16", "remaining_time": "9:00:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2640, "total_steps": 5309, "loss": 3.1121, "learning_rate": 1e-05, "epoch": 0.497180993184948, "percentage": 49.73, "elapsed_time": "8:53:10", "remaining_time": "8:59:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2645, "total_steps": 5309, "loss": 3.1481, "learning_rate": 1e-05, "epoch": 0.4981226238538589, "percentage": 49.82, "elapsed_time": "8:54:01", "remaining_time": "8:57:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2650, "total_steps": 5309, "loss": 3.1499, "learning_rate": 1e-05, "epoch": 0.4990642545227698, "percentage": 49.92, "elapsed_time": "8:54:55", "remaining_time": "8:56:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2655, "total_steps": 5309, "loss": 3.0624, "learning_rate": 1e-05, "epoch": 0.5000058851916807, "percentage": 50.01, "elapsed_time": "8:55:49", "remaining_time": "8:55:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2660, "total_steps": 5309, "loss": 2.9495, "learning_rate": 1e-05, "epoch": 0.5009475158605916, "percentage": 50.1, "elapsed_time": "8:56:45", "remaining_time": "8:54:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2665, "total_steps": 5309, "loss": 2.9833, "learning_rate": 1e-05, "epoch": 0.5018891465295025, "percentage": 50.2, "elapsed_time": "8:57:36", "remaining_time": "8:53:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2670, "total_steps": 5309, "loss": 3.1446, "learning_rate": 1e-05, "epoch": 0.5028307771984134, "percentage": 50.29, "elapsed_time": "8:58:31", "remaining_time": "8:52:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2675, "total_steps": 5309, "loss": 3.1812, "learning_rate": 1e-05, "epoch": 0.5037724078673242, "percentage": 50.39, "elapsed_time": "8:59:23", "remaining_time": "8:51:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2680, "total_steps": 5309, "loss": 3.0981, "learning_rate": 1e-05, "epoch": 0.5047140385362351, "percentage": 50.48, "elapsed_time": "9:00:16", "remaining_time": "8:49:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2685, "total_steps": 5309, "loss": 3.0404, "learning_rate": 1e-05, "epoch": 0.505655669205146, "percentage": 50.57, "elapsed_time": "9:01:12", "remaining_time": "8:48:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2690, "total_steps": 5309, "loss": 3.0807, "learning_rate": 1e-05, "epoch": 0.5065972998740569, "percentage": 50.67, "elapsed_time": "9:02:06", "remaining_time": "8:47:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2695, "total_steps": 5309, "loss": 3.0895, "learning_rate": 1e-05, "epoch": 0.5075389305429678, "percentage": 50.76, "elapsed_time": "9:03:00", "remaining_time": "8:46:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2700, "total_steps": 5309, "loss": 3.0731, "learning_rate": 1e-05, "epoch": 0.5084805612118787, "percentage": 50.86, "elapsed_time": "9:03:52", "remaining_time": "8:45:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2705, "total_steps": 5309, "loss": 3.0837, "learning_rate": 1e-05, "epoch": 0.5094221918807895, "percentage": 50.95, "elapsed_time": "9:04:47", "remaining_time": "8:44:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2710, "total_steps": 5309, "loss": 2.9995, "learning_rate": 1e-05, "epoch": 0.5103638225497005, "percentage": 51.05, "elapsed_time": "9:05:41", "remaining_time": "8:43:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2715, "total_steps": 5309, "loss": 3.1655, "learning_rate": 1e-05, "epoch": 0.5113054532186113, "percentage": 51.14, "elapsed_time": "9:06:34", "remaining_time": "8:42:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2720, "total_steps": 5309, "loss": 3.0245, "learning_rate": 1e-05, "epoch": 0.5122470838875223, "percentage": 51.23, "elapsed_time": "9:07:29", "remaining_time": "8:41:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2725, "total_steps": 5309, "loss": 3.0993, "learning_rate": 1e-05, "epoch": 0.5131887145564331, "percentage": 51.33, "elapsed_time": "9:08:19", "remaining_time": "8:39:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2730, "total_steps": 5309, "loss": 3.0897, "learning_rate": 1e-05, "epoch": 0.514130345225344, "percentage": 51.42, "elapsed_time": "9:09:14", "remaining_time": "8:38:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2735, "total_steps": 5309, "loss": 2.9622, "learning_rate": 1e-05, "epoch": 0.5150719758942549, "percentage": 51.52, "elapsed_time": "9:10:09", "remaining_time": "8:37:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2740, "total_steps": 5309, "loss": 3.1474, "learning_rate": 1e-05, "epoch": 0.5160136065631657, "percentage": 51.61, "elapsed_time": "9:11:03", "remaining_time": "8:36:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2745, "total_steps": 5309, "loss": 3.095, "learning_rate": 1e-05, "epoch": 0.5169552372320767, "percentage": 51.7, "elapsed_time": "9:11:56", "remaining_time": "8:35:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2750, "total_steps": 5309, "loss": 3.1509, "learning_rate": 1e-05, "epoch": 0.5178968679009875, "percentage": 51.8, "elapsed_time": "9:12:48", "remaining_time": "8:34:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2755, "total_steps": 5309, "loss": 3.0771, "learning_rate": 1e-05, "epoch": 0.5188384985698984, "percentage": 51.89, "elapsed_time": "9:13:43", "remaining_time": "8:33:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2760, "total_steps": 5309, "loss": 2.9578, "learning_rate": 1e-05, "epoch": 0.5197801292388093, "percentage": 51.99, "elapsed_time": "9:14:35", "remaining_time": "8:32:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2765, "total_steps": 5309, "loss": 3.0864, "learning_rate": 1e-05, "epoch": 0.5207217599077202, "percentage": 52.08, "elapsed_time": "9:15:29", "remaining_time": "8:31:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2770, "total_steps": 5309, "loss": 2.9654, "learning_rate": 1e-05, "epoch": 0.5216633905766311, "percentage": 52.18, "elapsed_time": "9:16:22", "remaining_time": "8:29:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2775, "total_steps": 5309, "loss": 2.9616, "learning_rate": 1e-05, "epoch": 0.522605021245542, "percentage": 52.27, "elapsed_time": "9:17:16", "remaining_time": "8:28:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2780, "total_steps": 5309, "loss": 3.1041, "learning_rate": 1e-05, "epoch": 0.5235466519144528, "percentage": 52.36, "elapsed_time": "9:18:10", "remaining_time": "8:27:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2785, "total_steps": 5309, "loss": 3.1307, "learning_rate": 1e-05, "epoch": 0.5244882825833638, "percentage": 52.46, "elapsed_time": "9:19:04", "remaining_time": "8:26:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2790, "total_steps": 5309, "loss": 3.0366, "learning_rate": 1e-05, "epoch": 0.5254299132522746, "percentage": 52.55, "elapsed_time": "9:19:58", "remaining_time": "8:25:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2795, "total_steps": 5309, "loss": 3.0846, "learning_rate": 1e-05, "epoch": 0.5263715439211855, "percentage": 52.65, "elapsed_time": "9:20:50", "remaining_time": "8:24:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2800, "total_steps": 5309, "loss": 3.161, "learning_rate": 1e-05, "epoch": 0.5273131745900964, "percentage": 52.74, "elapsed_time": "9:21:45", "remaining_time": "8:23:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2805, "total_steps": 5309, "loss": 3.0004, "learning_rate": 1e-05, "epoch": 0.5282548052590073, "percentage": 52.83, "elapsed_time": "9:23:58", "remaining_time": "8:23:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2810, "total_steps": 5309, "loss": 3.0108, "learning_rate": 1e-05, "epoch": 0.5291964359279182, "percentage": 52.93, "elapsed_time": "9:24:51", "remaining_time": "8:22:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2815, "total_steps": 5309, "loss": 3.0985, "learning_rate": 1e-05, "epoch": 0.530138066596829, "percentage": 53.02, "elapsed_time": "9:25:44", "remaining_time": "8:21:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2820, "total_steps": 5309, "loss": 3.081, "learning_rate": 1e-05, "epoch": 0.5310796972657399, "percentage": 53.12, "elapsed_time": "9:26:36", "remaining_time": "8:20:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2825, "total_steps": 5309, "loss": 3.1838, "learning_rate": 1e-05, "epoch": 0.5320213279346508, "percentage": 53.21, "elapsed_time": "9:27:31", "remaining_time": "8:19:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2830, "total_steps": 5309, "loss": 3.12, "learning_rate": 1e-05, "epoch": 0.5329629586035617, "percentage": 53.31, "elapsed_time": "9:28:23", "remaining_time": "8:17:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2835, "total_steps": 5309, "loss": 3.0373, "learning_rate": 1e-05, "epoch": 0.5339045892724726, "percentage": 53.4, "elapsed_time": "9:29:19", "remaining_time": "8:16:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2840, "total_steps": 5309, "loss": 3.0716, "learning_rate": 1e-05, "epoch": 0.5348462199413835, "percentage": 53.49, "elapsed_time": "9:30:12", "remaining_time": "8:15:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2845, "total_steps": 5309, "loss": 2.9321, "learning_rate": 1e-05, "epoch": 0.5357878506102943, "percentage": 53.59, "elapsed_time": "9:31:08", "remaining_time": "8:14:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2850, "total_steps": 5309, "loss": 3.1087, "learning_rate": 1e-05, "epoch": 0.5367294812792053, "percentage": 53.68, "elapsed_time": "9:32:01", "remaining_time": "8:13:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2855, "total_steps": 5309, "loss": 3.0788, "learning_rate": 1e-05, "epoch": 0.5376711119481161, "percentage": 53.78, "elapsed_time": "9:32:55", "remaining_time": "8:12:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2860, "total_steps": 5309, "loss": 3.1399, "learning_rate": 1e-05, "epoch": 0.5386127426170271, "percentage": 53.87, "elapsed_time": "9:33:49", "remaining_time": "8:11:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2865, "total_steps": 5309, "loss": 3.0926, "learning_rate": 1e-05, "epoch": 0.5395543732859379, "percentage": 53.96, "elapsed_time": "9:34:44", "remaining_time": "8:10:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2870, "total_steps": 5309, "loss": 3.0853, "learning_rate": 1e-05, "epoch": 0.5404960039548488, "percentage": 54.06, "elapsed_time": "9:35:37", "remaining_time": "8:09:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2875, "total_steps": 5309, "loss": 2.8899, "learning_rate": 1e-05, "epoch": 0.5414376346237597, "percentage": 54.15, "elapsed_time": "9:36:32", "remaining_time": "8:08:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2880, "total_steps": 5309, "loss": 3.1303, "learning_rate": 1e-05, "epoch": 0.5423792652926706, "percentage": 54.25, "elapsed_time": "9:37:24", "remaining_time": "8:06:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2885, "total_steps": 5309, "loss": 3.1267, "learning_rate": 1e-05, "epoch": 0.5433208959615815, "percentage": 54.34, "elapsed_time": "9:38:18", "remaining_time": "8:05:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2890, "total_steps": 5309, "loss": 3.1023, "learning_rate": 1e-05, "epoch": 0.5442625266304923, "percentage": 54.44, "elapsed_time": "9:39:10", "remaining_time": "8:04:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2895, "total_steps": 5309, "loss": 3.1474, "learning_rate": 1e-05, "epoch": 0.5452041572994032, "percentage": 54.53, "elapsed_time": "9:40:03", "remaining_time": "8:03:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2900, "total_steps": 5309, "loss": 2.9699, "learning_rate": 1e-05, "epoch": 0.5461457879683141, "percentage": 54.62, "elapsed_time": "9:40:58", "remaining_time": "8:02:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2905, "total_steps": 5309, "loss": 3.2087, "learning_rate": 1e-05, "epoch": 0.547087418637225, "percentage": 54.72, "elapsed_time": "9:41:51", "remaining_time": "8:01:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2910, "total_steps": 5309, "loss": 3.0275, "learning_rate": 1e-05, "epoch": 0.5480290493061359, "percentage": 54.81, "elapsed_time": "9:42:45", "remaining_time": "8:00:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2915, "total_steps": 5309, "loss": 3.119, "learning_rate": 1e-05, "epoch": 0.5489706799750468, "percentage": 54.91, "elapsed_time": "9:43:37", "remaining_time": "7:59:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2920, "total_steps": 5309, "loss": 3.0491, "learning_rate": 1e-05, "epoch": 0.5499123106439576, "percentage": 55.0, "elapsed_time": "9:44:30", "remaining_time": "7:58:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2925, "total_steps": 5309, "loss": 2.9752, "learning_rate": 1e-05, "epoch": 0.5508539413128686, "percentage": 55.1, "elapsed_time": "9:45:22", "remaining_time": "7:57:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2930, "total_steps": 5309, "loss": 3.188, "learning_rate": 1e-05, "epoch": 0.5517955719817794, "percentage": 55.19, "elapsed_time": "9:46:17", "remaining_time": "7:56:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2935, "total_steps": 5309, "loss": 3.01, "learning_rate": 1e-05, "epoch": 0.5527372026506904, "percentage": 55.28, "elapsed_time": "9:47:12", "remaining_time": "7:54:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2940, "total_steps": 5309, "loss": 2.9473, "learning_rate": 1e-05, "epoch": 0.5536788333196012, "percentage": 55.38, "elapsed_time": "9:48:05", "remaining_time": "7:53:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2945, "total_steps": 5309, "loss": 3.0252, "learning_rate": 1e-05, "epoch": 0.5546204639885121, "percentage": 55.47, "elapsed_time": "9:48:59", "remaining_time": "7:52:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2950, "total_steps": 5309, "loss": 3.0013, "learning_rate": 1e-05, "epoch": 0.555562094657423, "percentage": 55.57, "elapsed_time": "9:49:52", "remaining_time": "7:51:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2955, "total_steps": 5309, "loss": 3.1842, "learning_rate": 1e-05, "epoch": 0.5565037253263339, "percentage": 55.66, "elapsed_time": "9:50:46", "remaining_time": "7:50:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2960, "total_steps": 5309, "loss": 2.9562, "learning_rate": 1e-05, "epoch": 0.5574453559952448, "percentage": 55.75, "elapsed_time": "9:51:38", "remaining_time": "7:49:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2965, "total_steps": 5309, "loss": 3.0687, "learning_rate": 1e-05, "epoch": 0.5583869866641556, "percentage": 55.85, "elapsed_time": "9:52:31", "remaining_time": "7:48:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2970, "total_steps": 5309, "loss": 3.0819, "learning_rate": 1e-05, "epoch": 0.5593286173330665, "percentage": 55.94, "elapsed_time": "9:53:26", "remaining_time": "7:47:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2975, "total_steps": 5309, "loss": 3.078, "learning_rate": 1e-05, "epoch": 0.5602702480019774, "percentage": 56.04, "elapsed_time": "9:54:18", "remaining_time": "7:46:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2980, "total_steps": 5309, "loss": 3.1172, "learning_rate": 1e-05, "epoch": 0.5612118786708883, "percentage": 56.13, "elapsed_time": "9:55:11", "remaining_time": "7:45:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2985, "total_steps": 5309, "loss": 3.0753, "learning_rate": 1e-05, "epoch": 0.5621535093397992, "percentage": 56.23, "elapsed_time": "9:56:04", "remaining_time": "7:44:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2990, "total_steps": 5309, "loss": 2.9837, "learning_rate": 1e-05, "epoch": 0.5630951400087101, "percentage": 56.32, "elapsed_time": "9:56:56", "remaining_time": "7:42:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2995, "total_steps": 5309, "loss": 3.1187, "learning_rate": 1e-05, "epoch": 0.5640367706776209, "percentage": 56.41, "elapsed_time": "9:57:50", "remaining_time": "7:41:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3000, "total_steps": 5309, "loss": 2.9771, "learning_rate": 1e-05, "epoch": 0.5649784013465319, "percentage": 56.51, "elapsed_time": "9:58:44", "remaining_time": "7:40:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3000, "total_steps": 5309, "eval_loss": 3.0637450218200684, "epoch": 0.5649784013465319, "percentage": 56.51, "elapsed_time": "10:16:14", "remaining_time": "7:54:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3005, "total_steps": 5309, "loss": 3.0877, "learning_rate": 1e-05, "epoch": 0.5659200320154427, "percentage": 56.6, "elapsed_time": "10:18:30", "remaining_time": "7:54:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3010, "total_steps": 5309, "loss": 3.0216, "learning_rate": 1e-05, "epoch": 0.5668616626843537, "percentage": 56.7, "elapsed_time": "10:19:20", "remaining_time": "7:53:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3015, "total_steps": 5309, "loss": 3.1276, "learning_rate": 1e-05, "epoch": 0.5678032933532645, "percentage": 56.79, "elapsed_time": "10:20:14", "remaining_time": "7:51:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3020, "total_steps": 5309, "loss": 2.9892, "learning_rate": 1e-05, "epoch": 0.5687449240221754, "percentage": 56.88, "elapsed_time": "10:21:07", "remaining_time": "7:50:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3025, "total_steps": 5309, "loss": 3.0323, "learning_rate": 1e-05, "epoch": 0.5696865546910863, "percentage": 56.98, "elapsed_time": "10:22:04", "remaining_time": "7:49:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3030, "total_steps": 5309, "loss": 3.0609, "learning_rate": 1e-05, "epoch": 0.5706281853599972, "percentage": 57.07, "elapsed_time": "10:22:57", "remaining_time": "7:48:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3035, "total_steps": 5309, "loss": 3.1092, "learning_rate": 1e-05, "epoch": 0.5715698160289081, "percentage": 57.17, "elapsed_time": "10:23:50", "remaining_time": "7:47:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3040, "total_steps": 5309, "loss": 3.1217, "learning_rate": 1e-05, "epoch": 0.572511446697819, "percentage": 57.26, "elapsed_time": "10:24:45", "remaining_time": "7:46:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3045, "total_steps": 5309, "loss": 3.0726, "learning_rate": 1e-05, "epoch": 0.5734530773667298, "percentage": 57.36, "elapsed_time": "10:25:39", "remaining_time": "7:45:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3050, "total_steps": 5309, "loss": 3.065, "learning_rate": 1e-05, "epoch": 0.5743947080356407, "percentage": 57.45, "elapsed_time": "10:26:33", "remaining_time": "7:44:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3055, "total_steps": 5309, "loss": 3.1518, "learning_rate": 1e-05, "epoch": 0.5753363387045516, "percentage": 57.54, "elapsed_time": "10:27:25", "remaining_time": "7:42:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3060, "total_steps": 5309, "loss": 3.0006, "learning_rate": 1e-05, "epoch": 0.5762779693734625, "percentage": 57.64, "elapsed_time": "10:28:18", "remaining_time": "7:41:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3065, "total_steps": 5309, "loss": 3.0849, "learning_rate": 1e-05, "epoch": 0.5772196000423734, "percentage": 57.73, "elapsed_time": "10:29:12", "remaining_time": "7:40:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3070, "total_steps": 5309, "loss": 2.9541, "learning_rate": 1e-05, "epoch": 0.5781612307112842, "percentage": 57.83, "elapsed_time": "10:30:06", "remaining_time": "7:39:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3075, "total_steps": 5309, "loss": 3.0632, "learning_rate": 1e-05, "epoch": 0.5791028613801952, "percentage": 57.92, "elapsed_time": "10:31:02", "remaining_time": "7:38:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3080, "total_steps": 5309, "loss": 3.1407, "learning_rate": 1e-05, "epoch": 0.580044492049106, "percentage": 58.01, "elapsed_time": "10:31:56", "remaining_time": "7:37:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3085, "total_steps": 5309, "loss": 3.1047, "learning_rate": 1e-05, "epoch": 0.580986122718017, "percentage": 58.11, "elapsed_time": "10:32:49", "remaining_time": "7:36:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3090, "total_steps": 5309, "loss": 3.0165, "learning_rate": 1e-05, "epoch": 0.5819277533869278, "percentage": 58.2, "elapsed_time": "10:33:42", "remaining_time": "7:35:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3095, "total_steps": 5309, "loss": 3.1079, "learning_rate": 1e-05, "epoch": 0.5828693840558387, "percentage": 58.3, "elapsed_time": "10:34:35", "remaining_time": "7:33:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3100, "total_steps": 5309, "loss": 3.1699, "learning_rate": 1e-05, "epoch": 0.5838110147247496, "percentage": 58.39, "elapsed_time": "10:35:27", "remaining_time": "7:32:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3105, "total_steps": 5309, "loss": 3.0419, "learning_rate": 1e-05, "epoch": 0.5847526453936605, "percentage": 58.49, "elapsed_time": "10:36:20", "remaining_time": "7:31:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3110, "total_steps": 5309, "loss": 2.9814, "learning_rate": 1e-05, "epoch": 0.5856942760625714, "percentage": 58.58, "elapsed_time": "10:37:14", "remaining_time": "7:30:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3115, "total_steps": 5309, "loss": 3.0864, "learning_rate": 1e-05, "epoch": 0.5866359067314822, "percentage": 58.67, "elapsed_time": "10:38:10", "remaining_time": "7:29:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3120, "total_steps": 5309, "loss": 3.1298, "learning_rate": 1e-05, "epoch": 0.5875775374003931, "percentage": 58.77, "elapsed_time": "10:39:05", "remaining_time": "7:28:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3125, "total_steps": 5309, "loss": 3.0013, "learning_rate": 1e-05, "epoch": 0.588519168069304, "percentage": 58.86, "elapsed_time": "10:39:58", "remaining_time": "7:27:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3130, "total_steps": 5309, "loss": 2.9838, "learning_rate": 1e-05, "epoch": 0.5894607987382149, "percentage": 58.96, "elapsed_time": "10:40:52", "remaining_time": "7:26:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3135, "total_steps": 5309, "loss": 3.1155, "learning_rate": 1e-05, "epoch": 0.5904024294071258, "percentage": 59.05, "elapsed_time": "10:41:48", "remaining_time": "7:25:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3140, "total_steps": 5309, "loss": 3.1303, "learning_rate": 1e-05, "epoch": 0.5913440600760367, "percentage": 59.14, "elapsed_time": "10:42:40", "remaining_time": "7:23:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3145, "total_steps": 5309, "loss": 2.9929, "learning_rate": 1e-05, "epoch": 0.5922856907449475, "percentage": 59.24, "elapsed_time": "10:43:36", "remaining_time": "7:22:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3150, "total_steps": 5309, "loss": 3.0979, "learning_rate": 1e-05, "epoch": 0.5932273214138585, "percentage": 59.33, "elapsed_time": "10:44:30", "remaining_time": "7:21:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3155, "total_steps": 5309, "loss": 3.0098, "learning_rate": 1e-05, "epoch": 0.5941689520827693, "percentage": 59.43, "elapsed_time": "10:45:23", "remaining_time": "7:20:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3160, "total_steps": 5309, "loss": 3.0168, "learning_rate": 1e-05, "epoch": 0.5951105827516803, "percentage": 59.52, "elapsed_time": "10:46:19", "remaining_time": "7:19:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3165, "total_steps": 5309, "loss": 2.9791, "learning_rate": 1e-05, "epoch": 0.5960522134205911, "percentage": 59.62, "elapsed_time": "10:47:13", "remaining_time": "7:18:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3170, "total_steps": 5309, "loss": 2.9036, "learning_rate": 1e-05, "epoch": 0.596993844089502, "percentage": 59.71, "elapsed_time": "10:48:07", "remaining_time": "7:17:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3175, "total_steps": 5309, "loss": 2.9316, "learning_rate": 1e-05, "epoch": 0.5979354747584129, "percentage": 59.8, "elapsed_time": "10:49:02", "remaining_time": "7:16:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3180, "total_steps": 5309, "loss": 3.0915, "learning_rate": 1e-05, "epoch": 0.5988771054273238, "percentage": 59.9, "elapsed_time": "10:49:58", "remaining_time": "7:15:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3185, "total_steps": 5309, "loss": 2.9547, "learning_rate": 1e-05, "epoch": 0.5998187360962347, "percentage": 59.99, "elapsed_time": "10:50:54", "remaining_time": "7:14:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3190, "total_steps": 5309, "loss": 2.9792, "learning_rate": 1e-05, "epoch": 0.6007603667651455, "percentage": 60.09, "elapsed_time": "10:51:48", "remaining_time": "7:12:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3195, "total_steps": 5309, "loss": 3.0121, "learning_rate": 1e-05, "epoch": 0.6017019974340564, "percentage": 60.18, "elapsed_time": "10:52:41", "remaining_time": "7:11:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3200, "total_steps": 5309, "loss": 3.1288, "learning_rate": 1e-05, "epoch": 0.6026436281029673, "percentage": 60.28, "elapsed_time": "10:53:35", "remaining_time": "7:10:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3205, "total_steps": 5309, "loss": 3.0423, "learning_rate": 1e-05, "epoch": 0.6035852587718782, "percentage": 60.37, "elapsed_time": "10:55:46", "remaining_time": "7:10:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3210, "total_steps": 5309, "loss": 3.056, "learning_rate": 1e-05, "epoch": 0.6045268894407891, "percentage": 60.46, "elapsed_time": "10:56:38", "remaining_time": "7:09:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3215, "total_steps": 5309, "loss": 3.0777, "learning_rate": 1e-05, "epoch": 0.6054685201097, "percentage": 60.56, "elapsed_time": "10:57:31", "remaining_time": "7:08:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3220, "total_steps": 5309, "loss": 3.0872, "learning_rate": 1e-05, "epoch": 0.6064101507786108, "percentage": 60.65, "elapsed_time": "10:58:25", "remaining_time": "7:07:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3225, "total_steps": 5309, "loss": 3.1206, "learning_rate": 1e-05, "epoch": 0.6073517814475218, "percentage": 60.75, "elapsed_time": "10:59:18", "remaining_time": "7:06:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3230, "total_steps": 5309, "loss": 3.052, "learning_rate": 1e-05, "epoch": 0.6082934121164326, "percentage": 60.84, "elapsed_time": "11:00:13", "remaining_time": "7:04:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3235, "total_steps": 5309, "loss": 3.1386, "learning_rate": 1e-05, "epoch": 0.6092350427853436, "percentage": 60.93, "elapsed_time": "11:01:07", "remaining_time": "7:03:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3240, "total_steps": 5309, "loss": 2.9426, "learning_rate": 1e-05, "epoch": 0.6101766734542544, "percentage": 61.03, "elapsed_time": "11:02:00", "remaining_time": "7:02:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3245, "total_steps": 5309, "loss": 2.9756, "learning_rate": 1e-05, "epoch": 0.6111183041231653, "percentage": 61.12, "elapsed_time": "11:02:52", "remaining_time": "7:01:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3250, "total_steps": 5309, "loss": 3.0383, "learning_rate": 1e-05, "epoch": 0.6120599347920762, "percentage": 61.22, "elapsed_time": "11:03:45", "remaining_time": "7:00:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3255, "total_steps": 5309, "loss": 2.8681, "learning_rate": 1e-05, "epoch": 0.613001565460987, "percentage": 61.31, "elapsed_time": "11:04:41", "remaining_time": "6:59:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3260, "total_steps": 5309, "loss": 3.0287, "learning_rate": 1e-05, "epoch": 0.613943196129898, "percentage": 61.41, "elapsed_time": "11:05:34", "remaining_time": "6:58:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3265, "total_steps": 5309, "loss": 3.0866, "learning_rate": 1e-05, "epoch": 0.6148848267988088, "percentage": 61.5, "elapsed_time": "11:06:28", "remaining_time": "6:57:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3270, "total_steps": 5309, "loss": 2.9918, "learning_rate": 1e-05, "epoch": 0.6158264574677197, "percentage": 61.59, "elapsed_time": "11:07:24", "remaining_time": "6:56:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3275, "total_steps": 5309, "loss": 2.9678, "learning_rate": 1e-05, "epoch": 0.6167680881366306, "percentage": 61.69, "elapsed_time": "11:08:18", "remaining_time": "6:55:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3280, "total_steps": 5309, "loss": 3.1028, "learning_rate": 1e-05, "epoch": 0.6177097188055415, "percentage": 61.78, "elapsed_time": "11:09:11", "remaining_time": "6:53:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3285, "total_steps": 5309, "loss": 3.0633, "learning_rate": 1e-05, "epoch": 0.6186513494744523, "percentage": 61.88, "elapsed_time": "11:10:05", "remaining_time": "6:52:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3290, "total_steps": 5309, "loss": 3.0126, "learning_rate": 1e-05, "epoch": 0.6195929801433633, "percentage": 61.97, "elapsed_time": "11:10:58", "remaining_time": "6:51:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3295, "total_steps": 5309, "loss": 3.0549, "learning_rate": 1e-05, "epoch": 0.6205346108122741, "percentage": 62.06, "elapsed_time": "11:11:52", "remaining_time": "6:50:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3300, "total_steps": 5309, "loss": 3.0469, "learning_rate": 1e-05, "epoch": 0.6214762414811851, "percentage": 62.16, "elapsed_time": "11:12:46", "remaining_time": "6:49:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3305, "total_steps": 5309, "loss": 3.0797, "learning_rate": 1e-05, "epoch": 0.6224178721500959, "percentage": 62.25, "elapsed_time": "11:13:39", "remaining_time": "6:48:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3310, "total_steps": 5309, "loss": 3.0835, "learning_rate": 1e-05, "epoch": 0.6233595028190068, "percentage": 62.35, "elapsed_time": "11:14:31", "remaining_time": "6:47:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3315, "total_steps": 5309, "loss": 3.0321, "learning_rate": 1e-05, "epoch": 0.6243011334879177, "percentage": 62.44, "elapsed_time": "11:15:24", "remaining_time": "6:46:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3320, "total_steps": 5309, "loss": 2.9796, "learning_rate": 1e-05, "epoch": 0.6252427641568286, "percentage": 62.54, "elapsed_time": "11:16:18", "remaining_time": "6:45:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3325, "total_steps": 5309, "loss": 3.0791, "learning_rate": 1e-05, "epoch": 0.6261843948257395, "percentage": 62.63, "elapsed_time": "11:17:12", "remaining_time": "6:44:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3330, "total_steps": 5309, "loss": 3.0435, "learning_rate": 1e-05, "epoch": 0.6271260254946504, "percentage": 62.72, "elapsed_time": "11:18:05", "remaining_time": "6:42:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3335, "total_steps": 5309, "loss": 3.0616, "learning_rate": 1e-05, "epoch": 0.6280676561635612, "percentage": 62.82, "elapsed_time": "11:18:57", "remaining_time": "6:41:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3340, "total_steps": 5309, "loss": 3.0322, "learning_rate": 1e-05, "epoch": 0.6290092868324721, "percentage": 62.91, "elapsed_time": "11:19:51", "remaining_time": "6:40:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3345, "total_steps": 5309, "loss": 3.0367, "learning_rate": 1e-05, "epoch": 0.629950917501383, "percentage": 63.01, "elapsed_time": "11:20:47", "remaining_time": "6:39:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3350, "total_steps": 5309, "loss": 3.052, "learning_rate": 1e-05, "epoch": 0.6308925481702939, "percentage": 63.1, "elapsed_time": "11:21:44", "remaining_time": "6:38:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3355, "total_steps": 5309, "loss": 3.0902, "learning_rate": 1e-05, "epoch": 0.6318341788392048, "percentage": 63.19, "elapsed_time": "11:22:37", "remaining_time": "6:37:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3360, "total_steps": 5309, "loss": 3.015, "learning_rate": 1e-05, "epoch": 0.6327758095081156, "percentage": 63.29, "elapsed_time": "11:23:29", "remaining_time": "6:36:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3365, "total_steps": 5309, "loss": 3.0254, "learning_rate": 1e-05, "epoch": 0.6337174401770266, "percentage": 63.38, "elapsed_time": "11:24:24", "remaining_time": "6:35:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3370, "total_steps": 5309, "loss": 3.0161, "learning_rate": 1e-05, "epoch": 0.6346590708459374, "percentage": 63.48, "elapsed_time": "11:25:18", "remaining_time": "6:34:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3375, "total_steps": 5309, "loss": 3.0329, "learning_rate": 1e-05, "epoch": 0.6356007015148484, "percentage": 63.57, "elapsed_time": "11:26:12", "remaining_time": "6:33:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3380, "total_steps": 5309, "loss": 2.9956, "learning_rate": 1e-05, "epoch": 0.6365423321837592, "percentage": 63.67, "elapsed_time": "11:27:07", "remaining_time": "6:32:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3385, "total_steps": 5309, "loss": 2.9224, "learning_rate": 1e-05, "epoch": 0.6374839628526701, "percentage": 63.76, "elapsed_time": "11:28:04", "remaining_time": "6:31:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3390, "total_steps": 5309, "loss": 3.14, "learning_rate": 1e-05, "epoch": 0.638425593521581, "percentage": 63.85, "elapsed_time": "11:28:59", "remaining_time": "6:30:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3395, "total_steps": 5309, "loss": 2.9937, "learning_rate": 1e-05, "epoch": 0.6393672241904919, "percentage": 63.95, "elapsed_time": "11:29:52", "remaining_time": "6:28:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3400, "total_steps": 5309, "loss": 3.0108, "learning_rate": 1e-05, "epoch": 0.6403088548594028, "percentage": 64.04, "elapsed_time": "11:30:46", "remaining_time": "6:27:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3405, "total_steps": 5309, "loss": 3.0887, "learning_rate": 1e-05, "epoch": 0.6412504855283137, "percentage": 64.14, "elapsed_time": "11:33:03", "remaining_time": "6:27:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3410, "total_steps": 5309, "loss": 2.9877, "learning_rate": 1e-05, "epoch": 0.6421921161972245, "percentage": 64.23, "elapsed_time": "11:33:56", "remaining_time": "6:26:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3415, "total_steps": 5309, "loss": 3.0624, "learning_rate": 1e-05, "epoch": 0.6431337468661354, "percentage": 64.32, "elapsed_time": "11:34:52", "remaining_time": "6:25:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3420, "total_steps": 5309, "loss": 2.9223, "learning_rate": 1e-05, "epoch": 0.6440753775350463, "percentage": 64.42, "elapsed_time": "11:35:45", "remaining_time": "6:24:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3425, "total_steps": 5309, "loss": 3.1286, "learning_rate": 1e-05, "epoch": 0.6450170082039572, "percentage": 64.51, "elapsed_time": "11:36:40", "remaining_time": "6:23:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3430, "total_steps": 5309, "loss": 3.0108, "learning_rate": 1e-05, "epoch": 0.6459586388728681, "percentage": 64.61, "elapsed_time": "11:37:35", "remaining_time": "6:22:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3435, "total_steps": 5309, "loss": 3.0991, "learning_rate": 1e-05, "epoch": 0.6469002695417789, "percentage": 64.7, "elapsed_time": "11:38:28", "remaining_time": "6:21:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3440, "total_steps": 5309, "loss": 3.1454, "learning_rate": 1e-05, "epoch": 0.6478419002106899, "percentage": 64.8, "elapsed_time": "11:39:21", "remaining_time": "6:19:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3445, "total_steps": 5309, "loss": 2.9953, "learning_rate": 1e-05, "epoch": 0.6487835308796007, "percentage": 64.89, "elapsed_time": "11:40:14", "remaining_time": "6:18:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3450, "total_steps": 5309, "loss": 2.9901, "learning_rate": 1e-05, "epoch": 0.6497251615485117, "percentage": 64.98, "elapsed_time": "11:41:07", "remaining_time": "6:17:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3455, "total_steps": 5309, "loss": 3.1011, "learning_rate": 1e-05, "epoch": 0.6506667922174225, "percentage": 65.08, "elapsed_time": "11:42:00", "remaining_time": "6:16:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3460, "total_steps": 5309, "loss": 2.9883, "learning_rate": 1e-05, "epoch": 0.6516084228863334, "percentage": 65.17, "elapsed_time": "11:42:53", "remaining_time": "6:15:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3465, "total_steps": 5309, "loss": 2.9701, "learning_rate": 1e-05, "epoch": 0.6525500535552443, "percentage": 65.27, "elapsed_time": "11:43:45", "remaining_time": "6:14:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3470, "total_steps": 5309, "loss": 3.0205, "learning_rate": 1e-05, "epoch": 0.6534916842241552, "percentage": 65.36, "elapsed_time": "11:44:40", "remaining_time": "6:13:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3475, "total_steps": 5309, "loss": 2.9935, "learning_rate": 1e-05, "epoch": 0.6544333148930661, "percentage": 65.45, "elapsed_time": "11:45:34", "remaining_time": "6:12:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3480, "total_steps": 5309, "loss": 2.8969, "learning_rate": 1e-05, "epoch": 0.655374945561977, "percentage": 65.55, "elapsed_time": "11:46:28", "remaining_time": "6:11:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3485, "total_steps": 5309, "loss": 3.0523, "learning_rate": 1e-05, "epoch": 0.6563165762308878, "percentage": 65.64, "elapsed_time": "11:47:21", "remaining_time": "6:10:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3490, "total_steps": 5309, "loss": 3.0571, "learning_rate": 1e-05, "epoch": 0.6572582068997987, "percentage": 65.74, "elapsed_time": "11:48:14", "remaining_time": "6:09:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3495, "total_steps": 5309, "loss": 3.0252, "learning_rate": 1e-05, "epoch": 0.6581998375687096, "percentage": 65.83, "elapsed_time": "11:49:05", "remaining_time": "6:08:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3500, "total_steps": 5309, "loss": 3.0203, "learning_rate": 1e-05, "epoch": 0.6591414682376205, "percentage": 65.93, "elapsed_time": "11:49:59", "remaining_time": "6:06:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3505, "total_steps": 5309, "loss": 3.1012, "learning_rate": 1e-05, "epoch": 0.6600830989065314, "percentage": 66.02, "elapsed_time": "11:50:54", "remaining_time": "6:05:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3510, "total_steps": 5309, "loss": 3.031, "learning_rate": 1e-05, "epoch": 0.6610247295754422, "percentage": 66.11, "elapsed_time": "11:51:49", "remaining_time": "6:04:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3515, "total_steps": 5309, "loss": 3.0551, "learning_rate": 1e-05, "epoch": 0.6619663602443532, "percentage": 66.21, "elapsed_time": "11:52:42", "remaining_time": "6:03:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3520, "total_steps": 5309, "loss": 3.0459, "learning_rate": 1e-05, "epoch": 0.662907990913264, "percentage": 66.3, "elapsed_time": "11:53:34", "remaining_time": "6:02:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3525, "total_steps": 5309, "loss": 2.9017, "learning_rate": 1e-05, "epoch": 0.663849621582175, "percentage": 66.4, "elapsed_time": "11:54:28", "remaining_time": "6:01:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3530, "total_steps": 5309, "loss": 3.0382, "learning_rate": 1e-05, "epoch": 0.6647912522510858, "percentage": 66.49, "elapsed_time": "11:55:21", "remaining_time": "6:00:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3535, "total_steps": 5309, "loss": 3.1805, "learning_rate": 1e-05, "epoch": 0.6657328829199967, "percentage": 66.59, "elapsed_time": "11:56:15", "remaining_time": "5:59:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3540, "total_steps": 5309, "loss": 3.0568, "learning_rate": 1e-05, "epoch": 0.6666745135889076, "percentage": 66.68, "elapsed_time": "11:57:09", "remaining_time": "5:58:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3545, "total_steps": 5309, "loss": 3.0804, "learning_rate": 1e-05, "epoch": 0.6676161442578185, "percentage": 66.77, "elapsed_time": "11:58:02", "remaining_time": "5:57:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3550, "total_steps": 5309, "loss": 3.003, "learning_rate": 1e-05, "epoch": 0.6685577749267294, "percentage": 66.87, "elapsed_time": "11:58:58", "remaining_time": "5:56:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3555, "total_steps": 5309, "loss": 2.9733, "learning_rate": 1e-05, "epoch": 0.6694994055956403, "percentage": 66.96, "elapsed_time": "11:59:54", "remaining_time": "5:55:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3560, "total_steps": 5309, "loss": 3.0515, "learning_rate": 1e-05, "epoch": 0.6704410362645511, "percentage": 67.06, "elapsed_time": "12:00:49", "remaining_time": "5:54:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3565, "total_steps": 5309, "loss": 2.8611, "learning_rate": 1e-05, "epoch": 0.671382666933462, "percentage": 67.15, "elapsed_time": "12:01:42", "remaining_time": "5:53:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3570, "total_steps": 5309, "loss": 3.0633, "learning_rate": 1e-05, "epoch": 0.6723242976023729, "percentage": 67.24, "elapsed_time": "12:02:37", "remaining_time": "5:52:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3575, "total_steps": 5309, "loss": 3.0196, "learning_rate": 1e-05, "epoch": 0.6732659282712838, "percentage": 67.34, "elapsed_time": "12:03:31", "remaining_time": "5:50:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3580, "total_steps": 5309, "loss": 3.052, "learning_rate": 1e-05, "epoch": 0.6742075589401947, "percentage": 67.43, "elapsed_time": "12:04:23", "remaining_time": "5:49:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3585, "total_steps": 5309, "loss": 2.9969, "learning_rate": 1e-05, "epoch": 0.6751491896091055, "percentage": 67.53, "elapsed_time": "12:05:17", "remaining_time": "5:48:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3590, "total_steps": 5309, "loss": 3.0297, "learning_rate": 1e-05, "epoch": 0.6760908202780165, "percentage": 67.62, "elapsed_time": "12:06:11", "remaining_time": "5:47:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3595, "total_steps": 5309, "loss": 2.9475, "learning_rate": 1e-05, "epoch": 0.6770324509469273, "percentage": 67.72, "elapsed_time": "12:07:06", "remaining_time": "5:46:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3600, "total_steps": 5309, "loss": 2.9165, "learning_rate": 1e-05, "epoch": 0.6779740816158383, "percentage": 67.81, "elapsed_time": "12:07:59", "remaining_time": "5:45:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3605, "total_steps": 5309, "loss": 3.0665, "learning_rate": 1e-05, "epoch": 0.6789157122847491, "percentage": 67.9, "elapsed_time": "12:10:12", "remaining_time": "5:45:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3610, "total_steps": 5309, "loss": 3.0468, "learning_rate": 1e-05, "epoch": 0.67985734295366, "percentage": 68.0, "elapsed_time": "12:11:05", "remaining_time": "5:44:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3615, "total_steps": 5309, "loss": 2.9307, "learning_rate": 1e-05, "epoch": 0.6807989736225709, "percentage": 68.09, "elapsed_time": "12:11:57", "remaining_time": "5:42:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3620, "total_steps": 5309, "loss": 3.0759, "learning_rate": 1e-05, "epoch": 0.6817406042914818, "percentage": 68.19, "elapsed_time": "12:12:51", "remaining_time": "5:41:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3625, "total_steps": 5309, "loss": 3.0509, "learning_rate": 1e-05, "epoch": 0.6826822349603927, "percentage": 68.28, "elapsed_time": "12:13:44", "remaining_time": "5:40:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3630, "total_steps": 5309, "loss": 2.9175, "learning_rate": 1e-05, "epoch": 0.6836238656293036, "percentage": 68.37, "elapsed_time": "12:14:39", "remaining_time": "5:39:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3635, "total_steps": 5309, "loss": 3.1881, "learning_rate": 1e-05, "epoch": 0.6845654962982144, "percentage": 68.47, "elapsed_time": "12:15:32", "remaining_time": "5:38:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3640, "total_steps": 5309, "loss": 3.0881, "learning_rate": 1e-05, "epoch": 0.6855071269671253, "percentage": 68.56, "elapsed_time": "12:16:26", "remaining_time": "5:37:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3645, "total_steps": 5309, "loss": 3.0303, "learning_rate": 1e-05, "epoch": 0.6864487576360362, "percentage": 68.66, "elapsed_time": "12:17:20", "remaining_time": "5:36:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3650, "total_steps": 5309, "loss": 3.1092, "learning_rate": 1e-05, "epoch": 0.6873903883049471, "percentage": 68.75, "elapsed_time": "12:18:14", "remaining_time": "5:35:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3655, "total_steps": 5309, "loss": 3.0515, "learning_rate": 1e-05, "epoch": 0.688332018973858, "percentage": 68.85, "elapsed_time": "12:19:07", "remaining_time": "5:34:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3660, "total_steps": 5309, "loss": 3.0485, "learning_rate": 1e-05, "epoch": 0.6892736496427688, "percentage": 68.94, "elapsed_time": "12:19:59", "remaining_time": "5:33:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3665, "total_steps": 5309, "loss": 3.0337, "learning_rate": 1e-05, "epoch": 0.6902152803116798, "percentage": 69.03, "elapsed_time": "12:20:53", "remaining_time": "5:32:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3670, "total_steps": 5309, "loss": 2.9561, "learning_rate": 1e-05, "epoch": 0.6911569109805906, "percentage": 69.13, "elapsed_time": "12:21:45", "remaining_time": "5:31:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3675, "total_steps": 5309, "loss": 3.1157, "learning_rate": 1e-05, "epoch": 0.6920985416495016, "percentage": 69.22, "elapsed_time": "12:22:39", "remaining_time": "5:30:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3680, "total_steps": 5309, "loss": 3.0824, "learning_rate": 1e-05, "epoch": 0.6930401723184124, "percentage": 69.32, "elapsed_time": "12:23:32", "remaining_time": "5:29:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3685, "total_steps": 5309, "loss": 3.0039, "learning_rate": 1e-05, "epoch": 0.6939818029873233, "percentage": 69.41, "elapsed_time": "12:24:26", "remaining_time": "5:28:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3690, "total_steps": 5309, "loss": 3.0786, "learning_rate": 1e-05, "epoch": 0.6949234336562342, "percentage": 69.5, "elapsed_time": "12:25:20", "remaining_time": "5:27:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3695, "total_steps": 5309, "loss": 2.9884, "learning_rate": 1e-05, "epoch": 0.695865064325145, "percentage": 69.6, "elapsed_time": "12:26:14", "remaining_time": "5:25:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3700, "total_steps": 5309, "loss": 2.9574, "learning_rate": 1e-05, "epoch": 0.696806694994056, "percentage": 69.69, "elapsed_time": "12:27:07", "remaining_time": "5:24:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3705, "total_steps": 5309, "loss": 3.0264, "learning_rate": 1e-05, "epoch": 0.6977483256629669, "percentage": 69.79, "elapsed_time": "12:28:00", "remaining_time": "5:23:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3710, "total_steps": 5309, "loss": 3.059, "learning_rate": 1e-05, "epoch": 0.6986899563318777, "percentage": 69.88, "elapsed_time": "12:28:53", "remaining_time": "5:22:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3715, "total_steps": 5309, "loss": 3.0736, "learning_rate": 1e-05, "epoch": 0.6996315870007886, "percentage": 69.98, "elapsed_time": "12:29:46", "remaining_time": "5:21:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3720, "total_steps": 5309, "loss": 2.9954, "learning_rate": 1e-05, "epoch": 0.7005732176696995, "percentage": 70.07, "elapsed_time": "12:30:39", "remaining_time": "5:20:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3725, "total_steps": 5309, "loss": 2.9234, "learning_rate": 1e-05, "epoch": 0.7015148483386104, "percentage": 70.16, "elapsed_time": "12:31:32", "remaining_time": "5:19:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3730, "total_steps": 5309, "loss": 2.9974, "learning_rate": 1e-05, "epoch": 0.7024564790075213, "percentage": 70.26, "elapsed_time": "12:32:26", "remaining_time": "5:18:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3735, "total_steps": 5309, "loss": 3.0908, "learning_rate": 1e-05, "epoch": 0.7033981096764321, "percentage": 70.35, "elapsed_time": "12:33:20", "remaining_time": "5:17:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3740, "total_steps": 5309, "loss": 3.0355, "learning_rate": 1e-05, "epoch": 0.7043397403453431, "percentage": 70.45, "elapsed_time": "12:34:13", "remaining_time": "5:16:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3745, "total_steps": 5309, "loss": 2.938, "learning_rate": 1e-05, "epoch": 0.7052813710142539, "percentage": 70.54, "elapsed_time": "12:35:07", "remaining_time": "5:15:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3750, "total_steps": 5309, "loss": 3.1014, "learning_rate": 1e-05, "epoch": 0.7062230016831649, "percentage": 70.63, "elapsed_time": "12:36:02", "remaining_time": "5:14:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3755, "total_steps": 5309, "loss": 3.064, "learning_rate": 1e-05, "epoch": 0.7071646323520757, "percentage": 70.73, "elapsed_time": "12:36:56", "remaining_time": "5:13:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3760, "total_steps": 5309, "loss": 3.0352, "learning_rate": 1e-05, "epoch": 0.7081062630209866, "percentage": 70.82, "elapsed_time": "12:37:54", "remaining_time": "5:12:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3765, "total_steps": 5309, "loss": 3.0674, "learning_rate": 1e-05, "epoch": 0.7090478936898975, "percentage": 70.92, "elapsed_time": "12:38:48", "remaining_time": "5:11:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3770, "total_steps": 5309, "loss": 3.0081, "learning_rate": 1e-05, "epoch": 0.7099895243588084, "percentage": 71.01, "elapsed_time": "12:39:40", "remaining_time": "5:10:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3775, "total_steps": 5309, "loss": 3.0408, "learning_rate": 1e-05, "epoch": 0.7109311550277193, "percentage": 71.11, "elapsed_time": "12:40:35", "remaining_time": "5:09:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3780, "total_steps": 5309, "loss": 3.0377, "learning_rate": 1e-05, "epoch": 0.7118727856966302, "percentage": 71.2, "elapsed_time": "12:41:30", "remaining_time": "5:08:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3785, "total_steps": 5309, "loss": 3.001, "learning_rate": 1e-05, "epoch": 0.712814416365541, "percentage": 71.29, "elapsed_time": "12:42:25", "remaining_time": "5:06:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3790, "total_steps": 5309, "loss": 2.9582, "learning_rate": 1e-05, "epoch": 0.713756047034452, "percentage": 71.39, "elapsed_time": "12:43:21", "remaining_time": "5:05:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3795, "total_steps": 5309, "loss": 3.0887, "learning_rate": 1e-05, "epoch": 0.7146976777033628, "percentage": 71.48, "elapsed_time": "12:44:14", "remaining_time": "5:04:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3800, "total_steps": 5309, "loss": 3.0967, "learning_rate": 1e-05, "epoch": 0.7156393083722736, "percentage": 71.58, "elapsed_time": "12:45:07", "remaining_time": "5:03:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3805, "total_steps": 5309, "loss": 3.0354, "learning_rate": 1e-05, "epoch": 0.7165809390411846, "percentage": 71.67, "elapsed_time": "12:47:16", "remaining_time": "5:03:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3810, "total_steps": 5309, "loss": 3.0144, "learning_rate": 1e-05, "epoch": 0.7175225697100954, "percentage": 71.76, "elapsed_time": "12:48:09", "remaining_time": "5:02:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3815, "total_steps": 5309, "loss": 2.9888, "learning_rate": 1e-05, "epoch": 0.7184642003790064, "percentage": 71.86, "elapsed_time": "12:49:01", "remaining_time": "5:01:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3820, "total_steps": 5309, "loss": 3.1182, "learning_rate": 1e-05, "epoch": 0.7194058310479172, "percentage": 71.95, "elapsed_time": "12:49:54", "remaining_time": "5:00:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3825, "total_steps": 5309, "loss": 3.0422, "learning_rate": 1e-05, "epoch": 0.7203474617168281, "percentage": 72.05, "elapsed_time": "12:50:48", "remaining_time": "4:59:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3830, "total_steps": 5309, "loss": 3.0205, "learning_rate": 1e-05, "epoch": 0.721289092385739, "percentage": 72.14, "elapsed_time": "12:51:45", "remaining_time": "4:58:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3835, "total_steps": 5309, "loss": 3.0333, "learning_rate": 1e-05, "epoch": 0.7222307230546499, "percentage": 72.24, "elapsed_time": "12:52:37", "remaining_time": "4:56:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3840, "total_steps": 5309, "loss": 3.081, "learning_rate": 1e-05, "epoch": 0.7231723537235608, "percentage": 72.33, "elapsed_time": "12:53:29", "remaining_time": "4:55:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3845, "total_steps": 5309, "loss": 2.9635, "learning_rate": 1e-05, "epoch": 0.7241139843924717, "percentage": 72.42, "elapsed_time": "12:54:23", "remaining_time": "4:54:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3850, "total_steps": 5309, "loss": 3.0792, "learning_rate": 1e-05, "epoch": 0.7250556150613825, "percentage": 72.52, "elapsed_time": "12:55:16", "remaining_time": "4:53:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3855, "total_steps": 5309, "loss": 2.9793, "learning_rate": 1e-05, "epoch": 0.7259972457302935, "percentage": 72.61, "elapsed_time": "12:56:10", "remaining_time": "4:52:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3860, "total_steps": 5309, "loss": 3.0311, "learning_rate": 1e-05, "epoch": 0.7269388763992043, "percentage": 72.71, "elapsed_time": "12:57:03", "remaining_time": "4:51:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3865, "total_steps": 5309, "loss": 2.9846, "learning_rate": 1e-05, "epoch": 0.7278805070681152, "percentage": 72.8, "elapsed_time": "12:57:59", "remaining_time": "4:50:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3870, "total_steps": 5309, "loss": 3.0651, "learning_rate": 1e-05, "epoch": 0.7288221377370261, "percentage": 72.9, "elapsed_time": "12:58:51", "remaining_time": "4:49:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3875, "total_steps": 5309, "loss": 2.9806, "learning_rate": 1e-05, "epoch": 0.7297637684059369, "percentage": 72.99, "elapsed_time": "12:59:44", "remaining_time": "4:48:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3880, "total_steps": 5309, "loss": 3.0375, "learning_rate": 1e-05, "epoch": 0.7307053990748479, "percentage": 73.08, "elapsed_time": "13:00:36", "remaining_time": "4:47:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3885, "total_steps": 5309, "loss": 3.058, "learning_rate": 1e-05, "epoch": 0.7316470297437587, "percentage": 73.18, "elapsed_time": "13:01:31", "remaining_time": "4:46:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3890, "total_steps": 5309, "loss": 3.0514, "learning_rate": 1e-05, "epoch": 0.7325886604126697, "percentage": 73.27, "elapsed_time": "13:02:28", "remaining_time": "4:45:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3895, "total_steps": 5309, "loss": 2.9818, "learning_rate": 1e-05, "epoch": 0.7335302910815805, "percentage": 73.37, "elapsed_time": "13:03:22", "remaining_time": "4:44:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3900, "total_steps": 5309, "loss": 3.1053, "learning_rate": 1e-05, "epoch": 0.7344719217504914, "percentage": 73.46, "elapsed_time": "13:04:15", "remaining_time": "4:43:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3905, "total_steps": 5309, "loss": 2.9821, "learning_rate": 1e-05, "epoch": 0.7354135524194023, "percentage": 73.55, "elapsed_time": "13:05:09", "remaining_time": "4:42:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3910, "total_steps": 5309, "loss": 2.9765, "learning_rate": 1e-05, "epoch": 0.7363551830883132, "percentage": 73.65, "elapsed_time": "13:06:01", "remaining_time": "4:41:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3915, "total_steps": 5309, "loss": 3.1376, "learning_rate": 1e-05, "epoch": 0.7372968137572241, "percentage": 73.74, "elapsed_time": "13:06:54", "remaining_time": "4:40:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3920, "total_steps": 5309, "loss": 3.1063, "learning_rate": 1e-05, "epoch": 0.738238444426135, "percentage": 73.84, "elapsed_time": "13:07:48", "remaining_time": "4:39:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3925, "total_steps": 5309, "loss": 2.9815, "learning_rate": 1e-05, "epoch": 0.7391800750950458, "percentage": 73.93, "elapsed_time": "13:08:40", "remaining_time": "4:38:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3930, "total_steps": 5309, "loss": 2.9989, "learning_rate": 1e-05, "epoch": 0.7401217057639567, "percentage": 74.03, "elapsed_time": "13:09:35", "remaining_time": "4:37:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3935, "total_steps": 5309, "loss": 3.0436, "learning_rate": 1e-05, "epoch": 0.7410633364328676, "percentage": 74.12, "elapsed_time": "13:10:29", "remaining_time": "4:36:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3940, "total_steps": 5309, "loss": 2.9933, "learning_rate": 1e-05, "epoch": 0.7420049671017785, "percentage": 74.21, "elapsed_time": "13:11:23", "remaining_time": "4:34:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3945, "total_steps": 5309, "loss": 3.1475, "learning_rate": 1e-05, "epoch": 0.7429465977706894, "percentage": 74.31, "elapsed_time": "13:12:15", "remaining_time": "4:33:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3950, "total_steps": 5309, "loss": 2.9639, "learning_rate": 1e-05, "epoch": 0.7438882284396002, "percentage": 74.4, "elapsed_time": "13:13:09", "remaining_time": "4:32:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3955, "total_steps": 5309, "loss": 3.0413, "learning_rate": 1e-05, "epoch": 0.7448298591085112, "percentage": 74.5, "elapsed_time": "13:14:02", "remaining_time": "4:31:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3960, "total_steps": 5309, "loss": 2.9888, "learning_rate": 1e-05, "epoch": 0.745771489777422, "percentage": 74.59, "elapsed_time": "13:14:55", "remaining_time": "4:30:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3965, "total_steps": 5309, "loss": 3.0662, "learning_rate": 1e-05, "epoch": 0.746713120446333, "percentage": 74.68, "elapsed_time": "13:15:52", "remaining_time": "4:29:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3970, "total_steps": 5309, "loss": 3.0452, "learning_rate": 1e-05, "epoch": 0.7476547511152438, "percentage": 74.78, "elapsed_time": "13:16:47", "remaining_time": "4:28:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3975, "total_steps": 5309, "loss": 2.9464, "learning_rate": 1e-05, "epoch": 0.7485963817841547, "percentage": 74.87, "elapsed_time": "13:17:38", "remaining_time": "4:27:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3980, "total_steps": 5309, "loss": 3.0599, "learning_rate": 1e-05, "epoch": 0.7495380124530656, "percentage": 74.97, "elapsed_time": "13:18:32", "remaining_time": "4:26:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3985, "total_steps": 5309, "loss": 3.0561, "learning_rate": 1e-05, "epoch": 0.7504796431219765, "percentage": 75.06, "elapsed_time": "13:19:27", "remaining_time": "4:25:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3990, "total_steps": 5309, "loss": 3.0022, "learning_rate": 1e-05, "epoch": 0.7514212737908874, "percentage": 75.16, "elapsed_time": "13:20:20", "remaining_time": "4:24:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3995, "total_steps": 5309, "loss": 3.1197, "learning_rate": 1e-05, "epoch": 0.7523629044597983, "percentage": 75.25, "elapsed_time": "13:21:15", "remaining_time": "4:23:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4000, "total_steps": 5309, "loss": 2.946, "learning_rate": 1e-05, "epoch": 0.7533045351287091, "percentage": 75.34, "elapsed_time": "13:22:11", "remaining_time": "4:22:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4000, "total_steps": 5309, "eval_loss": 3.0350847244262695, "epoch": 0.7533045351287091, "percentage": 75.34, "elapsed_time": "13:39:51", "remaining_time": "4:28:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4005, "total_steps": 5309, "loss": 2.9728, "learning_rate": 1e-05, "epoch": 0.75424616579762, "percentage": 75.44, "elapsed_time": "13:42:02", "remaining_time": "4:27:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4010, "total_steps": 5309, "loss": 3.0188, "learning_rate": 1e-05, "epoch": 0.7551877964665309, "percentage": 75.53, "elapsed_time": "13:42:56", "remaining_time": "4:26:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4015, "total_steps": 5309, "loss": 2.9826, "learning_rate": 1e-05, "epoch": 0.7561294271354418, "percentage": 75.63, "elapsed_time": "13:43:50", "remaining_time": "4:25:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4020, "total_steps": 5309, "loss": 3.0136, "learning_rate": 1e-05, "epoch": 0.7570710578043527, "percentage": 75.72, "elapsed_time": "13:44:45", "remaining_time": "4:24:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4025, "total_steps": 5309, "loss": 2.9847, "learning_rate": 1e-05, "epoch": 0.7580126884732635, "percentage": 75.81, "elapsed_time": "13:45:38", "remaining_time": "4:23:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4030, "total_steps": 5309, "loss": 3.1012, "learning_rate": 1e-05, "epoch": 0.7589543191421745, "percentage": 75.91, "elapsed_time": "13:46:32", "remaining_time": "4:22:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4035, "total_steps": 5309, "loss": 3.0014, "learning_rate": 1e-05, "epoch": 0.7598959498110853, "percentage": 76.0, "elapsed_time": "13:47:24", "remaining_time": "4:21:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4040, "total_steps": 5309, "loss": 3.014, "learning_rate": 1e-05, "epoch": 0.7608375804799963, "percentage": 76.1, "elapsed_time": "13:48:20", "remaining_time": "4:20:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4045, "total_steps": 5309, "loss": 2.9964, "learning_rate": 1e-05, "epoch": 0.7617792111489071, "percentage": 76.19, "elapsed_time": "13:49:13", "remaining_time": "4:19:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4050, "total_steps": 5309, "loss": 3.0237, "learning_rate": 1e-05, "epoch": 0.762720841817818, "percentage": 76.29, "elapsed_time": "13:50:06", "remaining_time": "4:18:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4055, "total_steps": 5309, "loss": 2.9814, "learning_rate": 1e-05, "epoch": 0.7636624724867289, "percentage": 76.38, "elapsed_time": "13:50:59", "remaining_time": "4:16:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4060, "total_steps": 5309, "loss": 3.0512, "learning_rate": 1e-05, "epoch": 0.7646041031556398, "percentage": 76.47, "elapsed_time": "13:51:52", "remaining_time": "4:15:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4065, "total_steps": 5309, "loss": 3.0855, "learning_rate": 1e-05, "epoch": 0.7655457338245507, "percentage": 76.57, "elapsed_time": "13:52:44", "remaining_time": "4:14:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4070, "total_steps": 5309, "loss": 2.9926, "learning_rate": 1e-05, "epoch": 0.7664873644934616, "percentage": 76.66, "elapsed_time": "13:53:38", "remaining_time": "4:13:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4075, "total_steps": 5309, "loss": 2.9967, "learning_rate": 1e-05, "epoch": 0.7674289951623724, "percentage": 76.76, "elapsed_time": "13:54:32", "remaining_time": "4:12:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4080, "total_steps": 5309, "loss": 3.0271, "learning_rate": 1e-05, "epoch": 0.7683706258312833, "percentage": 76.85, "elapsed_time": "13:55:24", "remaining_time": "4:11:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4085, "total_steps": 5309, "loss": 2.979, "learning_rate": 1e-05, "epoch": 0.7693122565001942, "percentage": 76.94, "elapsed_time": "13:56:16", "remaining_time": "4:10:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4090, "total_steps": 5309, "loss": 3.0638, "learning_rate": 1e-05, "epoch": 0.7702538871691051, "percentage": 77.04, "elapsed_time": "13:57:09", "remaining_time": "4:09:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4095, "total_steps": 5309, "loss": 2.9982, "learning_rate": 1e-05, "epoch": 0.771195517838016, "percentage": 77.13, "elapsed_time": "13:58:00", "remaining_time": "4:08:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4100, "total_steps": 5309, "loss": 2.9228, "learning_rate": 1e-05, "epoch": 0.7721371485069268, "percentage": 77.23, "elapsed_time": "13:58:54", "remaining_time": "4:07:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4105, "total_steps": 5309, "loss": 3.0264, "learning_rate": 1e-05, "epoch": 0.7730787791758378, "percentage": 77.32, "elapsed_time": "13:59:49", "remaining_time": "4:06:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4110, "total_steps": 5309, "loss": 3.1302, "learning_rate": 1e-05, "epoch": 0.7740204098447486, "percentage": 77.42, "elapsed_time": "14:00:43", "remaining_time": "4:05:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4115, "total_steps": 5309, "loss": 2.9592, "learning_rate": 1e-05, "epoch": 0.7749620405136596, "percentage": 77.51, "elapsed_time": "14:01:37", "remaining_time": "4:04:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4120, "total_steps": 5309, "loss": 3.0449, "learning_rate": 1e-05, "epoch": 0.7759036711825704, "percentage": 77.6, "elapsed_time": "14:02:31", "remaining_time": "4:03:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4125, "total_steps": 5309, "loss": 3.0414, "learning_rate": 1e-05, "epoch": 0.7768453018514813, "percentage": 77.7, "elapsed_time": "14:03:26", "remaining_time": "4:02:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4130, "total_steps": 5309, "loss": 3.0961, "learning_rate": 1e-05, "epoch": 0.7777869325203922, "percentage": 77.79, "elapsed_time": "14:04:18", "remaining_time": "4:01:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4135, "total_steps": 5309, "loss": 2.9958, "learning_rate": 1e-05, "epoch": 0.7787285631893031, "percentage": 77.89, "elapsed_time": "14:05:13", "remaining_time": "3:59:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4140, "total_steps": 5309, "loss": 2.9861, "learning_rate": 1e-05, "epoch": 0.779670193858214, "percentage": 77.98, "elapsed_time": "14:06:07", "remaining_time": "3:58:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4145, "total_steps": 5309, "loss": 2.9421, "learning_rate": 1e-05, "epoch": 0.7806118245271249, "percentage": 78.07, "elapsed_time": "14:07:02", "remaining_time": "3:57:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4150, "total_steps": 5309, "loss": 2.9885, "learning_rate": 1e-05, "epoch": 0.7815534551960357, "percentage": 78.17, "elapsed_time": "14:07:56", "remaining_time": "3:56:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4155, "total_steps": 5309, "loss": 2.8914, "learning_rate": 1e-05, "epoch": 0.7824950858649466, "percentage": 78.26, "elapsed_time": "14:08:50", "remaining_time": "3:55:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4160, "total_steps": 5309, "loss": 2.9848, "learning_rate": 1e-05, "epoch": 0.7834367165338575, "percentage": 78.36, "elapsed_time": "14:09:43", "remaining_time": "3:54:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4165, "total_steps": 5309, "loss": 2.9447, "learning_rate": 1e-05, "epoch": 0.7843783472027684, "percentage": 78.45, "elapsed_time": "14:10:38", "remaining_time": "3:53:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4170, "total_steps": 5309, "loss": 2.9969, "learning_rate": 1e-05, "epoch": 0.7853199778716793, "percentage": 78.55, "elapsed_time": "14:11:31", "remaining_time": "3:52:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4175, "total_steps": 5309, "loss": 3.1038, "learning_rate": 1e-05, "epoch": 0.7862616085405901, "percentage": 78.64, "elapsed_time": "14:12:25", "remaining_time": "3:51:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4180, "total_steps": 5309, "loss": 3.1315, "learning_rate": 1e-05, "epoch": 0.7872032392095011, "percentage": 78.73, "elapsed_time": "14:13:19", "remaining_time": "3:50:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4185, "total_steps": 5309, "loss": 3.0766, "learning_rate": 1e-05, "epoch": 0.7881448698784119, "percentage": 78.83, "elapsed_time": "14:14:12", "remaining_time": "3:49:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4190, "total_steps": 5309, "loss": 3.0528, "learning_rate": 1e-05, "epoch": 0.7890865005473229, "percentage": 78.92, "elapsed_time": "14:15:05", "remaining_time": "3:48:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4195, "total_steps": 5309, "loss": 3.0533, "learning_rate": 1e-05, "epoch": 0.7900281312162337, "percentage": 79.02, "elapsed_time": "14:15:58", "remaining_time": "3:47:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4200, "total_steps": 5309, "loss": 3.0414, "learning_rate": 1e-05, "epoch": 0.7909697618851446, "percentage": 79.11, "elapsed_time": "14:16:51", "remaining_time": "3:46:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4205, "total_steps": 5309, "loss": 3.0211, "learning_rate": 1e-05, "epoch": 0.7919113925540555, "percentage": 79.21, "elapsed_time": "14:19:04", "remaining_time": "3:45:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4210, "total_steps": 5309, "loss": 3.0595, "learning_rate": 1e-05, "epoch": 0.7928530232229664, "percentage": 79.3, "elapsed_time": "14:19:56", "remaining_time": "3:44:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4215, "total_steps": 5309, "loss": 3.0505, "learning_rate": 1e-05, "epoch": 0.7937946538918773, "percentage": 79.39, "elapsed_time": "14:20:50", "remaining_time": "3:43:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4220, "total_steps": 5309, "loss": 2.9477, "learning_rate": 1e-05, "epoch": 0.7947362845607882, "percentage": 79.49, "elapsed_time": "14:21:46", "remaining_time": "3:42:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4225, "total_steps": 5309, "loss": 2.9963, "learning_rate": 1e-05, "epoch": 0.795677915229699, "percentage": 79.58, "elapsed_time": "14:22:40", "remaining_time": "3:41:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4230, "total_steps": 5309, "loss": 3.0773, "learning_rate": 1e-05, "epoch": 0.79661954589861, "percentage": 79.68, "elapsed_time": "14:23:36", "remaining_time": "3:40:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4235, "total_steps": 5309, "loss": 3.0217, "learning_rate": 1e-05, "epoch": 0.7975611765675208, "percentage": 79.77, "elapsed_time": "14:24:31", "remaining_time": "3:39:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4240, "total_steps": 5309, "loss": 2.9698, "learning_rate": 1e-05, "epoch": 0.7985028072364317, "percentage": 79.86, "elapsed_time": "14:25:26", "remaining_time": "3:38:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4245, "total_steps": 5309, "loss": 3.012, "learning_rate": 1e-05, "epoch": 0.7994444379053426, "percentage": 79.96, "elapsed_time": "14:26:20", "remaining_time": "3:37:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4250, "total_steps": 5309, "loss": 2.9623, "learning_rate": 1e-05, "epoch": 0.8003860685742534, "percentage": 80.05, "elapsed_time": "14:27:13", "remaining_time": "3:36:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4255, "total_steps": 5309, "loss": 3.004, "learning_rate": 1e-05, "epoch": 0.8013276992431644, "percentage": 80.15, "elapsed_time": "14:28:09", "remaining_time": "3:35:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4260, "total_steps": 5309, "loss": 3.0707, "learning_rate": 1e-05, "epoch": 0.8022693299120752, "percentage": 80.24, "elapsed_time": "14:29:02", "remaining_time": "3:33:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4265, "total_steps": 5309, "loss": 3.033, "learning_rate": 1e-05, "epoch": 0.8032109605809862, "percentage": 80.34, "elapsed_time": "14:29:54", "remaining_time": "3:32:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4270, "total_steps": 5309, "loss": 2.9285, "learning_rate": 1e-05, "epoch": 0.804152591249897, "percentage": 80.43, "elapsed_time": "14:30:48", "remaining_time": "3:31:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4275, "total_steps": 5309, "loss": 2.9806, "learning_rate": 1e-05, "epoch": 0.8050942219188079, "percentage": 80.52, "elapsed_time": "14:31:43", "remaining_time": "3:30:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4280, "total_steps": 5309, "loss": 3.0609, "learning_rate": 1e-05, "epoch": 0.8060358525877188, "percentage": 80.62, "elapsed_time": "14:32:34", "remaining_time": "3:29:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4285, "total_steps": 5309, "loss": 3.1415, "learning_rate": 1e-05, "epoch": 0.8069774832566297, "percentage": 80.71, "elapsed_time": "14:33:27", "remaining_time": "3:28:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4290, "total_steps": 5309, "loss": 3.0246, "learning_rate": 1e-05, "epoch": 0.8079191139255405, "percentage": 80.81, "elapsed_time": "14:34:21", "remaining_time": "3:27:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4295, "total_steps": 5309, "loss": 2.9366, "learning_rate": 1e-05, "epoch": 0.8088607445944515, "percentage": 80.9, "elapsed_time": "14:35:16", "remaining_time": "3:26:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4300, "total_steps": 5309, "loss": 3.0745, "learning_rate": 1e-05, "epoch": 0.8098023752633623, "percentage": 80.99, "elapsed_time": "14:36:09", "remaining_time": "3:25:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4305, "total_steps": 5309, "loss": 3.0592, "learning_rate": 1e-05, "epoch": 0.8107440059322732, "percentage": 81.09, "elapsed_time": "14:37:01", "remaining_time": "3:24:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4310, "total_steps": 5309, "loss": 2.9483, "learning_rate": 1e-05, "epoch": 0.8116856366011841, "percentage": 81.18, "elapsed_time": "14:37:54", "remaining_time": "3:23:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4315, "total_steps": 5309, "loss": 3.0345, "learning_rate": 1e-05, "epoch": 0.8126272672700949, "percentage": 81.28, "elapsed_time": "14:38:48", "remaining_time": "3:22:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4320, "total_steps": 5309, "loss": 2.9852, "learning_rate": 1e-05, "epoch": 0.8135688979390059, "percentage": 81.37, "elapsed_time": "14:39:42", "remaining_time": "3:21:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4325, "total_steps": 5309, "loss": 3.0945, "learning_rate": 1e-05, "epoch": 0.8145105286079167, "percentage": 81.47, "elapsed_time": "14:40:36", "remaining_time": "3:20:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4330, "total_steps": 5309, "loss": 2.9639, "learning_rate": 1e-05, "epoch": 0.8154521592768277, "percentage": 81.56, "elapsed_time": "14:41:32", "remaining_time": "3:19:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4335, "total_steps": 5309, "loss": 3.0707, "learning_rate": 1e-05, "epoch": 0.8163937899457385, "percentage": 81.65, "elapsed_time": "14:42:25", "remaining_time": "3:18:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4340, "total_steps": 5309, "loss": 3.0978, "learning_rate": 1e-05, "epoch": 0.8173354206146494, "percentage": 81.75, "elapsed_time": "14:43:20", "remaining_time": "3:17:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4345, "total_steps": 5309, "loss": 3.0075, "learning_rate": 1e-05, "epoch": 0.8182770512835603, "percentage": 81.84, "elapsed_time": "14:44:14", "remaining_time": "3:16:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4350, "total_steps": 5309, "loss": 3.1404, "learning_rate": 1e-05, "epoch": 0.8192186819524712, "percentage": 81.94, "elapsed_time": "14:45:11", "remaining_time": "3:15:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4355, "total_steps": 5309, "loss": 2.8578, "learning_rate": 1e-05, "epoch": 0.8201603126213821, "percentage": 82.03, "elapsed_time": "14:46:06", "remaining_time": "3:14:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4360, "total_steps": 5309, "loss": 2.9544, "learning_rate": 1e-05, "epoch": 0.821101943290293, "percentage": 82.12, "elapsed_time": "14:47:00", "remaining_time": "3:13:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4365, "total_steps": 5309, "loss": 3.0135, "learning_rate": 1e-05, "epoch": 0.8220435739592038, "percentage": 82.22, "elapsed_time": "14:47:53", "remaining_time": "3:12:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4370, "total_steps": 5309, "loss": 3.0015, "learning_rate": 1e-05, "epoch": 0.8229852046281148, "percentage": 82.31, "elapsed_time": "14:48:46", "remaining_time": "3:10:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4375, "total_steps": 5309, "loss": 3.0321, "learning_rate": 1e-05, "epoch": 0.8239268352970256, "percentage": 82.41, "elapsed_time": "14:49:40", "remaining_time": "3:09:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4380, "total_steps": 5309, "loss": 3.1258, "learning_rate": 1e-05, "epoch": 0.8248684659659365, "percentage": 82.5, "elapsed_time": "14:50:31", "remaining_time": "3:08:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4385, "total_steps": 5309, "loss": 3.1225, "learning_rate": 1e-05, "epoch": 0.8258100966348474, "percentage": 82.6, "elapsed_time": "14:51:25", "remaining_time": "3:07:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4390, "total_steps": 5309, "loss": 2.9543, "learning_rate": 1e-05, "epoch": 0.8267517273037582, "percentage": 82.69, "elapsed_time": "14:52:20", "remaining_time": "3:06:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4395, "total_steps": 5309, "loss": 2.9904, "learning_rate": 1e-05, "epoch": 0.8276933579726692, "percentage": 82.78, "elapsed_time": "14:53:13", "remaining_time": "3:05:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4400, "total_steps": 5309, "loss": 2.994, "learning_rate": 1e-05, "epoch": 0.82863498864158, "percentage": 82.88, "elapsed_time": "14:54:06", "remaining_time": "3:04:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4405, "total_steps": 5309, "loss": 3.024, "learning_rate": 1e-05, "epoch": 0.829576619310491, "percentage": 82.97, "elapsed_time": "14:56:21", "remaining_time": "3:03:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4410, "total_steps": 5309, "loss": 3.0905, "learning_rate": 1e-05, "epoch": 0.8305182499794018, "percentage": 83.07, "elapsed_time": "14:57:15", "remaining_time": "3:02:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4415, "total_steps": 5309, "loss": 3.0603, "learning_rate": 1e-05, "epoch": 0.8314598806483127, "percentage": 83.16, "elapsed_time": "14:58:08", "remaining_time": "3:01:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4420, "total_steps": 5309, "loss": 3.0027, "learning_rate": 1e-05, "epoch": 0.8324015113172236, "percentage": 83.25, "elapsed_time": "14:59:03", "remaining_time": "3:00:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4425, "total_steps": 5309, "loss": 2.9662, "learning_rate": 1e-05, "epoch": 0.8333431419861345, "percentage": 83.35, "elapsed_time": "14:59:58", "remaining_time": "2:59:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4430, "total_steps": 5309, "loss": 2.9869, "learning_rate": 1e-05, "epoch": 0.8342847726550454, "percentage": 83.44, "elapsed_time": "15:00:53", "remaining_time": "2:58:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4435, "total_steps": 5309, "loss": 3.0145, "learning_rate": 1e-05, "epoch": 0.8352264033239563, "percentage": 83.54, "elapsed_time": "15:01:47", "remaining_time": "2:57:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4440, "total_steps": 5309, "loss": 3.1651, "learning_rate": 1e-05, "epoch": 0.8361680339928671, "percentage": 83.63, "elapsed_time": "15:02:41", "remaining_time": "2:56:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4445, "total_steps": 5309, "loss": 3.0095, "learning_rate": 1e-05, "epoch": 0.837109664661778, "percentage": 83.73, "elapsed_time": "15:03:32", "remaining_time": "2:55:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4450, "total_steps": 5309, "loss": 3.0569, "learning_rate": 1e-05, "epoch": 0.8380512953306889, "percentage": 83.82, "elapsed_time": "15:04:27", "remaining_time": "2:54:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4455, "total_steps": 5309, "loss": 2.9869, "learning_rate": 1e-05, "epoch": 0.8389929259995998, "percentage": 83.91, "elapsed_time": "15:05:21", "remaining_time": "2:53:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4460, "total_steps": 5309, "loss": 3.0701, "learning_rate": 1e-05, "epoch": 0.8399345566685107, "percentage": 84.01, "elapsed_time": "15:06:16", "remaining_time": "2:52:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4465, "total_steps": 5309, "loss": 3.1, "learning_rate": 1e-05, "epoch": 0.8408761873374215, "percentage": 84.1, "elapsed_time": "15:07:08", "remaining_time": "2:51:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4470, "total_steps": 5309, "loss": 2.9665, "learning_rate": 1e-05, "epoch": 0.8418178180063325, "percentage": 84.2, "elapsed_time": "15:08:00", "remaining_time": "2:50:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4475, "total_steps": 5309, "loss": 3.0122, "learning_rate": 1e-05, "epoch": 0.8427594486752433, "percentage": 84.29, "elapsed_time": "15:08:53", "remaining_time": "2:49:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4480, "total_steps": 5309, "loss": 3.1027, "learning_rate": 1e-05, "epoch": 0.8437010793441543, "percentage": 84.39, "elapsed_time": "15:09:47", "remaining_time": "2:48:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4485, "total_steps": 5309, "loss": 2.9872, "learning_rate": 1e-05, "epoch": 0.8446427100130651, "percentage": 84.48, "elapsed_time": "15:10:40", "remaining_time": "2:47:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4490, "total_steps": 5309, "loss": 2.9336, "learning_rate": 1e-05, "epoch": 0.845584340681976, "percentage": 84.57, "elapsed_time": "15:11:34", "remaining_time": "2:46:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4495, "total_steps": 5309, "loss": 2.9181, "learning_rate": 1e-05, "epoch": 0.8465259713508869, "percentage": 84.67, "elapsed_time": "15:12:26", "remaining_time": "2:45:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4500, "total_steps": 5309, "loss": 3.0798, "learning_rate": 1e-05, "epoch": 0.8474676020197978, "percentage": 84.76, "elapsed_time": "15:13:21", "remaining_time": "2:44:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4505, "total_steps": 5309, "loss": 2.9763, "learning_rate": 1e-05, "epoch": 0.8484092326887087, "percentage": 84.86, "elapsed_time": "15:14:13", "remaining_time": "2:43:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4510, "total_steps": 5309, "loss": 3.021, "learning_rate": 1e-05, "epoch": 0.8493508633576196, "percentage": 84.95, "elapsed_time": "15:15:05", "remaining_time": "2:42:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4515, "total_steps": 5309, "loss": 2.9505, "learning_rate": 1e-05, "epoch": 0.8502924940265304, "percentage": 85.04, "elapsed_time": "15:16:00", "remaining_time": "2:41:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4520, "total_steps": 5309, "loss": 2.8787, "learning_rate": 1e-05, "epoch": 0.8512341246954414, "percentage": 85.14, "elapsed_time": "15:16:54", "remaining_time": "2:40:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4525, "total_steps": 5309, "loss": 3.1491, "learning_rate": 1e-05, "epoch": 0.8521757553643522, "percentage": 85.23, "elapsed_time": "15:17:47", "remaining_time": "2:39:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4530, "total_steps": 5309, "loss": 3.0369, "learning_rate": 1e-05, "epoch": 0.8531173860332631, "percentage": 85.33, "elapsed_time": "15:18:43", "remaining_time": "2:37:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4535, "total_steps": 5309, "loss": 3.0956, "learning_rate": 1e-05, "epoch": 0.854059016702174, "percentage": 85.42, "elapsed_time": "15:19:36", "remaining_time": "2:36:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4540, "total_steps": 5309, "loss": 3.0892, "learning_rate": 1e-05, "epoch": 0.8550006473710848, "percentage": 85.52, "elapsed_time": "15:20:28", "remaining_time": "2:35:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4545, "total_steps": 5309, "loss": 2.9785, "learning_rate": 1e-05, "epoch": 0.8559422780399958, "percentage": 85.61, "elapsed_time": "15:21:22", "remaining_time": "2:34:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4550, "total_steps": 5309, "loss": 3.0025, "learning_rate": 1e-05, "epoch": 0.8568839087089066, "percentage": 85.7, "elapsed_time": "15:22:17", "remaining_time": "2:33:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4555, "total_steps": 5309, "loss": 2.8551, "learning_rate": 1e-05, "epoch": 0.8578255393778176, "percentage": 85.8, "elapsed_time": "15:23:09", "remaining_time": "2:32:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4560, "total_steps": 5309, "loss": 2.9634, "learning_rate": 1e-05, "epoch": 0.8587671700467284, "percentage": 85.89, "elapsed_time": "15:24:04", "remaining_time": "2:31:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4565, "total_steps": 5309, "loss": 3.1556, "learning_rate": 1e-05, "epoch": 0.8597088007156393, "percentage": 85.99, "elapsed_time": "15:24:56", "remaining_time": "2:30:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4570, "total_steps": 5309, "loss": 3.0464, "learning_rate": 1e-05, "epoch": 0.8606504313845502, "percentage": 86.08, "elapsed_time": "15:25:50", "remaining_time": "2:29:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4575, "total_steps": 5309, "loss": 3.012, "learning_rate": 1e-05, "epoch": 0.8615920620534611, "percentage": 86.17, "elapsed_time": "15:26:44", "remaining_time": "2:28:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4580, "total_steps": 5309, "loss": 2.934, "learning_rate": 1e-05, "epoch": 0.862533692722372, "percentage": 86.27, "elapsed_time": "15:27:38", "remaining_time": "2:27:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4585, "total_steps": 5309, "loss": 2.9922, "learning_rate": 1e-05, "epoch": 0.8634753233912829, "percentage": 86.36, "elapsed_time": "15:28:33", "remaining_time": "2:26:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4590, "total_steps": 5309, "loss": 2.904, "learning_rate": 1e-05, "epoch": 0.8644169540601937, "percentage": 86.46, "elapsed_time": "15:29:25", "remaining_time": "2:25:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4595, "total_steps": 5309, "loss": 3.0824, "learning_rate": 1e-05, "epoch": 0.8653585847291047, "percentage": 86.55, "elapsed_time": "15:30:19", "remaining_time": "2:24:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4600, "total_steps": 5309, "loss": 3.0608, "learning_rate": 1e-05, "epoch": 0.8663002153980155, "percentage": 86.65, "elapsed_time": "15:31:14", "remaining_time": "2:23:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4605, "total_steps": 5309, "loss": 3.007, "learning_rate": 1e-05, "epoch": 0.8672418460669264, "percentage": 86.74, "elapsed_time": "15:33:28", "remaining_time": "2:22:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4610, "total_steps": 5309, "loss": 2.9562, "learning_rate": 1e-05, "epoch": 0.8681834767358373, "percentage": 86.83, "elapsed_time": "15:34:23", "remaining_time": "2:21:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4615, "total_steps": 5309, "loss": 2.9716, "learning_rate": 1e-05, "epoch": 0.8691251074047481, "percentage": 86.93, "elapsed_time": "15:35:17", "remaining_time": "2:20:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4620, "total_steps": 5309, "loss": 3.008, "learning_rate": 1e-05, "epoch": 0.8700667380736591, "percentage": 87.02, "elapsed_time": "15:36:13", "remaining_time": "2:19:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4625, "total_steps": 5309, "loss": 3.1845, "learning_rate": 1e-05, "epoch": 0.8710083687425699, "percentage": 87.12, "elapsed_time": "15:37:06", "remaining_time": "2:18:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4630, "total_steps": 5309, "loss": 3.0967, "learning_rate": 1e-05, "epoch": 0.8719499994114809, "percentage": 87.21, "elapsed_time": "15:37:59", "remaining_time": "2:17:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4635, "total_steps": 5309, "loss": 3.0172, "learning_rate": 1e-05, "epoch": 0.8728916300803917, "percentage": 87.3, "elapsed_time": "15:38:52", "remaining_time": "2:16:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4640, "total_steps": 5309, "loss": 3.0151, "learning_rate": 1e-05, "epoch": 0.8738332607493026, "percentage": 87.4, "elapsed_time": "15:39:46", "remaining_time": "2:15:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4645, "total_steps": 5309, "loss": 3.0446, "learning_rate": 1e-05, "epoch": 0.8747748914182135, "percentage": 87.49, "elapsed_time": "15:40:39", "remaining_time": "2:14:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4650, "total_steps": 5309, "loss": 3.0111, "learning_rate": 1e-05, "epoch": 0.8757165220871244, "percentage": 87.59, "elapsed_time": "15:41:34", "remaining_time": "2:13:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4655, "total_steps": 5309, "loss": 3.006, "learning_rate": 1e-05, "epoch": 0.8766581527560353, "percentage": 87.68, "elapsed_time": "15:42:28", "remaining_time": "2:12:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4660, "total_steps": 5309, "loss": 2.9864, "learning_rate": 1e-05, "epoch": 0.8775997834249462, "percentage": 87.78, "elapsed_time": "15:43:21", "remaining_time": "2:11:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4665, "total_steps": 5309, "loss": 2.9275, "learning_rate": 1e-05, "epoch": 0.878541414093857, "percentage": 87.87, "elapsed_time": "15:44:15", "remaining_time": "2:10:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4670, "total_steps": 5309, "loss": 3.0478, "learning_rate": 1e-05, "epoch": 0.879483044762768, "percentage": 87.96, "elapsed_time": "15:45:08", "remaining_time": "2:09:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4675, "total_steps": 5309, "loss": 2.9357, "learning_rate": 1e-05, "epoch": 0.8804246754316788, "percentage": 88.06, "elapsed_time": "15:46:02", "remaining_time": "2:08:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4680, "total_steps": 5309, "loss": 2.9292, "learning_rate": 1e-05, "epoch": 0.8813663061005897, "percentage": 88.15, "elapsed_time": "15:46:57", "remaining_time": "2:07:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4685, "total_steps": 5309, "loss": 2.9556, "learning_rate": 1e-05, "epoch": 0.8823079367695006, "percentage": 88.25, "elapsed_time": "15:47:50", "remaining_time": "2:06:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4690, "total_steps": 5309, "loss": 2.95, "learning_rate": 1e-05, "epoch": 0.8832495674384114, "percentage": 88.34, "elapsed_time": "15:48:44", "remaining_time": "2:05:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4695, "total_steps": 5309, "loss": 2.9276, "learning_rate": 1e-05, "epoch": 0.8841911981073224, "percentage": 88.43, "elapsed_time": "15:49:38", "remaining_time": "2:04:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4700, "total_steps": 5309, "loss": 2.957, "learning_rate": 1e-05, "epoch": 0.8851328287762332, "percentage": 88.53, "elapsed_time": "15:50:30", "remaining_time": "2:03:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4705, "total_steps": 5309, "loss": 3.0653, "learning_rate": 1e-05, "epoch": 0.8860744594451442, "percentage": 88.62, "elapsed_time": "15:51:24", "remaining_time": "2:02:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4710, "total_steps": 5309, "loss": 3.0135, "learning_rate": 1e-05, "epoch": 0.887016090114055, "percentage": 88.72, "elapsed_time": "15:52:19", "remaining_time": "2:01:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4715, "total_steps": 5309, "loss": 2.9784, "learning_rate": 1e-05, "epoch": 0.8879577207829659, "percentage": 88.81, "elapsed_time": "15:53:12", "remaining_time": "2:00:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4720, "total_steps": 5309, "loss": 2.9473, "learning_rate": 1e-05, "epoch": 0.8888993514518768, "percentage": 88.91, "elapsed_time": "15:54:06", "remaining_time": "1:59:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4725, "total_steps": 5309, "loss": 3.0772, "learning_rate": 1e-05, "epoch": 0.8898409821207877, "percentage": 89.0, "elapsed_time": "15:55:01", "remaining_time": "1:58:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4730, "total_steps": 5309, "loss": 3.0302, "learning_rate": 1e-05, "epoch": 0.8907826127896986, "percentage": 89.09, "elapsed_time": "15:55:55", "remaining_time": "1:57:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4735, "total_steps": 5309, "loss": 3.0771, "learning_rate": 1e-05, "epoch": 0.8917242434586095, "percentage": 89.19, "elapsed_time": "15:56:51", "remaining_time": "1:55:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4740, "total_steps": 5309, "loss": 3.0053, "learning_rate": 1e-05, "epoch": 0.8926658741275203, "percentage": 89.28, "elapsed_time": "15:57:45", "remaining_time": "1:54:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4745, "total_steps": 5309, "loss": 3.0288, "learning_rate": 1e-05, "epoch": 0.8936075047964313, "percentage": 89.38, "elapsed_time": "15:58:38", "remaining_time": "1:53:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4750, "total_steps": 5309, "loss": 3.0103, "learning_rate": 1e-05, "epoch": 0.8945491354653421, "percentage": 89.47, "elapsed_time": "15:59:32", "remaining_time": "1:52:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4755, "total_steps": 5309, "loss": 3.0107, "learning_rate": 1e-05, "epoch": 0.895490766134253, "percentage": 89.56, "elapsed_time": "16:00:26", "remaining_time": "1:51:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4760, "total_steps": 5309, "loss": 3.0275, "learning_rate": 1e-05, "epoch": 0.8964323968031639, "percentage": 89.66, "elapsed_time": "16:01:21", "remaining_time": "1:50:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4765, "total_steps": 5309, "loss": 2.9595, "learning_rate": 1e-05, "epoch": 0.8973740274720747, "percentage": 89.75, "elapsed_time": "16:02:16", "remaining_time": "1:49:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4770, "total_steps": 5309, "loss": 3.0929, "learning_rate": 1e-05, "epoch": 0.8983156581409857, "percentage": 89.85, "elapsed_time": "16:03:09", "remaining_time": "1:48:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4775, "total_steps": 5309, "loss": 3.1027, "learning_rate": 1e-05, "epoch": 0.8992572888098965, "percentage": 89.94, "elapsed_time": "16:04:03", "remaining_time": "1:47:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4780, "total_steps": 5309, "loss": 2.9818, "learning_rate": 1e-05, "epoch": 0.9001989194788075, "percentage": 90.04, "elapsed_time": "16:04:55", "remaining_time": "1:46:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4785, "total_steps": 5309, "loss": 2.996, "learning_rate": 1e-05, "epoch": 0.9011405501477183, "percentage": 90.13, "elapsed_time": "16:05:47", "remaining_time": "1:45:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4790, "total_steps": 5309, "loss": 3.0178, "learning_rate": 1e-05, "epoch": 0.9020821808166292, "percentage": 90.22, "elapsed_time": "16:06:40", "remaining_time": "1:44:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4795, "total_steps": 5309, "loss": 3.0277, "learning_rate": 1e-05, "epoch": 0.9030238114855401, "percentage": 90.32, "elapsed_time": "16:07:35", "remaining_time": "1:43:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4800, "total_steps": 5309, "loss": 2.9376, "learning_rate": 1e-05, "epoch": 0.903965442154451, "percentage": 90.41, "elapsed_time": "16:08:28", "remaining_time": "1:42:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4805, "total_steps": 5309, "loss": 3.0268, "learning_rate": 1e-05, "epoch": 0.9049070728233618, "percentage": 90.51, "elapsed_time": "16:10:41", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4810, "total_steps": 5309, "loss": 3.0405, "learning_rate": 1e-05, "epoch": 0.9058487034922728, "percentage": 90.6, "elapsed_time": "16:11:36", "remaining_time": "1:40:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4815, "total_steps": 5309, "loss": 3.1039, "learning_rate": 1e-05, "epoch": 0.9067903341611836, "percentage": 90.7, "elapsed_time": "16:12:28", "remaining_time": "1:39:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4820, "total_steps": 5309, "loss": 3.0336, "learning_rate": 1e-05, "epoch": 0.9077319648300946, "percentage": 90.79, "elapsed_time": "16:13:24", "remaining_time": "1:38:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4825, "total_steps": 5309, "loss": 3.1019, "learning_rate": 1e-05, "epoch": 0.9086735954990054, "percentage": 90.88, "elapsed_time": "16:14:16", "remaining_time": "1:37:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4830, "total_steps": 5309, "loss": 2.9516, "learning_rate": 1e-05, "epoch": 0.9096152261679162, "percentage": 90.98, "elapsed_time": "16:15:11", "remaining_time": "1:36:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4835, "total_steps": 5309, "loss": 2.979, "learning_rate": 1e-05, "epoch": 0.9105568568368272, "percentage": 91.07, "elapsed_time": "16:16:06", "remaining_time": "1:35:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4840, "total_steps": 5309, "loss": 3.0011, "learning_rate": 1e-05, "epoch": 0.911498487505738, "percentage": 91.17, "elapsed_time": "16:17:00", "remaining_time": "1:34:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4845, "total_steps": 5309, "loss": 2.8976, "learning_rate": 1e-05, "epoch": 0.912440118174649, "percentage": 91.26, "elapsed_time": "16:17:53", "remaining_time": "1:33:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4850, "total_steps": 5309, "loss": 3.0961, "learning_rate": 1e-05, "epoch": 0.9133817488435598, "percentage": 91.35, "elapsed_time": "16:18:46", "remaining_time": "1:32:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4855, "total_steps": 5309, "loss": 2.9493, "learning_rate": 1e-05, "epoch": 0.9143233795124707, "percentage": 91.45, "elapsed_time": "16:19:40", "remaining_time": "1:31:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4860, "total_steps": 5309, "loss": 2.9642, "learning_rate": 1e-05, "epoch": 0.9152650101813816, "percentage": 91.54, "elapsed_time": "16:20:33", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4865, "total_steps": 5309, "loss": 2.9965, "learning_rate": 1e-05, "epoch": 0.9162066408502925, "percentage": 91.64, "elapsed_time": "16:21:26", "remaining_time": "1:29:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4870, "total_steps": 5309, "loss": 3.0096, "learning_rate": 1e-05, "epoch": 0.9171482715192034, "percentage": 91.73, "elapsed_time": "16:22:19", "remaining_time": "1:28:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4875, "total_steps": 5309, "loss": 3.0186, "learning_rate": 1e-05, "epoch": 0.9180899021881143, "percentage": 91.83, "elapsed_time": "16:23:10", "remaining_time": "1:27:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4880, "total_steps": 5309, "loss": 2.9532, "learning_rate": 1e-05, "epoch": 0.9190315328570251, "percentage": 91.92, "elapsed_time": "16:24:06", "remaining_time": "1:26:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4885, "total_steps": 5309, "loss": 2.964, "learning_rate": 1e-05, "epoch": 0.919973163525936, "percentage": 92.01, "elapsed_time": "16:25:00", "remaining_time": "1:25:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4890, "total_steps": 5309, "loss": 2.9265, "learning_rate": 1e-05, "epoch": 0.9209147941948469, "percentage": 92.11, "elapsed_time": "16:25:54", "remaining_time": "1:24:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4895, "total_steps": 5309, "loss": 2.9748, "learning_rate": 1e-05, "epoch": 0.9218564248637579, "percentage": 92.2, "elapsed_time": "16:26:49", "remaining_time": "1:23:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4900, "total_steps": 5309, "loss": 2.9084, "learning_rate": 1e-05, "epoch": 0.9227980555326687, "percentage": 92.3, "elapsed_time": "16:27:44", "remaining_time": "1:22:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4905, "total_steps": 5309, "loss": 3.0383, "learning_rate": 1e-05, "epoch": 0.9237396862015795, "percentage": 92.39, "elapsed_time": "16:28:38", "remaining_time": "1:21:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4910, "total_steps": 5309, "loss": 2.9808, "learning_rate": 1e-05, "epoch": 0.9246813168704905, "percentage": 92.48, "elapsed_time": "16:29:31", "remaining_time": "1:20:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4915, "total_steps": 5309, "loss": 3.0511, "learning_rate": 1e-05, "epoch": 0.9256229475394013, "percentage": 92.58, "elapsed_time": "16:30:25", "remaining_time": "1:19:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4920, "total_steps": 5309, "loss": 3.0086, "learning_rate": 1e-05, "epoch": 0.9265645782083123, "percentage": 92.67, "elapsed_time": "16:31:19", "remaining_time": "1:18:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4925, "total_steps": 5309, "loss": 3.0951, "learning_rate": 1e-05, "epoch": 0.9275062088772231, "percentage": 92.77, "elapsed_time": "16:32:11", "remaining_time": "1:17:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4930, "total_steps": 5309, "loss": 3.0002, "learning_rate": 1e-05, "epoch": 0.928447839546134, "percentage": 92.86, "elapsed_time": "16:33:05", "remaining_time": "1:16:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4935, "total_steps": 5309, "loss": 2.9763, "learning_rate": 1e-05, "epoch": 0.9293894702150449, "percentage": 92.96, "elapsed_time": "16:33:57", "remaining_time": "1:15:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4940, "total_steps": 5309, "loss": 2.9946, "learning_rate": 1e-05, "epoch": 0.9303311008839558, "percentage": 93.05, "elapsed_time": "16:34:50", "remaining_time": "1:14:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4945, "total_steps": 5309, "loss": 3.0732, "learning_rate": 1e-05, "epoch": 0.9312727315528667, "percentage": 93.14, "elapsed_time": "16:35:45", "remaining_time": "1:13:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4950, "total_steps": 5309, "loss": 3.0506, "learning_rate": 1e-05, "epoch": 0.9322143622217776, "percentage": 93.24, "elapsed_time": "16:36:37", "remaining_time": "1:12:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4955, "total_steps": 5309, "loss": 2.9862, "learning_rate": 1e-05, "epoch": 0.9331559928906884, "percentage": 93.33, "elapsed_time": "16:37:33", "remaining_time": "1:11:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4960, "total_steps": 5309, "loss": 2.9428, "learning_rate": 1e-05, "epoch": 0.9340976235595994, "percentage": 93.43, "elapsed_time": "16:38:28", "remaining_time": "1:10:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4965, "total_steps": 5309, "loss": 3.0667, "learning_rate": 1e-05, "epoch": 0.9350392542285102, "percentage": 93.52, "elapsed_time": "16:39:23", "remaining_time": "1:09:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4970, "total_steps": 5309, "loss": 2.9411, "learning_rate": 1e-05, "epoch": 0.9359808848974212, "percentage": 93.61, "elapsed_time": "16:40:18", "remaining_time": "1:08:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4975, "total_steps": 5309, "loss": 3.0971, "learning_rate": 1e-05, "epoch": 0.936922515566332, "percentage": 93.71, "elapsed_time": "16:41:11", "remaining_time": "1:07:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4980, "total_steps": 5309, "loss": 3.1249, "learning_rate": 1e-05, "epoch": 0.9378641462352428, "percentage": 93.8, "elapsed_time": "16:42:04", "remaining_time": "1:06:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4985, "total_steps": 5309, "loss": 3.0034, "learning_rate": 1e-05, "epoch": 0.9388057769041538, "percentage": 93.9, "elapsed_time": "16:42:57", "remaining_time": "1:05:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4990, "total_steps": 5309, "loss": 3.0705, "learning_rate": 1e-05, "epoch": 0.9397474075730646, "percentage": 93.99, "elapsed_time": "16:43:50", "remaining_time": "1:04:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4995, "total_steps": 5309, "loss": 2.9683, "learning_rate": 1e-05, "epoch": 0.9406890382419756, "percentage": 94.09, "elapsed_time": "16:44:42", "remaining_time": "1:03:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5000, "total_steps": 5309, "loss": 2.9827, "learning_rate": 1e-05, "epoch": 0.9416306689108864, "percentage": 94.18, "elapsed_time": "16:45:36", "remaining_time": "1:02:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5000, "total_steps": 5309, "eval_loss": 3.008730888366699, "epoch": 0.9416306689108864, "percentage": 94.18, "elapsed_time": "17:02:55", "remaining_time": "1:03:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5005, "total_steps": 5309, "loss": 2.9817, "learning_rate": 1e-05, "epoch": 0.9425722995797973, "percentage": 94.27, "elapsed_time": "17:05:12", "remaining_time": "1:02:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5010, "total_steps": 5309, "loss": 3.0721, "learning_rate": 1e-05, "epoch": 0.9435139302487082, "percentage": 94.37, "elapsed_time": "17:06:06", "remaining_time": "1:01:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5015, "total_steps": 5309, "loss": 3.0179, "learning_rate": 1e-05, "epoch": 0.9444555609176191, "percentage": 94.46, "elapsed_time": "17:07:00", "remaining_time": "1:00:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5020, "total_steps": 5309, "loss": 3.0148, "learning_rate": 1e-05, "epoch": 0.94539719158653, "percentage": 94.56, "elapsed_time": "17:07:52", "remaining_time": "0:59:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5025, "total_steps": 5309, "loss": 3.0165, "learning_rate": 1e-05, "epoch": 0.9463388222554409, "percentage": 94.65, "elapsed_time": "17:08:46", "remaining_time": "0:58:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5030, "total_steps": 5309, "loss": 2.9934, "learning_rate": 1e-05, "epoch": 0.9472804529243517, "percentage": 94.74, "elapsed_time": "17:09:37", "remaining_time": "0:57:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5035, "total_steps": 5309, "loss": 3.0171, "learning_rate": 1e-05, "epoch": 0.9482220835932627, "percentage": 94.84, "elapsed_time": "17:10:29", "remaining_time": "0:56:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5040, "total_steps": 5309, "loss": 2.932, "learning_rate": 1e-05, "epoch": 0.9491637142621735, "percentage": 94.93, "elapsed_time": "17:11:24", "remaining_time": "0:55:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5045, "total_steps": 5309, "loss": 2.9003, "learning_rate": 1e-05, "epoch": 0.9501053449310845, "percentage": 95.03, "elapsed_time": "17:12:18", "remaining_time": "0:54:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5050, "total_steps": 5309, "loss": 3.066, "learning_rate": 1e-05, "epoch": 0.9510469755999953, "percentage": 95.12, "elapsed_time": "17:13:14", "remaining_time": "0:52:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5055, "total_steps": 5309, "loss": 3.0384, "learning_rate": 1e-05, "epoch": 0.9519886062689061, "percentage": 95.22, "elapsed_time": "17:14:10", "remaining_time": "0:51:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5060, "total_steps": 5309, "loss": 3.1658, "learning_rate": 1e-05, "epoch": 0.9529302369378171, "percentage": 95.31, "elapsed_time": "17:15:07", "remaining_time": "0:50:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5065, "total_steps": 5309, "loss": 3.0877, "learning_rate": 1e-05, "epoch": 0.9538718676067279, "percentage": 95.4, "elapsed_time": "17:15:59", "remaining_time": "0:49:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5070, "total_steps": 5309, "loss": 2.9102, "learning_rate": 1e-05, "epoch": 0.9548134982756389, "percentage": 95.5, "elapsed_time": "17:16:52", "remaining_time": "0:48:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5075, "total_steps": 5309, "loss": 2.9883, "learning_rate": 1e-05, "epoch": 0.9557551289445497, "percentage": 95.59, "elapsed_time": "17:17:45", "remaining_time": "0:47:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5080, "total_steps": 5309, "loss": 3.0714, "learning_rate": 1e-05, "epoch": 0.9566967596134606, "percentage": 95.69, "elapsed_time": "17:18:36", "remaining_time": "0:46:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5085, "total_steps": 5309, "loss": 2.9703, "learning_rate": 1e-05, "epoch": 0.9576383902823715, "percentage": 95.78, "elapsed_time": "17:19:30", "remaining_time": "0:45:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5090, "total_steps": 5309, "loss": 3.0111, "learning_rate": 1e-05, "epoch": 0.9585800209512824, "percentage": 95.87, "elapsed_time": "17:20:23", "remaining_time": "0:44:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5095, "total_steps": 5309, "loss": 3.0237, "learning_rate": 1e-05, "epoch": 0.9595216516201933, "percentage": 95.97, "elapsed_time": "17:21:16", "remaining_time": "0:43:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5100, "total_steps": 5309, "loss": 2.9803, "learning_rate": 1e-05, "epoch": 0.9604632822891042, "percentage": 96.06, "elapsed_time": "17:22:10", "remaining_time": "0:42:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5105, "total_steps": 5309, "loss": 2.941, "learning_rate": 1e-05, "epoch": 0.961404912958015, "percentage": 96.16, "elapsed_time": "17:23:06", "remaining_time": "0:41:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5110, "total_steps": 5309, "loss": 3.1096, "learning_rate": 1e-05, "epoch": 0.962346543626926, "percentage": 96.25, "elapsed_time": "17:24:00", "remaining_time": "0:40:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5115, "total_steps": 5309, "loss": 3.0179, "learning_rate": 1e-05, "epoch": 0.9632881742958368, "percentage": 96.35, "elapsed_time": "17:24:53", "remaining_time": "0:39:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5120, "total_steps": 5309, "loss": 3.1118, "learning_rate": 1e-05, "epoch": 0.9642298049647477, "percentage": 96.44, "elapsed_time": "17:25:47", "remaining_time": "0:38:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5125, "total_steps": 5309, "loss": 2.9616, "learning_rate": 1e-05, "epoch": 0.9651714356336586, "percentage": 96.53, "elapsed_time": "17:26:42", "remaining_time": "0:37:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5130, "total_steps": 5309, "loss": 2.8741, "learning_rate": 1e-05, "epoch": 0.9661130663025694, "percentage": 96.63, "elapsed_time": "17:27:36", "remaining_time": "0:36:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5135, "total_steps": 5309, "loss": 3.0775, "learning_rate": 1e-05, "epoch": 0.9670546969714804, "percentage": 96.72, "elapsed_time": "17:28:29", "remaining_time": "0:35:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5140, "total_steps": 5309, "loss": 3.0476, "learning_rate": 1e-05, "epoch": 0.9679963276403912, "percentage": 96.82, "elapsed_time": "17:29:21", "remaining_time": "0:34:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5145, "total_steps": 5309, "loss": 3.0245, "learning_rate": 1e-05, "epoch": 0.9689379583093022, "percentage": 96.91, "elapsed_time": "17:30:12", "remaining_time": "0:33:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5150, "total_steps": 5309, "loss": 2.9943, "learning_rate": 1e-05, "epoch": 0.969879588978213, "percentage": 97.01, "elapsed_time": "17:31:06", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5155, "total_steps": 5309, "loss": 3.0385, "learning_rate": 1e-05, "epoch": 0.9708212196471239, "percentage": 97.1, "elapsed_time": "17:31:58", "remaining_time": "0:31:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5160, "total_steps": 5309, "loss": 3.0848, "learning_rate": 1e-05, "epoch": 0.9717628503160348, "percentage": 97.19, "elapsed_time": "17:32:49", "remaining_time": "0:30:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5165, "total_steps": 5309, "loss": 3.0152, "learning_rate": 1e-05, "epoch": 0.9727044809849457, "percentage": 97.29, "elapsed_time": "17:33:43", "remaining_time": "0:29:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5170, "total_steps": 5309, "loss": 2.91, "learning_rate": 1e-05, "epoch": 0.9736461116538566, "percentage": 97.38, "elapsed_time": "17:34:37", "remaining_time": "0:28:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5175, "total_steps": 5309, "loss": 3.0045, "learning_rate": 1e-05, "epoch": 0.9745877423227675, "percentage": 97.48, "elapsed_time": "17:35:30", "remaining_time": "0:27:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5180, "total_steps": 5309, "loss": 2.9847, "learning_rate": 1e-05, "epoch": 0.9755293729916783, "percentage": 97.57, "elapsed_time": "17:36:24", "remaining_time": "0:26:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5185, "total_steps": 5309, "loss": 2.9757, "learning_rate": 1e-05, "epoch": 0.9764710036605893, "percentage": 97.66, "elapsed_time": "17:37:18", "remaining_time": "0:25:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5190, "total_steps": 5309, "loss": 2.9804, "learning_rate": 1e-05, "epoch": 0.9774126343295001, "percentage": 97.76, "elapsed_time": "17:38:12", "remaining_time": "0:24:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5195, "total_steps": 5309, "loss": 2.9841, "learning_rate": 1e-05, "epoch": 0.978354264998411, "percentage": 97.85, "elapsed_time": "17:39:05", "remaining_time": "0:23:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5200, "total_steps": 5309, "loss": 3.1176, "learning_rate": 1e-05, "epoch": 0.9792958956673219, "percentage": 97.95, "elapsed_time": "17:39:59", "remaining_time": "0:22:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5205, "total_steps": 5309, "loss": 2.9664, "learning_rate": 1e-05, "epoch": 0.9802375263362327, "percentage": 98.04, "elapsed_time": "17:42:11", "remaining_time": "0:21:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5210, "total_steps": 5309, "loss": 2.9684, "learning_rate": 1e-05, "epoch": 0.9811791570051437, "percentage": 98.14, "elapsed_time": "17:43:06", "remaining_time": "0:20:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5215, "total_steps": 5309, "loss": 2.8905, "learning_rate": 1e-05, "epoch": 0.9821207876740545, "percentage": 98.23, "elapsed_time": "17:43:58", "remaining_time": "0:19:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5220, "total_steps": 5309, "loss": 3.0164, "learning_rate": 1e-05, "epoch": 0.9830624183429655, "percentage": 98.32, "elapsed_time": "17:44:51", "remaining_time": "0:18:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5225, "total_steps": 5309, "loss": 2.9722, "learning_rate": 1e-05, "epoch": 0.9840040490118763, "percentage": 98.42, "elapsed_time": "17:45:43", "remaining_time": "0:17:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5230, "total_steps": 5309, "loss": 2.9922, "learning_rate": 1e-05, "epoch": 0.9849456796807872, "percentage": 98.51, "elapsed_time": "17:46:38", "remaining_time": "0:16:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5235, "total_steps": 5309, "loss": 2.9465, "learning_rate": 1e-05, "epoch": 0.9858873103496981, "percentage": 98.61, "elapsed_time": "17:47:31", "remaining_time": "0:15:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5240, "total_steps": 5309, "loss": 2.9417, "learning_rate": 1e-05, "epoch": 0.986828941018609, "percentage": 98.7, "elapsed_time": "17:48:23", "remaining_time": "0:14:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5245, "total_steps": 5309, "loss": 3.0678, "learning_rate": 1e-05, "epoch": 0.9877705716875199, "percentage": 98.79, "elapsed_time": "17:49:15", "remaining_time": "0:13:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5250, "total_steps": 5309, "loss": 2.9374, "learning_rate": 1e-05, "epoch": 0.9887122023564308, "percentage": 98.89, "elapsed_time": "17:50:10", "remaining_time": "0:12:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5255, "total_steps": 5309, "loss": 2.9633, "learning_rate": 1e-05, "epoch": 0.9896538330253416, "percentage": 98.98, "elapsed_time": "17:51:04", "remaining_time": "0:11:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5260, "total_steps": 5309, "loss": 3.0061, "learning_rate": 1e-05, "epoch": 0.9905954636942526, "percentage": 99.08, "elapsed_time": "17:51:57", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5265, "total_steps": 5309, "loss": 2.9133, "learning_rate": 1e-05, "epoch": 0.9915370943631634, "percentage": 99.17, "elapsed_time": "17:52:49", "remaining_time": "0:08:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5270, "total_steps": 5309, "loss": 2.9518, "learning_rate": 1e-05, "epoch": 0.9924787250320743, "percentage": 99.27, "elapsed_time": "17:53:43", "remaining_time": "0:07:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5275, "total_steps": 5309, "loss": 3.0659, "learning_rate": 1e-05, "epoch": 0.9934203557009852, "percentage": 99.36, "elapsed_time": "17:54:36", "remaining_time": "0:06:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5280, "total_steps": 5309, "loss": 3.0431, "learning_rate": 1e-05, "epoch": 0.994361986369896, "percentage": 99.45, "elapsed_time": "17:55:28", "remaining_time": "0:05:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5285, "total_steps": 5309, "loss": 2.9397, "learning_rate": 1e-05, "epoch": 0.995303617038807, "percentage": 99.55, "elapsed_time": "17:56:21", "remaining_time": "0:04:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5290, "total_steps": 5309, "loss": 2.9773, "learning_rate": 1e-05, "epoch": 0.9962452477077178, "percentage": 99.64, "elapsed_time": "17:57:13", "remaining_time": "0:03:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5295, "total_steps": 5309, "loss": 2.9691, "learning_rate": 1e-05, "epoch": 0.9971868783766287, "percentage": 99.74, "elapsed_time": "17:58:07", "remaining_time": "0:02:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5300, "total_steps": 5309, "loss": 3.0107, "learning_rate": 1e-05, "epoch": 0.9981285090455396, "percentage": 99.83, "elapsed_time": "17:59:01", "remaining_time": "0:01:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5305, "total_steps": 5309, "loss": 2.9, "learning_rate": 1e-05, "epoch": 0.9990701397144505, "percentage": 99.92, "elapsed_time": "17:59:55", "remaining_time": "0:00:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5309, "total_steps": 5309, "epoch": 0.9998234442495793, "percentage": 100.0, "elapsed_time": "18:01:59", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}