{"current_steps": 1, "total_steps": 4438, "loss": 0.3782, "learning_rate": 2.2522522522522524e-08, "epoch": 0.00022530768580843213, "percentage": 0.02, "elapsed_time": "0:00:14", "remaining_time": "17:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 4438, "loss": 0.3779, "learning_rate": 4.504504504504505e-08, "epoch": 0.00045061537161686426, "percentage": 0.05, "elapsed_time": "0:00:24", "remaining_time": "15:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 4438, "loss": 0.3532, "learning_rate": 6.756756756756757e-08, "epoch": 0.0006759230574252964, "percentage": 0.07, "elapsed_time": "0:00:35", "remaining_time": "14:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 4438, "loss": 0.3981, "learning_rate": 9.00900900900901e-08, "epoch": 0.0009012307432337285, "percentage": 0.09, "elapsed_time": "0:00:46", "remaining_time": "14:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 4438, "loss": 0.3753, "learning_rate": 1.1261261261261262e-07, "epoch": 0.0011265384290421608, "percentage": 0.11, "elapsed_time": "0:00:58", "remaining_time": "14:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 4438, "loss": 0.389, "learning_rate": 1.3513513513513515e-07, "epoch": 0.0013518461148505929, "percentage": 0.14, "elapsed_time": "0:01:08", "remaining_time": "13:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 4438, "loss": 0.3573, "learning_rate": 1.5765765765765766e-07, "epoch": 0.001577153800659025, "percentage": 0.16, "elapsed_time": "0:01:18", "remaining_time": "13:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 4438, "loss": 0.3716, "learning_rate": 1.801801801801802e-07, "epoch": 0.001802461486467457, "percentage": 0.18, "elapsed_time": "0:01:28", "remaining_time": "13:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 4438, "loss": 0.367, "learning_rate": 2.0270270270270273e-07, "epoch": 0.0020277691722758893, "percentage": 0.2, "elapsed_time": "0:01:39", "remaining_time": "13:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 4438, "loss": 0.3763, "learning_rate": 2.2522522522522524e-07, "epoch": 0.0022530768580843216, "percentage": 0.23, "elapsed_time": "0:01:50", "remaining_time": "13:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 4438, "loss": 0.4068, "learning_rate": 2.477477477477478e-07, "epoch": 0.0024783845438927535, "percentage": 0.25, "elapsed_time": "0:02:01", "remaining_time": "13:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 4438, "loss": 0.382, "learning_rate": 2.702702702702703e-07, "epoch": 0.0027036922297011858, "percentage": 0.27, "elapsed_time": "0:02:12", "remaining_time": "13:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 4438, "loss": 0.3716, "learning_rate": 2.927927927927928e-07, "epoch": 0.0029289999155096176, "percentage": 0.29, "elapsed_time": "0:02:24", "remaining_time": "13:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 4438, "loss": 0.3911, "learning_rate": 3.153153153153153e-07, "epoch": 0.00315430760131805, "percentage": 0.32, "elapsed_time": "0:02:34", "remaining_time": "13:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 4438, "loss": 0.3662, "learning_rate": 3.378378378378379e-07, "epoch": 0.003379615287126482, "percentage": 0.34, "elapsed_time": "0:02:45", "remaining_time": "13:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 4438, "loss": 0.3825, "learning_rate": 3.603603603603604e-07, "epoch": 0.003604922972934914, "percentage": 0.36, "elapsed_time": "0:02:56", "remaining_time": "13:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 4438, "loss": 0.3612, "learning_rate": 3.828828828828829e-07, "epoch": 0.0038302306587433463, "percentage": 0.38, "elapsed_time": "0:03:07", "remaining_time": "13:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 4438, "loss": 0.3849, "learning_rate": 4.0540540540540546e-07, "epoch": 0.004055538344551779, "percentage": 0.41, "elapsed_time": "0:03:19", "remaining_time": "13:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 4438, "loss": 0.3798, "learning_rate": 4.27927927927928e-07, "epoch": 0.0042808460303602105, "percentage": 0.43, "elapsed_time": "0:03:29", "remaining_time": "13:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 4438, "loss": 0.3539, "learning_rate": 4.504504504504505e-07, "epoch": 0.004506153716168643, "percentage": 0.45, "elapsed_time": "0:03:40", "remaining_time": "13:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 4438, "loss": 0.3557, "learning_rate": 4.7297297297297305e-07, "epoch": 0.004731461401977075, "percentage": 0.47, "elapsed_time": "0:03:51", "remaining_time": "13:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 4438, "loss": 0.3505, "learning_rate": 4.954954954954956e-07, "epoch": 0.004956769087785507, "percentage": 0.5, "elapsed_time": "0:04:02", "remaining_time": "13:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 4438, "loss": 0.3411, "learning_rate": 5.180180180180181e-07, "epoch": 0.00518207677359394, "percentage": 0.52, "elapsed_time": "0:04:12", "remaining_time": "13:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 4438, "loss": 0.3233, "learning_rate": 5.405405405405406e-07, "epoch": 0.0054073844594023715, "percentage": 0.54, "elapsed_time": "0:04:24", "remaining_time": "13:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 4438, "loss": 0.3374, "learning_rate": 5.630630630630631e-07, "epoch": 0.005632692145210803, "percentage": 0.56, "elapsed_time": "0:04:33", "remaining_time": "13:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 4438, "loss": 0.3429, "learning_rate": 5.855855855855856e-07, "epoch": 0.005857999831019235, "percentage": 0.59, "elapsed_time": "0:04:42", "remaining_time": "13:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 4438, "loss": 0.3614, "learning_rate": 6.081081081081082e-07, "epoch": 0.006083307516827668, "percentage": 0.61, "elapsed_time": "0:04:54", "remaining_time": "13:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 4438, "loss": 0.3176, "learning_rate": 6.306306306306306e-07, "epoch": 0.0063086152026361, "percentage": 0.63, "elapsed_time": "0:05:05", "remaining_time": "13:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 4438, "loss": 0.3203, "learning_rate": 6.531531531531532e-07, "epoch": 0.006533922888444532, "percentage": 0.65, "elapsed_time": "0:05:16", "remaining_time": "13:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 4438, "loss": 0.3, "learning_rate": 6.756756756756758e-07, "epoch": 0.006759230574252964, "percentage": 0.68, "elapsed_time": "0:05:26", "remaining_time": "13:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 4438, "loss": 0.3135, "learning_rate": 6.981981981981982e-07, "epoch": 0.006984538260061396, "percentage": 0.7, "elapsed_time": "0:05:38", "remaining_time": "13:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 4438, "loss": 0.3154, "learning_rate": 7.207207207207208e-07, "epoch": 0.007209845945869828, "percentage": 0.72, "elapsed_time": "0:05:49", "remaining_time": "13:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 4438, "loss": 0.321, "learning_rate": 7.432432432432434e-07, "epoch": 0.007435153631678261, "percentage": 0.74, "elapsed_time": "0:06:01", "remaining_time": "13:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 4438, "loss": 0.2995, "learning_rate": 7.657657657657658e-07, "epoch": 0.007660461317486693, "percentage": 0.77, "elapsed_time": "0:06:12", "remaining_time": "13:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 4438, "loss": 0.3095, "learning_rate": 7.882882882882883e-07, "epoch": 0.007885769003295125, "percentage": 0.79, "elapsed_time": "0:06:23", "remaining_time": "13:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 4438, "loss": 0.2888, "learning_rate": 8.108108108108109e-07, "epoch": 0.008111076689103557, "percentage": 0.81, "elapsed_time": "0:06:34", "remaining_time": "13:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 4438, "loss": 0.2894, "learning_rate": 8.333333333333333e-07, "epoch": 0.008336384374911989, "percentage": 0.83, "elapsed_time": "0:06:44", "remaining_time": "13:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 4438, "loss": 0.3088, "learning_rate": 8.55855855855856e-07, "epoch": 0.008561692060720421, "percentage": 0.86, "elapsed_time": "0:06:55", "remaining_time": "13:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 4438, "loss": 0.292, "learning_rate": 8.783783783783785e-07, "epoch": 0.008786999746528853, "percentage": 0.88, "elapsed_time": "0:07:07", "remaining_time": "13:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 4438, "loss": 0.2841, "learning_rate": 9.00900900900901e-07, "epoch": 0.009012307432337286, "percentage": 0.9, "elapsed_time": "0:07:19", "remaining_time": "13:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 4438, "loss": 0.3068, "learning_rate": 9.234234234234235e-07, "epoch": 0.009237615118145718, "percentage": 0.92, "elapsed_time": "0:07:30", "remaining_time": "13:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 4438, "loss": 0.2993, "learning_rate": 9.459459459459461e-07, "epoch": 0.00946292280395415, "percentage": 0.95, "elapsed_time": "0:07:41", "remaining_time": "13:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 4438, "loss": 0.2768, "learning_rate": 9.684684684684686e-07, "epoch": 0.009688230489762582, "percentage": 0.97, "elapsed_time": "0:07:51", "remaining_time": "13:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 4438, "loss": 0.2762, "learning_rate": 9.909909909909911e-07, "epoch": 0.009913538175571014, "percentage": 0.99, "elapsed_time": "0:08:01", "remaining_time": "13:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 4438, "loss": 0.2687, "learning_rate": 1.0135135135135136e-06, "epoch": 0.010138845861379446, "percentage": 1.01, "elapsed_time": "0:08:11", "remaining_time": "13:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 4438, "loss": 0.2749, "learning_rate": 1.0360360360360361e-06, "epoch": 0.01036415354718788, "percentage": 1.04, "elapsed_time": "0:08:21", "remaining_time": "13:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 4438, "loss": 0.2527, "learning_rate": 1.0585585585585587e-06, "epoch": 0.010589461232996311, "percentage": 1.06, "elapsed_time": "0:08:31", "remaining_time": "13:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 4438, "loss": 0.2806, "learning_rate": 1.0810810810810812e-06, "epoch": 0.010814768918804743, "percentage": 1.08, "elapsed_time": "0:08:42", "remaining_time": "13:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 4438, "loss": 0.2653, "learning_rate": 1.1036036036036037e-06, "epoch": 0.011040076604613175, "percentage": 1.1, "elapsed_time": "0:08:54", "remaining_time": "13:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 4438, "loss": 0.2603, "learning_rate": 1.1261261261261262e-06, "epoch": 0.011265384290421607, "percentage": 1.13, "elapsed_time": "0:09:04", "remaining_time": "13:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 4438, "loss": 0.2657, "learning_rate": 1.148648648648649e-06, "epoch": 0.011490691976230039, "percentage": 1.15, "elapsed_time": "0:09:15", "remaining_time": "13:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 4438, "loss": 0.2782, "learning_rate": 1.1711711711711712e-06, "epoch": 0.01171599966203847, "percentage": 1.17, "elapsed_time": "0:09:26", "remaining_time": "13:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 4438, "loss": 0.2765, "learning_rate": 1.1936936936936937e-06, "epoch": 0.011941307347846904, "percentage": 1.19, "elapsed_time": "0:09:37", "remaining_time": "13:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 4438, "loss": 0.2599, "learning_rate": 1.2162162162162164e-06, "epoch": 0.012166615033655336, "percentage": 1.22, "elapsed_time": "0:09:47", "remaining_time": "13:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 4438, "loss": 0.2867, "learning_rate": 1.2387387387387387e-06, "epoch": 0.012391922719463768, "percentage": 1.24, "elapsed_time": "0:09:59", "remaining_time": "13:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 4438, "loss": 0.2651, "learning_rate": 1.2612612612612613e-06, "epoch": 0.0126172304052722, "percentage": 1.26, "elapsed_time": "0:10:09", "remaining_time": "13:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 4438, "loss": 0.2546, "learning_rate": 1.2837837837837838e-06, "epoch": 0.012842538091080631, "percentage": 1.28, "elapsed_time": "0:10:21", "remaining_time": "13:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 4438, "loss": 0.239, "learning_rate": 1.3063063063063065e-06, "epoch": 0.013067845776889063, "percentage": 1.31, "elapsed_time": "0:10:31", "remaining_time": "13:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 4438, "loss": 0.2632, "learning_rate": 1.328828828828829e-06, "epoch": 0.013293153462697497, "percentage": 1.33, "elapsed_time": "0:10:43", "remaining_time": "13:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 4438, "loss": 0.2618, "learning_rate": 1.3513513513513515e-06, "epoch": 0.013518461148505929, "percentage": 1.35, "elapsed_time": "0:10:55", "remaining_time": "13:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 4438, "loss": 0.2699, "learning_rate": 1.373873873873874e-06, "epoch": 0.01374376883431436, "percentage": 1.37, "elapsed_time": "0:11:06", "remaining_time": "13:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 4438, "loss": 0.2517, "learning_rate": 1.3963963963963963e-06, "epoch": 0.013969076520122792, "percentage": 1.4, "elapsed_time": "0:11:17", "remaining_time": "13:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 4438, "loss": 0.2308, "learning_rate": 1.418918918918919e-06, "epoch": 0.014194384205931224, "percentage": 1.42, "elapsed_time": "0:11:26", "remaining_time": "13:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 4438, "loss": 0.2788, "learning_rate": 1.4414414414414416e-06, "epoch": 0.014419691891739656, "percentage": 1.44, "elapsed_time": "0:11:38", "remaining_time": "13:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 4438, "loss": 0.2625, "learning_rate": 1.463963963963964e-06, "epoch": 0.01464499957754809, "percentage": 1.46, "elapsed_time": "0:11:50", "remaining_time": "13:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 4438, "loss": 0.2588, "learning_rate": 1.4864864864864868e-06, "epoch": 0.014870307263356522, "percentage": 1.49, "elapsed_time": "0:12:01", "remaining_time": "13:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 4438, "loss": 0.2584, "learning_rate": 1.5090090090090093e-06, "epoch": 0.015095614949164953, "percentage": 1.51, "elapsed_time": "0:12:11", "remaining_time": "13:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 4438, "loss": 0.234, "learning_rate": 1.5315315315315316e-06, "epoch": 0.015320922634973385, "percentage": 1.53, "elapsed_time": "0:12:21", "remaining_time": "13:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 4438, "loss": 0.2534, "learning_rate": 1.5540540540540541e-06, "epoch": 0.015546230320781817, "percentage": 1.55, "elapsed_time": "0:12:31", "remaining_time": "13:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 4438, "loss": 0.2593, "learning_rate": 1.5765765765765766e-06, "epoch": 0.01577153800659025, "percentage": 1.58, "elapsed_time": "0:12:43", "remaining_time": "13:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 4438, "loss": 0.2617, "learning_rate": 1.5990990990990993e-06, "epoch": 0.015996845692398683, "percentage": 1.6, "elapsed_time": "0:12:54", "remaining_time": "13:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 4438, "loss": 0.2639, "learning_rate": 1.6216216216216219e-06, "epoch": 0.016222153378207115, "percentage": 1.62, "elapsed_time": "0:13:06", "remaining_time": "13:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 4438, "loss": 0.2271, "learning_rate": 1.6441441441441444e-06, "epoch": 0.016447461064015546, "percentage": 1.64, "elapsed_time": "0:13:16", "remaining_time": "13:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 4438, "loss": 0.2431, "learning_rate": 1.6666666666666667e-06, "epoch": 0.016672768749823978, "percentage": 1.67, "elapsed_time": "0:13:27", "remaining_time": "13:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 4438, "loss": 0.2415, "learning_rate": 1.6891891891891894e-06, "epoch": 0.01689807643563241, "percentage": 1.69, "elapsed_time": "0:13:38", "remaining_time": "13:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 4438, "loss": 0.2381, "learning_rate": 1.711711711711712e-06, "epoch": 0.017123384121440842, "percentage": 1.71, "elapsed_time": "0:13:50", "remaining_time": "13:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 4438, "loss": 0.2341, "learning_rate": 1.7342342342342344e-06, "epoch": 0.017348691807249274, "percentage": 1.74, "elapsed_time": "0:14:01", "remaining_time": "13:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 4438, "loss": 0.2503, "learning_rate": 1.756756756756757e-06, "epoch": 0.017573999493057706, "percentage": 1.76, "elapsed_time": "0:14:13", "remaining_time": "13:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 4438, "loss": 0.2267, "learning_rate": 1.7792792792792792e-06, "epoch": 0.017799307178866138, "percentage": 1.78, "elapsed_time": "0:14:24", "remaining_time": "13:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 4438, "loss": 0.2513, "learning_rate": 1.801801801801802e-06, "epoch": 0.018024614864674573, "percentage": 1.8, "elapsed_time": "0:14:35", "remaining_time": "13:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 4438, "loss": 0.2269, "learning_rate": 1.8243243243243245e-06, "epoch": 0.018249922550483005, "percentage": 1.83, "elapsed_time": "0:14:45", "remaining_time": "13:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 4438, "loss": 0.2435, "learning_rate": 1.846846846846847e-06, "epoch": 0.018475230236291437, "percentage": 1.85, "elapsed_time": "0:14:58", "remaining_time": "13:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 4438, "loss": 0.242, "learning_rate": 1.8693693693693697e-06, "epoch": 0.01870053792209987, "percentage": 1.87, "elapsed_time": "0:15:08", "remaining_time": "13:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 4438, "loss": 0.2466, "learning_rate": 1.8918918918918922e-06, "epoch": 0.0189258456079083, "percentage": 1.89, "elapsed_time": "0:15:19", "remaining_time": "13:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 4438, "loss": 0.2158, "learning_rate": 1.9144144144144145e-06, "epoch": 0.019151153293716732, "percentage": 1.92, "elapsed_time": "0:15:29", "remaining_time": "13:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 4438, "loss": 0.2196, "learning_rate": 1.9369369369369372e-06, "epoch": 0.019376460979525164, "percentage": 1.94, "elapsed_time": "0:15:40", "remaining_time": "13:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 4438, "loss": 0.2386, "learning_rate": 1.9594594594594595e-06, "epoch": 0.019601768665333596, "percentage": 1.96, "elapsed_time": "0:15:51", "remaining_time": "13:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 4438, "loss": 0.2356, "learning_rate": 1.9819819819819822e-06, "epoch": 0.019827076351142028, "percentage": 1.98, "elapsed_time": "0:16:02", "remaining_time": "13:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 4438, "loss": 0.2262, "learning_rate": 2.0045045045045045e-06, "epoch": 0.02005238403695046, "percentage": 2.01, "elapsed_time": "0:16:13", "remaining_time": "13:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 4438, "loss": 0.2325, "learning_rate": 2.0270270270270273e-06, "epoch": 0.02027769172275889, "percentage": 2.03, "elapsed_time": "0:16:26", "remaining_time": "13:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 4438, "loss": 0.2546, "learning_rate": 2.0495495495495496e-06, "epoch": 0.020502999408567323, "percentage": 2.05, "elapsed_time": "0:16:36", "remaining_time": "13:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 4438, "loss": 0.2411, "learning_rate": 2.0720720720720723e-06, "epoch": 0.02072830709437576, "percentage": 2.07, "elapsed_time": "0:16:47", "remaining_time": "13:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 4438, "loss": 0.2287, "learning_rate": 2.0945945945945946e-06, "epoch": 0.02095361478018419, "percentage": 2.1, "elapsed_time": "0:16:58", "remaining_time": "13:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 4438, "loss": 0.2431, "learning_rate": 2.1171171171171173e-06, "epoch": 0.021178922465992622, "percentage": 2.12, "elapsed_time": "0:17:09", "remaining_time": "13:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 4438, "loss": 0.2242, "learning_rate": 2.13963963963964e-06, "epoch": 0.021404230151801054, "percentage": 2.14, "elapsed_time": "0:17:20", "remaining_time": "13:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 4438, "loss": 0.2491, "learning_rate": 2.1621621621621623e-06, "epoch": 0.021629537837609486, "percentage": 2.16, "elapsed_time": "0:17:32", "remaining_time": "13:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 4438, "loss": 0.2291, "learning_rate": 2.1846846846846846e-06, "epoch": 0.021854845523417918, "percentage": 2.19, "elapsed_time": "0:17:44", "remaining_time": "13:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 4438, "loss": 0.2534, "learning_rate": 2.2072072072072073e-06, "epoch": 0.02208015320922635, "percentage": 2.21, "elapsed_time": "0:17:54", "remaining_time": "13:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 4438, "loss": 0.2545, "learning_rate": 2.22972972972973e-06, "epoch": 0.02230546089503478, "percentage": 2.23, "elapsed_time": "0:18:04", "remaining_time": "13:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 4438, "loss": 0.2233, "learning_rate": 2.2522522522522524e-06, "epoch": 0.022530768580843213, "percentage": 2.25, "elapsed_time": "0:18:14", "remaining_time": "13:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 4438, "loss": 0.2137, "learning_rate": 2.274774774774775e-06, "epoch": 0.022756076266651645, "percentage": 2.28, "elapsed_time": "0:18:24", "remaining_time": "13:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 4438, "loss": 0.2223, "learning_rate": 2.297297297297298e-06, "epoch": 0.022981383952460077, "percentage": 2.3, "elapsed_time": "0:18:35", "remaining_time": "13:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 4438, "loss": 0.2311, "learning_rate": 2.31981981981982e-06, "epoch": 0.02320669163826851, "percentage": 2.32, "elapsed_time": "0:18:46", "remaining_time": "13:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 4438, "loss": 0.2259, "learning_rate": 2.3423423423423424e-06, "epoch": 0.02343199932407694, "percentage": 2.34, "elapsed_time": "0:18:58", "remaining_time": "13:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 4438, "loss": 0.2443, "learning_rate": 2.364864864864865e-06, "epoch": 0.023657307009885376, "percentage": 2.37, "elapsed_time": "0:19:09", "remaining_time": "13:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 4438, "loss": 0.227, "learning_rate": 2.3873873873873874e-06, "epoch": 0.023882614695693808, "percentage": 2.39, "elapsed_time": "0:19:20", "remaining_time": "13:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 4438, "loss": 0.2205, "learning_rate": 2.40990990990991e-06, "epoch": 0.02410792238150224, "percentage": 2.41, "elapsed_time": "0:19:32", "remaining_time": "13:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 4438, "loss": 0.2205, "learning_rate": 2.432432432432433e-06, "epoch": 0.024333230067310672, "percentage": 2.43, "elapsed_time": "0:19:42", "remaining_time": "13:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 4438, "loss": 0.2378, "learning_rate": 2.454954954954955e-06, "epoch": 0.024558537753119104, "percentage": 2.46, "elapsed_time": "0:19:53", "remaining_time": "13:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 4438, "loss": 0.2139, "learning_rate": 2.4774774774774775e-06, "epoch": 0.024783845438927535, "percentage": 2.48, "elapsed_time": "0:20:04", "remaining_time": "13:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 4438, "loss": 0.2298, "learning_rate": 2.5e-06, "epoch": 0.025009153124735967, "percentage": 2.5, "elapsed_time": "0:20:13", "remaining_time": "13:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 4438, "loss": 0.246, "learning_rate": 2.5225225225225225e-06, "epoch": 0.0252344608105444, "percentage": 2.52, "elapsed_time": "0:20:25", "remaining_time": "13:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 4438, "loss": 0.2104, "learning_rate": 2.5450450450450452e-06, "epoch": 0.02545976849635283, "percentage": 2.55, "elapsed_time": "0:20:36", "remaining_time": "13:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 4438, "loss": 0.2266, "learning_rate": 2.5675675675675675e-06, "epoch": 0.025685076182161263, "percentage": 2.57, "elapsed_time": "0:20:46", "remaining_time": "13:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 4438, "loss": 0.2411, "learning_rate": 2.5900900900900907e-06, "epoch": 0.025910383867969695, "percentage": 2.59, "elapsed_time": "0:20:56", "remaining_time": "13:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 4438, "loss": 0.2297, "learning_rate": 2.612612612612613e-06, "epoch": 0.026135691553778127, "percentage": 2.61, "elapsed_time": "0:21:06", "remaining_time": "13:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 4438, "loss": 0.2245, "learning_rate": 2.6351351351351353e-06, "epoch": 0.026360999239586562, "percentage": 2.64, "elapsed_time": "0:21:18", "remaining_time": "13:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 4438, "loss": 0.2283, "learning_rate": 2.657657657657658e-06, "epoch": 0.026586306925394994, "percentage": 2.66, "elapsed_time": "0:21:29", "remaining_time": "13:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 4438, "loss": 0.2258, "learning_rate": 2.6801801801801803e-06, "epoch": 0.026811614611203426, "percentage": 2.68, "elapsed_time": "0:21:40", "remaining_time": "13:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 4438, "loss": 0.2227, "learning_rate": 2.702702702702703e-06, "epoch": 0.027036922297011858, "percentage": 2.7, "elapsed_time": "0:21:50", "remaining_time": "13:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 4438, "loss": 0.2194, "learning_rate": 2.7252252252252253e-06, "epoch": 0.02726222998282029, "percentage": 2.73, "elapsed_time": "0:22:00", "remaining_time": "13:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 4438, "loss": 0.23, "learning_rate": 2.747747747747748e-06, "epoch": 0.02748753766862872, "percentage": 2.75, "elapsed_time": "0:22:10", "remaining_time": "13:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 4438, "loss": 0.2195, "learning_rate": 2.7702702702702703e-06, "epoch": 0.027712845354437153, "percentage": 2.77, "elapsed_time": "0:22:22", "remaining_time": "13:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 4438, "loss": 0.2396, "learning_rate": 2.7927927927927926e-06, "epoch": 0.027938153040245585, "percentage": 2.79, "elapsed_time": "0:22:31", "remaining_time": "13:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 4438, "loss": 0.2236, "learning_rate": 2.8153153153153158e-06, "epoch": 0.028163460726054017, "percentage": 2.82, "elapsed_time": "0:22:40", "remaining_time": "13:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 4438, "loss": 0.2341, "learning_rate": 2.837837837837838e-06, "epoch": 0.02838876841186245, "percentage": 2.84, "elapsed_time": "0:22:52", "remaining_time": "13:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 4438, "loss": 0.2361, "learning_rate": 2.860360360360361e-06, "epoch": 0.02861407609767088, "percentage": 2.86, "elapsed_time": "0:23:04", "remaining_time": "13:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 4438, "loss": 0.2177, "learning_rate": 2.882882882882883e-06, "epoch": 0.028839383783479312, "percentage": 2.88, "elapsed_time": "0:23:15", "remaining_time": "13:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 4438, "loss": 0.2333, "learning_rate": 2.9054054054054054e-06, "epoch": 0.029064691469287748, "percentage": 2.91, "elapsed_time": "0:23:26", "remaining_time": "13:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 4438, "loss": 0.2413, "learning_rate": 2.927927927927928e-06, "epoch": 0.02928999915509618, "percentage": 2.93, "elapsed_time": "0:23:38", "remaining_time": "13:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 4438, "loss": 0.2172, "learning_rate": 2.9504504504504504e-06, "epoch": 0.02951530684090461, "percentage": 2.95, "elapsed_time": "0:23:49", "remaining_time": "13:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 4438, "loss": 0.2331, "learning_rate": 2.9729729729729736e-06, "epoch": 0.029740614526713043, "percentage": 2.97, "elapsed_time": "0:24:00", "remaining_time": "13:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 4438, "loss": 0.2344, "learning_rate": 2.995495495495496e-06, "epoch": 0.029965922212521475, "percentage": 3.0, "elapsed_time": "0:24:10", "remaining_time": "13:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 4438, "loss": 0.2199, "learning_rate": 3.0180180180180186e-06, "epoch": 0.030191229898329907, "percentage": 3.02, "elapsed_time": "0:24:20", "remaining_time": "13:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 4438, "loss": 0.2335, "learning_rate": 3.040540540540541e-06, "epoch": 0.03041653758413834, "percentage": 3.04, "elapsed_time": "0:24:30", "remaining_time": "13:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 4438, "loss": 0.2289, "learning_rate": 3.063063063063063e-06, "epoch": 0.03064184526994677, "percentage": 3.06, "elapsed_time": "0:24:40", "remaining_time": "13:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 4438, "loss": 0.2219, "learning_rate": 3.085585585585586e-06, "epoch": 0.030867152955755203, "percentage": 3.09, "elapsed_time": "0:24:51", "remaining_time": "13:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 4438, "loss": 0.2218, "learning_rate": 3.1081081081081082e-06, "epoch": 0.031092460641563634, "percentage": 3.11, "elapsed_time": "0:25:01", "remaining_time": "12:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 4438, "loss": 0.221, "learning_rate": 3.130630630630631e-06, "epoch": 0.03131776832737207, "percentage": 3.13, "elapsed_time": "0:25:13", "remaining_time": "13:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 4438, "loss": 0.2153, "learning_rate": 3.1531531531531532e-06, "epoch": 0.0315430760131805, "percentage": 3.15, "elapsed_time": "0:25:22", "remaining_time": "12:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 4438, "loss": 0.2199, "learning_rate": 3.1756756756756755e-06, "epoch": 0.03176838369898893, "percentage": 3.18, "elapsed_time": "0:25:34", "remaining_time": "12:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 4438, "loss": 0.2272, "learning_rate": 3.1981981981981987e-06, "epoch": 0.031993691384797365, "percentage": 3.2, "elapsed_time": "0:25:46", "remaining_time": "12:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 4438, "loss": 0.24, "learning_rate": 3.220720720720721e-06, "epoch": 0.0322189990706058, "percentage": 3.22, "elapsed_time": "0:25:57", "remaining_time": "12:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 4438, "loss": 0.2297, "learning_rate": 3.2432432432432437e-06, "epoch": 0.03244430675641423, "percentage": 3.24, "elapsed_time": "0:26:08", "remaining_time": "12:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 4438, "loss": 0.2382, "learning_rate": 3.265765765765766e-06, "epoch": 0.03266961444222266, "percentage": 3.27, "elapsed_time": "0:26:20", "remaining_time": "13:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 4438, "loss": 0.211, "learning_rate": 3.2882882882882887e-06, "epoch": 0.03289492212803109, "percentage": 3.29, "elapsed_time": "0:26:30", "remaining_time": "12:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 4438, "loss": 0.2104, "learning_rate": 3.310810810810811e-06, "epoch": 0.033120229813839525, "percentage": 3.31, "elapsed_time": "0:26:40", "remaining_time": "12:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 4438, "loss": 0.2072, "learning_rate": 3.3333333333333333e-06, "epoch": 0.033345537499647956, "percentage": 3.33, "elapsed_time": "0:26:51", "remaining_time": "12:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 4438, "loss": 0.2063, "learning_rate": 3.3558558558558565e-06, "epoch": 0.03357084518545639, "percentage": 3.36, "elapsed_time": "0:27:01", "remaining_time": "12:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 4438, "loss": 0.2259, "learning_rate": 3.3783783783783788e-06, "epoch": 0.03379615287126482, "percentage": 3.38, "elapsed_time": "0:27:11", "remaining_time": "12:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 4438, "loss": 0.2293, "learning_rate": 3.4009009009009015e-06, "epoch": 0.03402146055707325, "percentage": 3.4, "elapsed_time": "0:27:22", "remaining_time": "12:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 4438, "loss": 0.2028, "learning_rate": 3.423423423423424e-06, "epoch": 0.034246768242881684, "percentage": 3.42, "elapsed_time": "0:27:31", "remaining_time": "12:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 4438, "loss": 0.2085, "learning_rate": 3.445945945945946e-06, "epoch": 0.034472075928690116, "percentage": 3.45, "elapsed_time": "0:27:43", "remaining_time": "12:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 4438, "loss": 0.2179, "learning_rate": 3.468468468468469e-06, "epoch": 0.03469738361449855, "percentage": 3.47, "elapsed_time": "0:27:54", "remaining_time": "12:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 4438, "loss": 0.2214, "learning_rate": 3.490990990990991e-06, "epoch": 0.03492269130030698, "percentage": 3.49, "elapsed_time": "0:28:04", "remaining_time": "12:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 4438, "loss": 0.2385, "learning_rate": 3.513513513513514e-06, "epoch": 0.03514799898611541, "percentage": 3.52, "elapsed_time": "0:28:15", "remaining_time": "12:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 4438, "loss": 0.2183, "learning_rate": 3.536036036036036e-06, "epoch": 0.03537330667192384, "percentage": 3.54, "elapsed_time": "0:28:26", "remaining_time": "12:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 4438, "loss": 0.2074, "learning_rate": 3.5585585585585584e-06, "epoch": 0.035598614357732275, "percentage": 3.56, "elapsed_time": "0:28:36", "remaining_time": "12:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 4438, "loss": 0.2058, "learning_rate": 3.5810810810810816e-06, "epoch": 0.03582392204354071, "percentage": 3.58, "elapsed_time": "0:28:45", "remaining_time": "12:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 4438, "loss": 0.2505, "learning_rate": 3.603603603603604e-06, "epoch": 0.036049229729349146, "percentage": 3.61, "elapsed_time": "0:28:56", "remaining_time": "12:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 4438, "loss": 0.2267, "learning_rate": 3.6261261261261266e-06, "epoch": 0.03627453741515758, "percentage": 3.63, "elapsed_time": "0:29:06", "remaining_time": "12:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 4438, "loss": 0.2203, "learning_rate": 3.648648648648649e-06, "epoch": 0.03649984510096601, "percentage": 3.65, "elapsed_time": "0:29:16", "remaining_time": "12:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 4438, "loss": 0.2004, "learning_rate": 3.6711711711711716e-06, "epoch": 0.03672515278677444, "percentage": 3.67, "elapsed_time": "0:29:27", "remaining_time": "12:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 4438, "loss": 0.2184, "learning_rate": 3.693693693693694e-06, "epoch": 0.03695046047258287, "percentage": 3.7, "elapsed_time": "0:29:37", "remaining_time": "12:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 4438, "loss": 0.2113, "learning_rate": 3.7162162162162162e-06, "epoch": 0.037175768158391305, "percentage": 3.72, "elapsed_time": "0:29:48", "remaining_time": "12:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 4438, "loss": 0.2177, "learning_rate": 3.7387387387387394e-06, "epoch": 0.03740107584419974, "percentage": 3.74, "elapsed_time": "0:29:59", "remaining_time": "12:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 4438, "loss": 0.2267, "learning_rate": 3.7612612612612612e-06, "epoch": 0.03762638353000817, "percentage": 3.76, "elapsed_time": "0:30:08", "remaining_time": "12:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 4438, "loss": 0.2262, "learning_rate": 3.7837837837837844e-06, "epoch": 0.0378516912158166, "percentage": 3.79, "elapsed_time": "0:30:18", "remaining_time": "12:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 4438, "loss": 0.2107, "learning_rate": 3.8063063063063067e-06, "epoch": 0.03807699890162503, "percentage": 3.81, "elapsed_time": "0:30:29", "remaining_time": "12:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 4438, "loss": 0.2257, "learning_rate": 3.828828828828829e-06, "epoch": 0.038302306587433464, "percentage": 3.83, "elapsed_time": "0:30:41", "remaining_time": "12:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 4438, "loss": 0.2192, "learning_rate": 3.851351351351352e-06, "epoch": 0.038527614273241896, "percentage": 3.85, "elapsed_time": "0:30:53", "remaining_time": "12:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 4438, "loss": 0.2241, "learning_rate": 3.8738738738738744e-06, "epoch": 0.03875292195905033, "percentage": 3.88, "elapsed_time": "0:31:03", "remaining_time": "12:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 4438, "loss": 0.2091, "learning_rate": 3.896396396396397e-06, "epoch": 0.03897822964485876, "percentage": 3.9, "elapsed_time": "0:31:15", "remaining_time": "12:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 4438, "loss": 0.2278, "learning_rate": 3.918918918918919e-06, "epoch": 0.03920353733066719, "percentage": 3.92, "elapsed_time": "0:31:25", "remaining_time": "12:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 4438, "loss": 0.2242, "learning_rate": 3.941441441441442e-06, "epoch": 0.039428845016475624, "percentage": 3.94, "elapsed_time": "0:31:35", "remaining_time": "12:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 4438, "loss": 0.2211, "learning_rate": 3.9639639639639645e-06, "epoch": 0.039654152702284055, "percentage": 3.97, "elapsed_time": "0:31:46", "remaining_time": "12:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 4438, "loss": 0.1984, "learning_rate": 3.986486486486487e-06, "epoch": 0.03987946038809249, "percentage": 3.99, "elapsed_time": "0:31:56", "remaining_time": "12:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 4438, "loss": 0.2247, "learning_rate": 4.009009009009009e-06, "epoch": 0.04010476807390092, "percentage": 4.01, "elapsed_time": "0:32:07", "remaining_time": "12:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 4438, "loss": 0.208, "learning_rate": 4.031531531531531e-06, "epoch": 0.04033007575970935, "percentage": 4.03, "elapsed_time": "0:32:17", "remaining_time": "12:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 4438, "loss": 0.2336, "learning_rate": 4.0540540540540545e-06, "epoch": 0.04055538344551778, "percentage": 4.06, "elapsed_time": "0:32:28", "remaining_time": "12:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 4438, "loss": 0.2315, "learning_rate": 4.076576576576577e-06, "epoch": 0.040780691131326215, "percentage": 4.08, "elapsed_time": "0:32:38", "remaining_time": "12:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 4438, "loss": 0.2012, "learning_rate": 4.099099099099099e-06, "epoch": 0.041005998817134647, "percentage": 4.1, "elapsed_time": "0:32:48", "remaining_time": "12:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 4438, "loss": 0.1914, "learning_rate": 4.121621621621622e-06, "epoch": 0.04123130650294308, "percentage": 4.12, "elapsed_time": "0:32:59", "remaining_time": "12:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 4438, "loss": 0.2021, "learning_rate": 4.1441441441441446e-06, "epoch": 0.04145661418875152, "percentage": 4.15, "elapsed_time": "0:33:09", "remaining_time": "12:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 4438, "loss": 0.2342, "learning_rate": 4.166666666666667e-06, "epoch": 0.04168192187455995, "percentage": 4.17, "elapsed_time": "0:33:21", "remaining_time": "12:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 4438, "loss": 0.2172, "learning_rate": 4.189189189189189e-06, "epoch": 0.04190722956036838, "percentage": 4.19, "elapsed_time": "0:33:31", "remaining_time": "12:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 4438, "loss": 0.2287, "learning_rate": 4.2117117117117115e-06, "epoch": 0.04213253724617681, "percentage": 4.21, "elapsed_time": "0:33:41", "remaining_time": "12:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 4438, "loss": 0.2049, "learning_rate": 4.234234234234235e-06, "epoch": 0.042357844931985245, "percentage": 4.24, "elapsed_time": "0:33:52", "remaining_time": "12:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 4438, "loss": 0.1962, "learning_rate": 4.256756756756757e-06, "epoch": 0.042583152617793676, "percentage": 4.26, "elapsed_time": "0:34:03", "remaining_time": "12:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 4438, "loss": 0.2069, "learning_rate": 4.27927927927928e-06, "epoch": 0.04280846030360211, "percentage": 4.28, "elapsed_time": "0:34:13", "remaining_time": "12:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 4438, "loss": 0.2166, "learning_rate": 4.301801801801802e-06, "epoch": 0.04303376798941054, "percentage": 4.3, "elapsed_time": "0:34:24", "remaining_time": "12:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 4438, "loss": 0.2157, "learning_rate": 4.324324324324325e-06, "epoch": 0.04325907567521897, "percentage": 4.33, "elapsed_time": "0:34:36", "remaining_time": "12:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 4438, "loss": 0.2107, "learning_rate": 4.346846846846847e-06, "epoch": 0.043484383361027404, "percentage": 4.35, "elapsed_time": "0:34:46", "remaining_time": "12:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 4438, "loss": 0.2309, "learning_rate": 4.369369369369369e-06, "epoch": 0.043709691046835836, "percentage": 4.37, "elapsed_time": "0:34:57", "remaining_time": "12:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 4438, "loss": 0.2071, "learning_rate": 4.391891891891892e-06, "epoch": 0.04393499873264427, "percentage": 4.39, "elapsed_time": "0:35:09", "remaining_time": "12:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 4438, "loss": 0.2107, "learning_rate": 4.414414414414415e-06, "epoch": 0.0441603064184527, "percentage": 4.42, "elapsed_time": "0:35:20", "remaining_time": "12:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 4438, "loss": 0.2136, "learning_rate": 4.436936936936938e-06, "epoch": 0.04438561410426113, "percentage": 4.44, "elapsed_time": "0:35:30", "remaining_time": "12:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 4438, "loss": 0.2073, "learning_rate": 4.45945945945946e-06, "epoch": 0.04461092179006956, "percentage": 4.46, "elapsed_time": "0:35:41", "remaining_time": "12:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 4438, "loss": 0.2297, "learning_rate": 4.4819819819819824e-06, "epoch": 0.044836229475877995, "percentage": 4.48, "elapsed_time": "0:35:51", "remaining_time": "12:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 4438, "loss": 0.2131, "learning_rate": 4.504504504504505e-06, "epoch": 0.04506153716168643, "percentage": 4.51, "elapsed_time": "0:36:02", "remaining_time": "12:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 4438, "loss": 0.2171, "learning_rate": 4.527027027027027e-06, "epoch": 0.04528684484749486, "percentage": 4.53, "elapsed_time": "0:36:13", "remaining_time": "12:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 4438, "loss": 0.2042, "learning_rate": 4.54954954954955e-06, "epoch": 0.04551215253330329, "percentage": 4.55, "elapsed_time": "0:36:24", "remaining_time": "12:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 4438, "loss": 0.225, "learning_rate": 4.5720720720720725e-06, "epoch": 0.04573746021911172, "percentage": 4.57, "elapsed_time": "0:36:32", "remaining_time": "12:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 4438, "loss": 0.2209, "learning_rate": 4.594594594594596e-06, "epoch": 0.045962767904920154, "percentage": 4.6, "elapsed_time": "0:36:44", "remaining_time": "12:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 4438, "loss": 0.2244, "learning_rate": 4.617117117117118e-06, "epoch": 0.046188075590728586, "percentage": 4.62, "elapsed_time": "0:36:55", "remaining_time": "12:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 4438, "loss": 0.2311, "learning_rate": 4.63963963963964e-06, "epoch": 0.04641338327653702, "percentage": 4.64, "elapsed_time": "0:37:07", "remaining_time": "12:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 4438, "loss": 0.2195, "learning_rate": 4.6621621621621625e-06, "epoch": 0.04663869096234545, "percentage": 4.66, "elapsed_time": "0:37:17", "remaining_time": "12:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 4438, "loss": 0.2195, "learning_rate": 4.684684684684685e-06, "epoch": 0.04686399864815388, "percentage": 4.69, "elapsed_time": "0:37:25", "remaining_time": "12:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 4438, "loss": 0.2116, "learning_rate": 4.707207207207208e-06, "epoch": 0.04708930633396232, "percentage": 4.71, "elapsed_time": "0:37:35", "remaining_time": "12:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 4438, "loss": 0.2207, "learning_rate": 4.72972972972973e-06, "epoch": 0.04731461401977075, "percentage": 4.73, "elapsed_time": "0:37:46", "remaining_time": "12:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 4438, "loss": 0.2016, "learning_rate": 4.7522522522522526e-06, "epoch": 0.047539921705579184, "percentage": 4.75, "elapsed_time": "0:37:56", "remaining_time": "12:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 4438, "loss": 0.2256, "learning_rate": 4.774774774774775e-06, "epoch": 0.047765229391387616, "percentage": 4.78, "elapsed_time": "0:38:07", "remaining_time": "12:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 4438, "loss": 0.1985, "learning_rate": 4.797297297297297e-06, "epoch": 0.04799053707719605, "percentage": 4.8, "elapsed_time": "0:38:17", "remaining_time": "12:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 4438, "loss": 0.2102, "learning_rate": 4.81981981981982e-06, "epoch": 0.04821584476300448, "percentage": 4.82, "elapsed_time": "0:38:27", "remaining_time": "12:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 4438, "loss": 0.2103, "learning_rate": 4.842342342342343e-06, "epoch": 0.04844115244881291, "percentage": 4.84, "elapsed_time": "0:38:39", "remaining_time": "12:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 4438, "loss": 0.2195, "learning_rate": 4.864864864864866e-06, "epoch": 0.048666460134621344, "percentage": 4.87, "elapsed_time": "0:38:49", "remaining_time": "12:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 4438, "loss": 0.2128, "learning_rate": 4.887387387387388e-06, "epoch": 0.048891767820429775, "percentage": 4.89, "elapsed_time": "0:38:58", "remaining_time": "12:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 4438, "loss": 0.2218, "learning_rate": 4.90990990990991e-06, "epoch": 0.04911707550623821, "percentage": 4.91, "elapsed_time": "0:39:10", "remaining_time": "12:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 4438, "loss": 0.2203, "learning_rate": 4.932432432432433e-06, "epoch": 0.04934238319204664, "percentage": 4.93, "elapsed_time": "0:39:20", "remaining_time": "12:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 4438, "loss": 0.2349, "learning_rate": 4.954954954954955e-06, "epoch": 0.04956769087785507, "percentage": 4.96, "elapsed_time": "0:39:31", "remaining_time": "12:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 4438, "loss": 0.2192, "learning_rate": 4.977477477477478e-06, "epoch": 0.0497929985636635, "percentage": 4.98, "elapsed_time": "0:39:41", "remaining_time": "12:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 4438, "loss": 0.2171, "learning_rate": 5e-06, "epoch": 0.050018306249471935, "percentage": 5.0, "elapsed_time": "0:39:51", "remaining_time": "12:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 4438, "loss": 0.2155, "learning_rate": 4.999999305921593e-06, "epoch": 0.050243613935280367, "percentage": 5.02, "elapsed_time": "0:40:01", "remaining_time": "12:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 4438, "loss": 0.2063, "learning_rate": 4.999997223686756e-06, "epoch": 0.0504689216210888, "percentage": 5.05, "elapsed_time": "0:40:13", "remaining_time": "12:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 4438, "loss": 0.2372, "learning_rate": 4.9999937532966454e-06, "epoch": 0.05069422930689723, "percentage": 5.07, "elapsed_time": "0:40:23", "remaining_time": "12:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 4438, "loss": 0.1952, "learning_rate": 4.999988894753189e-06, "epoch": 0.05091953699270566, "percentage": 5.09, "elapsed_time": "0:40:34", "remaining_time": "12:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 4438, "loss": 0.2424, "learning_rate": 4.999982648059082e-06, "epoch": 0.051144844678514094, "percentage": 5.11, "elapsed_time": "0:40:46", "remaining_time": "12:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 4438, "loss": 0.2282, "learning_rate": 4.999975013217796e-06, "epoch": 0.051370152364322526, "percentage": 5.14, "elapsed_time": "0:40:58", "remaining_time": "12:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 4438, "loss": 0.2295, "learning_rate": 4.99996599023357e-06, "epoch": 0.05159546005013096, "percentage": 5.16, "elapsed_time": "0:41:08", "remaining_time": "12:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 4438, "loss": 0.2158, "learning_rate": 4.999955579111413e-06, "epoch": 0.05182076773593939, "percentage": 5.18, "elapsed_time": "0:41:18", "remaining_time": "12:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 4438, "loss": 0.1972, "learning_rate": 4.999943779857106e-06, "epoch": 0.05204607542174782, "percentage": 5.21, "elapsed_time": "0:41:27", "remaining_time": "12:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 4438, "loss": 0.2258, "learning_rate": 4.9999305924772e-06, "epoch": 0.05227138310755625, "percentage": 5.23, "elapsed_time": "0:41:38", "remaining_time": "12:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 4438, "loss": 0.2117, "learning_rate": 4.999916016979019e-06, "epoch": 0.05249669079336469, "percentage": 5.25, "elapsed_time": "0:41:49", "remaining_time": "12:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 4438, "loss": 0.2302, "learning_rate": 4.999900053370657e-06, "epoch": 0.052721998479173124, "percentage": 5.27, "elapsed_time": "0:42:00", "remaining_time": "12:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 4438, "loss": 0.2168, "learning_rate": 4.999882701660975e-06, "epoch": 0.052947306164981556, "percentage": 5.3, "elapsed_time": "0:42:10", "remaining_time": "12:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 4438, "loss": 0.2027, "learning_rate": 4.99986396185961e-06, "epoch": 0.05317261385078999, "percentage": 5.32, "elapsed_time": "0:42:21", "remaining_time": "12:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 4438, "loss": 0.225, "learning_rate": 4.999843833976967e-06, "epoch": 0.05339792153659842, "percentage": 5.34, "elapsed_time": "0:42:33", "remaining_time": "12:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 4438, "loss": 0.1954, "learning_rate": 4.999822318024222e-06, "epoch": 0.05362322922240685, "percentage": 5.36, "elapsed_time": "0:42:43", "remaining_time": "12:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 4438, "loss": 0.23, "learning_rate": 4.999799414013322e-06, "epoch": 0.05384853690821528, "percentage": 5.39, "elapsed_time": "0:42:54", "remaining_time": "12:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 4438, "loss": 0.2008, "learning_rate": 4.9997751219569844e-06, "epoch": 0.054073844594023715, "percentage": 5.41, "elapsed_time": "0:43:05", "remaining_time": "12:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 4438, "loss": 0.1929, "learning_rate": 4.999749441868699e-06, "epoch": 0.05429915227983215, "percentage": 5.43, "elapsed_time": "0:43:15", "remaining_time": "12:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 4438, "loss": 0.1968, "learning_rate": 4.999722373762725e-06, "epoch": 0.05452445996564058, "percentage": 5.45, "elapsed_time": "0:43:25", "remaining_time": "12:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 4438, "loss": 0.2159, "learning_rate": 4.9996939176540895e-06, "epoch": 0.05474976765144901, "percentage": 5.48, "elapsed_time": "0:43:36", "remaining_time": "12:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 4438, "loss": 0.2205, "learning_rate": 4.999664073558596e-06, "epoch": 0.05497507533725744, "percentage": 5.5, "elapsed_time": "0:43:47", "remaining_time": "12:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 4438, "loss": 0.2246, "learning_rate": 4.999632841492815e-06, "epoch": 0.055200383023065874, "percentage": 5.52, "elapsed_time": "0:43:59", "remaining_time": "12:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 4438, "loss": 0.2041, "learning_rate": 4.999600221474089e-06, "epoch": 0.055425690708874306, "percentage": 5.54, "elapsed_time": "0:44:09", "remaining_time": "12:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 4438, "loss": 0.1938, "learning_rate": 4.999566213520529e-06, "epoch": 0.05565099839468274, "percentage": 5.57, "elapsed_time": "0:44:20", "remaining_time": "12:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 4438, "loss": 0.2085, "learning_rate": 4.99953081765102e-06, "epoch": 0.05587630608049117, "percentage": 5.59, "elapsed_time": "0:44:31", "remaining_time": "12:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 4438, "loss": 0.1985, "learning_rate": 4.999494033885215e-06, "epoch": 0.0561016137662996, "percentage": 5.61, "elapsed_time": "0:44:41", "remaining_time": "12:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 4438, "loss": 0.2268, "learning_rate": 4.999455862243539e-06, "epoch": 0.056326921452108034, "percentage": 5.63, "elapsed_time": "0:44:52", "remaining_time": "12:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 4438, "loss": 0.2207, "learning_rate": 4.999416302747189e-06, "epoch": 0.056552229137916465, "percentage": 5.66, "elapsed_time": "0:45:02", "remaining_time": "12:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 4438, "loss": 0.2274, "learning_rate": 4.999375355418128e-06, "epoch": 0.0567775368237249, "percentage": 5.68, "elapsed_time": "0:45:14", "remaining_time": "12:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.999333020279094e-06, "epoch": 0.05700284450953333, "percentage": 5.7, "elapsed_time": "0:45:25", "remaining_time": "12:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 4438, "loss": 0.2138, "learning_rate": 4.999289297353593e-06, "epoch": 0.05722815219534176, "percentage": 5.72, "elapsed_time": "0:45:36", "remaining_time": "12:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 4438, "loss": 0.2155, "learning_rate": 4.9992441866659054e-06, "epoch": 0.05745345988115019, "percentage": 5.75, "elapsed_time": "0:45:47", "remaining_time": "12:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 4438, "loss": 0.1914, "learning_rate": 4.999197688241076e-06, "epoch": 0.057678767566958625, "percentage": 5.77, "elapsed_time": "0:45:59", "remaining_time": "12:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 4438, "loss": 0.2021, "learning_rate": 4.999149802104926e-06, "epoch": 0.05790407525276706, "percentage": 5.79, "elapsed_time": "0:46:11", "remaining_time": "12:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 4438, "loss": 0.2126, "learning_rate": 4.999100528284045e-06, "epoch": 0.058129382938575495, "percentage": 5.81, "elapsed_time": "0:46:20", "remaining_time": "12:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 4438, "loss": 0.2205, "learning_rate": 4.999049866805793e-06, "epoch": 0.05835469062438393, "percentage": 5.84, "elapsed_time": "0:46:32", "remaining_time": "12:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 4438, "loss": 0.1998, "learning_rate": 4.998997817698298e-06, "epoch": 0.05857999831019236, "percentage": 5.86, "elapsed_time": "0:46:41", "remaining_time": "12:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 4438, "loss": 0.231, "learning_rate": 4.998944380990462e-06, "epoch": 0.05880530599600079, "percentage": 5.88, "elapsed_time": "0:46:53", "remaining_time": "12:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 4438, "loss": 0.2193, "learning_rate": 4.998889556711958e-06, "epoch": 0.05903061368180922, "percentage": 5.9, "elapsed_time": "0:47:02", "remaining_time": "12:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 4438, "loss": 0.1997, "learning_rate": 4.998833344893226e-06, "epoch": 0.059255921367617655, "percentage": 5.93, "elapsed_time": "0:47:13", "remaining_time": "12:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 4438, "loss": 0.2246, "learning_rate": 4.998775745565479e-06, "epoch": 0.059481229053426087, "percentage": 5.95, "elapsed_time": "0:47:24", "remaining_time": "12:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 4438, "loss": 0.2254, "learning_rate": 4.998716758760701e-06, "epoch": 0.05970653673923452, "percentage": 5.97, "elapsed_time": "0:47:34", "remaining_time": "12:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 4438, "loss": 0.2118, "learning_rate": 4.998656384511643e-06, "epoch": 0.05993184442504295, "percentage": 5.99, "elapsed_time": "0:47:46", "remaining_time": "12:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 4438, "loss": 0.1759, "learning_rate": 4.998594622851829e-06, "epoch": 0.06015715211085138, "percentage": 6.02, "elapsed_time": "0:47:58", "remaining_time": "12:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 4438, "loss": 0.2228, "learning_rate": 4.9985314738155545e-06, "epoch": 0.060382459796659814, "percentage": 6.04, "elapsed_time": "0:48:08", "remaining_time": "12:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 4438, "loss": 0.1966, "learning_rate": 4.9984669374378825e-06, "epoch": 0.060607767482468246, "percentage": 6.06, "elapsed_time": "0:48:19", "remaining_time": "12:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 4438, "loss": 0.242, "learning_rate": 4.9984010137546475e-06, "epoch": 0.06083307516827668, "percentage": 6.08, "elapsed_time": "0:48:30", "remaining_time": "12:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 4438, "loss": 0.2154, "learning_rate": 4.998333702802457e-06, "epoch": 0.06105838285408511, "percentage": 6.11, "elapsed_time": "0:48:40", "remaining_time": "12:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 4438, "loss": 0.2202, "learning_rate": 4.998265004618682e-06, "epoch": 0.06128369053989354, "percentage": 6.13, "elapsed_time": "0:48:50", "remaining_time": "12:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 4438, "loss": 0.2095, "learning_rate": 4.998194919241471e-06, "epoch": 0.06150899822570197, "percentage": 6.15, "elapsed_time": "0:49:00", "remaining_time": "12:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 4438, "loss": 0.2162, "learning_rate": 4.998123446709739e-06, "epoch": 0.061734305911510405, "percentage": 6.17, "elapsed_time": "0:49:11", "remaining_time": "12:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 4438, "loss": 0.204, "learning_rate": 4.998050587063173e-06, "epoch": 0.06195961359731884, "percentage": 6.2, "elapsed_time": "0:49:22", "remaining_time": "12:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 4438, "loss": 0.2058, "learning_rate": 4.997976340342226e-06, "epoch": 0.06218492128312727, "percentage": 6.22, "elapsed_time": "0:49:33", "remaining_time": "12:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 4438, "loss": 0.2178, "learning_rate": 4.997900706588129e-06, "epoch": 0.0624102289689357, "percentage": 6.24, "elapsed_time": "0:49:45", "remaining_time": "12:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 4438, "loss": 0.2161, "learning_rate": 4.997823685842875e-06, "epoch": 0.06263553665474414, "percentage": 6.26, "elapsed_time": "0:49:54", "remaining_time": "12:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 4438, "loss": 0.1939, "learning_rate": 4.997745278149233e-06, "epoch": 0.06286084434055257, "percentage": 6.29, "elapsed_time": "0:50:04", "remaining_time": "12:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.997665483550739e-06, "epoch": 0.063086152026361, "percentage": 6.31, "elapsed_time": "0:50:13", "remaining_time": "12:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 4438, "loss": 0.2242, "learning_rate": 4.997584302091699e-06, "epoch": 0.06331145971216944, "percentage": 6.33, "elapsed_time": "0:50:25", "remaining_time": "12:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 4438, "loss": 0.2164, "learning_rate": 4.997501733817191e-06, "epoch": 0.06353676739797787, "percentage": 6.35, "elapsed_time": "0:50:36", "remaining_time": "12:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 4438, "loss": 0.188, "learning_rate": 4.997417778773064e-06, "epoch": 0.0637620750837863, "percentage": 6.38, "elapsed_time": "0:50:45", "remaining_time": "12:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 4438, "loss": 0.2444, "learning_rate": 4.997332437005932e-06, "epoch": 0.06398738276959473, "percentage": 6.4, "elapsed_time": "0:50:56", "remaining_time": "12:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 4438, "loss": 0.2086, "learning_rate": 4.9972457085631825e-06, "epoch": 0.06421269045540316, "percentage": 6.42, "elapsed_time": "0:51:06", "remaining_time": "12:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 4438, "loss": 0.1838, "learning_rate": 4.997157593492974e-06, "epoch": 0.0644379981412116, "percentage": 6.44, "elapsed_time": "0:51:16", "remaining_time": "12:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 4438, "loss": 0.215, "learning_rate": 4.997068091844233e-06, "epoch": 0.06466330582702003, "percentage": 6.47, "elapsed_time": "0:51:28", "remaining_time": "12:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 4438, "loss": 0.2026, "learning_rate": 4.996977203666657e-06, "epoch": 0.06488861351282846, "percentage": 6.49, "elapsed_time": "0:51:38", "remaining_time": "12:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 4438, "loss": 0.2053, "learning_rate": 4.99688492901071e-06, "epoch": 0.06511392119863689, "percentage": 6.51, "elapsed_time": "0:51:49", "remaining_time": "12:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 4438, "loss": 0.2074, "learning_rate": 4.996791267927632e-06, "epoch": 0.06533922888444532, "percentage": 6.53, "elapsed_time": "0:52:01", "remaining_time": "12:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 4438, "loss": 0.203, "learning_rate": 4.996696220469429e-06, "epoch": 0.06556453657025375, "percentage": 6.56, "elapsed_time": "0:52:11", "remaining_time": "12:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 4438, "loss": 0.2236, "learning_rate": 4.996599786688876e-06, "epoch": 0.06578984425606219, "percentage": 6.58, "elapsed_time": "0:52:21", "remaining_time": "12:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 4438, "loss": 0.2184, "learning_rate": 4.996501966639519e-06, "epoch": 0.06601515194187062, "percentage": 6.6, "elapsed_time": "0:52:30", "remaining_time": "12:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 4438, "loss": 0.2402, "learning_rate": 4.996402760375676e-06, "epoch": 0.06624045962767905, "percentage": 6.62, "elapsed_time": "0:52:42", "remaining_time": "12:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 4438, "loss": 0.2218, "learning_rate": 4.99630216795243e-06, "epoch": 0.06646576731348748, "percentage": 6.65, "elapsed_time": "0:52:53", "remaining_time": "12:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 4438, "loss": 0.2086, "learning_rate": 4.996200189425638e-06, "epoch": 0.06669107499929591, "percentage": 6.67, "elapsed_time": "0:53:04", "remaining_time": "12:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 4438, "loss": 0.2232, "learning_rate": 4.996096824851923e-06, "epoch": 0.06691638268510434, "percentage": 6.69, "elapsed_time": "0:53:16", "remaining_time": "12:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 4438, "loss": 0.2109, "learning_rate": 4.9959920742886815e-06, "epoch": 0.06714169037091278, "percentage": 6.71, "elapsed_time": "0:53:28", "remaining_time": "12:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 4438, "loss": 0.2057, "learning_rate": 4.9958859377940765e-06, "epoch": 0.06736699805672121, "percentage": 6.74, "elapsed_time": "0:53:39", "remaining_time": "12:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 4438, "loss": 0.2127, "learning_rate": 4.995778415427042e-06, "epoch": 0.06759230574252964, "percentage": 6.76, "elapsed_time": "0:53:49", "remaining_time": "12:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 4438, "loss": 0.2286, "learning_rate": 4.99566950724728e-06, "epoch": 0.06781761342833807, "percentage": 6.78, "elapsed_time": "0:54:00", "remaining_time": "12:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 4438, "loss": 0.2263, "learning_rate": 4.995559213315267e-06, "epoch": 0.0680429211141465, "percentage": 6.8, "elapsed_time": "0:54:10", "remaining_time": "12:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 4438, "loss": 0.2054, "learning_rate": 4.995447533692239e-06, "epoch": 0.06826822879995494, "percentage": 6.83, "elapsed_time": "0:54:21", "remaining_time": "12:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 4438, "loss": 0.202, "learning_rate": 4.995334468440213e-06, "epoch": 0.06849353648576337, "percentage": 6.85, "elapsed_time": "0:54:30", "remaining_time": "12:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.995220017621967e-06, "epoch": 0.0687188441715718, "percentage": 6.87, "elapsed_time": "0:54:41", "remaining_time": "12:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 4438, "loss": 0.2064, "learning_rate": 4.995104181301052e-06, "epoch": 0.06894415185738023, "percentage": 6.89, "elapsed_time": "0:54:51", "remaining_time": "12:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 4438, "loss": 0.216, "learning_rate": 4.994986959541788e-06, "epoch": 0.06916945954318866, "percentage": 6.92, "elapsed_time": "0:55:01", "remaining_time": "12:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 4438, "loss": 0.2021, "learning_rate": 4.994868352409263e-06, "epoch": 0.0693947672289971, "percentage": 6.94, "elapsed_time": "0:55:11", "remaining_time": "12:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 4438, "loss": 0.2059, "learning_rate": 4.994748359969336e-06, "epoch": 0.06962007491480553, "percentage": 6.96, "elapsed_time": "0:55:22", "remaining_time": "12:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 4438, "loss": 0.2114, "learning_rate": 4.9946269822886335e-06, "epoch": 0.06984538260061396, "percentage": 6.99, "elapsed_time": "0:55:33", "remaining_time": "12:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 4438, "loss": 0.2186, "learning_rate": 4.994504219434553e-06, "epoch": 0.07007069028642239, "percentage": 7.01, "elapsed_time": "0:55:45", "remaining_time": "12:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 4438, "loss": 0.2199, "learning_rate": 4.9943800714752586e-06, "epoch": 0.07029599797223082, "percentage": 7.03, "elapsed_time": "0:55:56", "remaining_time": "12:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 4438, "loss": 0.2077, "learning_rate": 4.994254538479687e-06, "epoch": 0.07052130565803925, "percentage": 7.05, "elapsed_time": "0:56:08", "remaining_time": "12:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 4438, "loss": 0.2109, "learning_rate": 4.9941276205175405e-06, "epoch": 0.07074661334384769, "percentage": 7.08, "elapsed_time": "0:56:19", "remaining_time": "12:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 4438, "loss": 0.209, "learning_rate": 4.993999317659293e-06, "epoch": 0.07097192102965612, "percentage": 7.1, "elapsed_time": "0:56:30", "remaining_time": "12:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 4438, "loss": 0.1924, "learning_rate": 4.9938696299761856e-06, "epoch": 0.07119722871546455, "percentage": 7.12, "elapsed_time": "0:56:41", "remaining_time": "12:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 4438, "loss": 0.2377, "learning_rate": 4.9937385575402284e-06, "epoch": 0.07142253640127298, "percentage": 7.14, "elapsed_time": "0:56:52", "remaining_time": "12:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 4438, "loss": 0.201, "learning_rate": 4.993606100424202e-06, "epoch": 0.07164784408708141, "percentage": 7.17, "elapsed_time": "0:57:03", "remaining_time": "12:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 4438, "loss": 0.2078, "learning_rate": 4.9934722587016555e-06, "epoch": 0.07187315177288986, "percentage": 7.19, "elapsed_time": "0:57:13", "remaining_time": "12:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 4438, "loss": 0.2167, "learning_rate": 4.9933370324469045e-06, "epoch": 0.07209845945869829, "percentage": 7.21, "elapsed_time": "0:57:23", "remaining_time": "12:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 4438, "loss": 0.2149, "learning_rate": 4.993200421735037e-06, "epoch": 0.07232376714450672, "percentage": 7.23, "elapsed_time": "0:57:33", "remaining_time": "12:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 4438, "loss": 0.2037, "learning_rate": 4.993062426641906e-06, "epoch": 0.07254907483031516, "percentage": 7.26, "elapsed_time": "0:57:44", "remaining_time": "12:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 4438, "loss": 0.2236, "learning_rate": 4.992923047244136e-06, "epoch": 0.07277438251612359, "percentage": 7.28, "elapsed_time": "0:57:55", "remaining_time": "12:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 4438, "loss": 0.2259, "learning_rate": 4.9927822836191185e-06, "epoch": 0.07299969020193202, "percentage": 7.3, "elapsed_time": "0:58:07", "remaining_time": "12:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 4438, "loss": 0.2147, "learning_rate": 4.992640135845016e-06, "epoch": 0.07322499788774045, "percentage": 7.32, "elapsed_time": "0:58:17", "remaining_time": "12:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.992496604000756e-06, "epoch": 0.07345030557354888, "percentage": 7.35, "elapsed_time": "0:58:28", "remaining_time": "12:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 4438, "loss": 0.2026, "learning_rate": 4.992351688166038e-06, "epoch": 0.07367561325935731, "percentage": 7.37, "elapsed_time": "0:58:38", "remaining_time": "12:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 4438, "loss": 0.2202, "learning_rate": 4.992205388421326e-06, "epoch": 0.07390092094516575, "percentage": 7.39, "elapsed_time": "0:58:50", "remaining_time": "12:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 4438, "loss": 0.2113, "learning_rate": 4.992057704847858e-06, "epoch": 0.07412622863097418, "percentage": 7.41, "elapsed_time": "0:59:01", "remaining_time": "12:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 4438, "loss": 0.2078, "learning_rate": 4.991908637527634e-06, "epoch": 0.07435153631678261, "percentage": 7.44, "elapsed_time": "0:59:11", "remaining_time": "12:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 4438, "loss": 0.1949, "learning_rate": 4.9917581865434275e-06, "epoch": 0.07457684400259104, "percentage": 7.46, "elapsed_time": "0:59:22", "remaining_time": "12:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 4438, "loss": 0.2032, "learning_rate": 4.9916063519787775e-06, "epoch": 0.07480215168839947, "percentage": 7.48, "elapsed_time": "0:59:31", "remaining_time": "12:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 4438, "loss": 0.2181, "learning_rate": 4.991453133917993e-06, "epoch": 0.0750274593742079, "percentage": 7.5, "elapsed_time": "0:59:43", "remaining_time": "12:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 4438, "loss": 0.2135, "learning_rate": 4.991298532446149e-06, "epoch": 0.07525276706001634, "percentage": 7.53, "elapsed_time": "0:59:53", "remaining_time": "12:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 4438, "loss": 0.2018, "learning_rate": 4.991142547649091e-06, "epoch": 0.07547807474582477, "percentage": 7.55, "elapsed_time": "1:00:04", "remaining_time": "12:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 4438, "loss": 0.2003, "learning_rate": 4.990985179613431e-06, "epoch": 0.0757033824316332, "percentage": 7.57, "elapsed_time": "1:00:16", "remaining_time": "12:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 4438, "loss": 0.2076, "learning_rate": 4.990826428426549e-06, "epoch": 0.07592869011744163, "percentage": 7.59, "elapsed_time": "1:00:28", "remaining_time": "12:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 4438, "loss": 0.2042, "learning_rate": 4.990666294176596e-06, "epoch": 0.07615399780325006, "percentage": 7.62, "elapsed_time": "1:00:38", "remaining_time": "12:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 4438, "loss": 0.2275, "learning_rate": 4.9905047769524855e-06, "epoch": 0.0763793054890585, "percentage": 7.64, "elapsed_time": "1:00:49", "remaining_time": "12:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 4438, "loss": 0.2019, "learning_rate": 4.990341876843904e-06, "epoch": 0.07660461317486693, "percentage": 7.66, "elapsed_time": "1:00:59", "remaining_time": "12:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 4438, "loss": 0.2152, "learning_rate": 4.990177593941303e-06, "epoch": 0.07682992086067536, "percentage": 7.68, "elapsed_time": "1:01:09", "remaining_time": "12:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 4438, "loss": 0.2014, "learning_rate": 4.9900119283359025e-06, "epoch": 0.07705522854648379, "percentage": 7.71, "elapsed_time": "1:01:19", "remaining_time": "12:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 4438, "loss": 0.1884, "learning_rate": 4.989844880119692e-06, "epoch": 0.07728053623229222, "percentage": 7.73, "elapsed_time": "1:01:29", "remaining_time": "12:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 4438, "loss": 0.2047, "learning_rate": 4.989676449385426e-06, "epoch": 0.07750584391810066, "percentage": 7.75, "elapsed_time": "1:01:40", "remaining_time": "12:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 4438, "loss": 0.2022, "learning_rate": 4.989506636226626e-06, "epoch": 0.07773115160390909, "percentage": 7.77, "elapsed_time": "1:01:52", "remaining_time": "12:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 4438, "loss": 0.1943, "learning_rate": 4.989335440737587e-06, "epoch": 0.07795645928971752, "percentage": 7.8, "elapsed_time": "1:02:03", "remaining_time": "12:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 4438, "loss": 0.1967, "learning_rate": 4.989162863013364e-06, "epoch": 0.07818176697552595, "percentage": 7.82, "elapsed_time": "1:02:13", "remaining_time": "12:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 4438, "loss": 0.1941, "learning_rate": 4.988988903149784e-06, "epoch": 0.07840707466133438, "percentage": 7.84, "elapsed_time": "1:02:24", "remaining_time": "12:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 4438, "loss": 0.2051, "learning_rate": 4.9888135612434415e-06, "epoch": 0.07863238234714282, "percentage": 7.86, "elapsed_time": "1:02:35", "remaining_time": "12:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 4438, "loss": 0.1954, "learning_rate": 4.988636837391696e-06, "epoch": 0.07885769003295125, "percentage": 7.89, "elapsed_time": "1:02:45", "remaining_time": "12:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 4438, "loss": 0.2147, "learning_rate": 4.9884587316926765e-06, "epoch": 0.07908299771875968, "percentage": 7.91, "elapsed_time": "1:02:56", "remaining_time": "12:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 4438, "loss": 0.2091, "learning_rate": 4.988279244245278e-06, "epoch": 0.07930830540456811, "percentage": 7.93, "elapsed_time": "1:03:07", "remaining_time": "12:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 4438, "loss": 0.205, "learning_rate": 4.988098375149163e-06, "epoch": 0.07953361309037654, "percentage": 7.95, "elapsed_time": "1:03:18", "remaining_time": "12:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 4438, "loss": 0.2058, "learning_rate": 4.987916124504761e-06, "epoch": 0.07975892077618497, "percentage": 7.98, "elapsed_time": "1:03:30", "remaining_time": "12:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 4438, "loss": 0.1886, "learning_rate": 4.987732492413271e-06, "epoch": 0.0799842284619934, "percentage": 8.0, "elapsed_time": "1:03:40", "remaining_time": "12:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 4438, "loss": 0.1956, "learning_rate": 4.987547478976655e-06, "epoch": 0.08020953614780184, "percentage": 8.02, "elapsed_time": "1:03:51", "remaining_time": "12:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 4438, "loss": 0.2016, "learning_rate": 4.987361084297645e-06, "epoch": 0.08043484383361027, "percentage": 8.04, "elapsed_time": "1:04:01", "remaining_time": "12:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 4438, "loss": 0.1998, "learning_rate": 4.987173308479738e-06, "epoch": 0.0806601515194187, "percentage": 8.07, "elapsed_time": "1:04:11", "remaining_time": "12:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 4438, "loss": 0.1963, "learning_rate": 4.9869841516272004e-06, "epoch": 0.08088545920522713, "percentage": 8.09, "elapsed_time": "1:04:22", "remaining_time": "12:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 4438, "loss": 0.1934, "learning_rate": 4.9867936138450635e-06, "epoch": 0.08111076689103557, "percentage": 8.11, "elapsed_time": "1:04:35", "remaining_time": "12:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 4438, "loss": 0.2112, "learning_rate": 4.986601695239125e-06, "epoch": 0.081336074576844, "percentage": 8.13, "elapsed_time": "1:04:46", "remaining_time": "12:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 4438, "loss": 0.2008, "learning_rate": 4.98640839591595e-06, "epoch": 0.08156138226265243, "percentage": 8.16, "elapsed_time": "1:04:57", "remaining_time": "12:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 4438, "loss": 0.206, "learning_rate": 4.986213715982873e-06, "epoch": 0.08178668994846086, "percentage": 8.18, "elapsed_time": "1:05:08", "remaining_time": "12:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 4438, "loss": 0.2092, "learning_rate": 4.986017655547989e-06, "epoch": 0.08201199763426929, "percentage": 8.2, "elapsed_time": "1:05:18", "remaining_time": "12:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 4438, "loss": 0.1982, "learning_rate": 4.985820214720165e-06, "epoch": 0.08223730532007772, "percentage": 8.22, "elapsed_time": "1:05:29", "remaining_time": "12:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 4438, "loss": 0.2214, "learning_rate": 4.985621393609032e-06, "epoch": 0.08246261300588616, "percentage": 8.25, "elapsed_time": "1:05:40", "remaining_time": "12:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 4438, "loss": 0.1944, "learning_rate": 4.98542119232499e-06, "epoch": 0.08268792069169459, "percentage": 8.27, "elapsed_time": "1:05:50", "remaining_time": "12:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 4438, "loss": 0.1866, "learning_rate": 4.9852196109792e-06, "epoch": 0.08291322837750303, "percentage": 8.29, "elapsed_time": "1:06:01", "remaining_time": "12:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 4438, "loss": 0.2093, "learning_rate": 4.985016649683594e-06, "epoch": 0.08313853606331147, "percentage": 8.31, "elapsed_time": "1:06:12", "remaining_time": "12:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 4438, "loss": 0.2136, "learning_rate": 4.984812308550869e-06, "epoch": 0.0833638437491199, "percentage": 8.34, "elapsed_time": "1:06:22", "remaining_time": "12:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 4438, "loss": 0.1969, "learning_rate": 4.984606587694488e-06, "epoch": 0.08358915143492833, "percentage": 8.36, "elapsed_time": "1:06:33", "remaining_time": "12:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 4438, "loss": 0.2101, "learning_rate": 4.98439948722868e-06, "epoch": 0.08381445912073676, "percentage": 8.38, "elapsed_time": "1:06:44", "remaining_time": "12:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 4438, "loss": 0.2128, "learning_rate": 4.9841910072684406e-06, "epoch": 0.0840397668065452, "percentage": 8.4, "elapsed_time": "1:06:53", "remaining_time": "12:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 4438, "loss": 0.2073, "learning_rate": 4.98398114792953e-06, "epoch": 0.08426507449235363, "percentage": 8.43, "elapsed_time": "1:07:03", "remaining_time": "12:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 4438, "loss": 0.1991, "learning_rate": 4.9837699093284765e-06, "epoch": 0.08449038217816206, "percentage": 8.45, "elapsed_time": "1:07:14", "remaining_time": "12:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 4438, "loss": 0.2097, "learning_rate": 4.983557291582572e-06, "epoch": 0.08471568986397049, "percentage": 8.47, "elapsed_time": "1:07:24", "remaining_time": "12:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.983343294809875e-06, "epoch": 0.08494099754977892, "percentage": 8.49, "elapsed_time": "1:07:35", "remaining_time": "12:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 4438, "loss": 0.1994, "learning_rate": 4.9831279191292114e-06, "epoch": 0.08516630523558735, "percentage": 8.52, "elapsed_time": "1:07:46", "remaining_time": "12:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.98291116466017e-06, "epoch": 0.08539161292139578, "percentage": 8.54, "elapsed_time": "1:07:57", "remaining_time": "12:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 4438, "loss": 0.1883, "learning_rate": 4.982693031523107e-06, "epoch": 0.08561692060720422, "percentage": 8.56, "elapsed_time": "1:08:07", "remaining_time": "12:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 4438, "loss": 0.2008, "learning_rate": 4.982473519839144e-06, "epoch": 0.08584222829301265, "percentage": 8.58, "elapsed_time": "1:08:16", "remaining_time": "12:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 4438, "loss": 0.2077, "learning_rate": 4.982252629730167e-06, "epoch": 0.08606753597882108, "percentage": 8.61, "elapsed_time": "1:08:26", "remaining_time": "12:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 4438, "loss": 0.1992, "learning_rate": 4.982030361318827e-06, "epoch": 0.08629284366462951, "percentage": 8.63, "elapsed_time": "1:08:38", "remaining_time": "12:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 4438, "loss": 0.1944, "learning_rate": 4.981806714728543e-06, "epoch": 0.08651815135043794, "percentage": 8.65, "elapsed_time": "1:08:49", "remaining_time": "12:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 4438, "loss": 0.1787, "learning_rate": 4.981581690083498e-06, "epoch": 0.08674345903624638, "percentage": 8.68, "elapsed_time": "1:08:59", "remaining_time": "12:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 4438, "loss": 0.1838, "learning_rate": 4.981355287508638e-06, "epoch": 0.08696876672205481, "percentage": 8.7, "elapsed_time": "1:09:11", "remaining_time": "12:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 4438, "loss": 0.1994, "learning_rate": 4.981127507129677e-06, "epoch": 0.08719407440786324, "percentage": 8.72, "elapsed_time": "1:09:21", "remaining_time": "12:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 4438, "loss": 0.2082, "learning_rate": 4.980898349073094e-06, "epoch": 0.08741938209367167, "percentage": 8.74, "elapsed_time": "1:09:33", "remaining_time": "12:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 4438, "loss": 0.1975, "learning_rate": 4.9806678134661295e-06, "epoch": 0.0876446897794801, "percentage": 8.77, "elapsed_time": "1:09:45", "remaining_time": "12:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 4438, "loss": 0.1968, "learning_rate": 4.980435900436793e-06, "epoch": 0.08786999746528854, "percentage": 8.79, "elapsed_time": "1:09:56", "remaining_time": "12:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.980202610113857e-06, "epoch": 0.08809530515109697, "percentage": 8.81, "elapsed_time": "1:10:06", "remaining_time": "12:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 4438, "loss": 0.2237, "learning_rate": 4.9799679426268575e-06, "epoch": 0.0883206128369054, "percentage": 8.83, "elapsed_time": "1:10:17", "remaining_time": "12:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 4438, "loss": 0.2089, "learning_rate": 4.9797318981061e-06, "epoch": 0.08854592052271383, "percentage": 8.86, "elapsed_time": "1:10:28", "remaining_time": "12:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 4438, "loss": 0.2068, "learning_rate": 4.979494476682647e-06, "epoch": 0.08877122820852226, "percentage": 8.88, "elapsed_time": "1:10:39", "remaining_time": "12:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 4438, "loss": 0.1922, "learning_rate": 4.979255678488332e-06, "epoch": 0.0889965358943307, "percentage": 8.9, "elapsed_time": "1:10:49", "remaining_time": "12:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 4438, "loss": 0.2069, "learning_rate": 4.979015503655751e-06, "epoch": 0.08922184358013913, "percentage": 8.92, "elapsed_time": "1:11:02", "remaining_time": "12:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 4438, "loss": 0.2085, "learning_rate": 4.978773952318263e-06, "epoch": 0.08944715126594756, "percentage": 8.95, "elapsed_time": "1:11:13", "remaining_time": "12:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 4438, "loss": 0.2075, "learning_rate": 4.978531024609994e-06, "epoch": 0.08967245895175599, "percentage": 8.97, "elapsed_time": "1:11:23", "remaining_time": "12:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 4438, "loss": 0.2072, "learning_rate": 4.978286720665832e-06, "epoch": 0.08989776663756442, "percentage": 8.99, "elapsed_time": "1:11:33", "remaining_time": "12:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 4438, "loss": 0.1986, "learning_rate": 4.978041040621428e-06, "epoch": 0.09012307432337285, "percentage": 9.01, "elapsed_time": "1:11:44", "remaining_time": "12:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 4438, "loss": 0.2009, "learning_rate": 4.977793984613202e-06, "epoch": 0.09034838200918129, "percentage": 9.04, "elapsed_time": "1:11:55", "remaining_time": "12:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 4438, "loss": 0.1995, "learning_rate": 4.977545552778333e-06, "epoch": 0.09057368969498972, "percentage": 9.06, "elapsed_time": "1:12:05", "remaining_time": "12:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 4438, "loss": 0.2, "learning_rate": 4.977295745254766e-06, "epoch": 0.09079899738079815, "percentage": 9.08, "elapsed_time": "1:12:17", "remaining_time": "12:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 4438, "loss": 0.1829, "learning_rate": 4.977044562181212e-06, "epoch": 0.09102430506660658, "percentage": 9.1, "elapsed_time": "1:12:27", "remaining_time": "12:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.9767920036971406e-06, "epoch": 0.09124961275241501, "percentage": 9.13, "elapsed_time": "1:12:38", "remaining_time": "12:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 4438, "loss": 0.1856, "learning_rate": 4.9765380699427905e-06, "epoch": 0.09147492043822344, "percentage": 9.15, "elapsed_time": "1:12:49", "remaining_time": "12:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 4438, "loss": 0.2181, "learning_rate": 4.97628276105916e-06, "epoch": 0.09170022812403188, "percentage": 9.17, "elapsed_time": "1:12:58", "remaining_time": "12:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 4438, "loss": 0.1988, "learning_rate": 4.976026077188013e-06, "epoch": 0.09192553580984031, "percentage": 9.19, "elapsed_time": "1:13:09", "remaining_time": "12:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.975768018471877e-06, "epoch": 0.09215084349564874, "percentage": 9.22, "elapsed_time": "1:13:19", "remaining_time": "12:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 4438, "loss": 0.2019, "learning_rate": 4.9755085850540426e-06, "epoch": 0.09237615118145717, "percentage": 9.24, "elapsed_time": "1:13:31", "remaining_time": "12:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 4438, "loss": 0.204, "learning_rate": 4.9752477770785625e-06, "epoch": 0.0926014588672656, "percentage": 9.26, "elapsed_time": "1:13:39", "remaining_time": "12:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 4438, "loss": 0.2005, "learning_rate": 4.974985594690255e-06, "epoch": 0.09282676655307404, "percentage": 9.28, "elapsed_time": "1:13:50", "remaining_time": "12:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.9747220380346975e-06, "epoch": 0.09305207423888247, "percentage": 9.31, "elapsed_time": "1:14:00", "remaining_time": "12:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 4438, "loss": 0.21, "learning_rate": 4.9744571072582365e-06, "epoch": 0.0932773819246909, "percentage": 9.33, "elapsed_time": "1:14:09", "remaining_time": "12:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 4438, "loss": 0.1984, "learning_rate": 4.974190802507977e-06, "epoch": 0.09350268961049933, "percentage": 9.35, "elapsed_time": "1:14:20", "remaining_time": "12:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 4438, "loss": 0.1992, "learning_rate": 4.973923123931786e-06, "epoch": 0.09372799729630776, "percentage": 9.37, "elapsed_time": "1:14:30", "remaining_time": "12:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 4438, "loss": 0.1959, "learning_rate": 4.973654071678299e-06, "epoch": 0.09395330498211621, "percentage": 9.4, "elapsed_time": "1:14:40", "remaining_time": "12:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 4438, "loss": 0.2027, "learning_rate": 4.973383645896908e-06, "epoch": 0.09417861266792464, "percentage": 9.42, "elapsed_time": "1:14:51", "remaining_time": "11:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 4438, "loss": 0.1903, "learning_rate": 4.973111846737772e-06, "epoch": 0.09440392035373307, "percentage": 9.44, "elapsed_time": "1:15:03", "remaining_time": "11:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 4438, "loss": 0.1931, "learning_rate": 4.97283867435181e-06, "epoch": 0.0946292280395415, "percentage": 9.46, "elapsed_time": "1:15:13", "remaining_time": "11:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 4438, "loss": 0.211, "learning_rate": 4.972564128890704e-06, "epoch": 0.09485453572534994, "percentage": 9.49, "elapsed_time": "1:15:23", "remaining_time": "11:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 4438, "loss": 0.1978, "learning_rate": 4.972288210506902e-06, "epoch": 0.09507984341115837, "percentage": 9.51, "elapsed_time": "1:15:34", "remaining_time": "11:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 4438, "loss": 0.1926, "learning_rate": 4.972010919353606e-06, "epoch": 0.0953051510969668, "percentage": 9.53, "elapsed_time": "1:15:44", "remaining_time": "11:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 4438, "loss": 0.1937, "learning_rate": 4.971732255584789e-06, "epoch": 0.09553045878277523, "percentage": 9.55, "elapsed_time": "1:15:54", "remaining_time": "11:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.971452219355182e-06, "epoch": 0.09575576646858366, "percentage": 9.58, "elapsed_time": "1:16:05", "remaining_time": "11:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 4438, "loss": 0.1964, "learning_rate": 4.971170810820279e-06, "epoch": 0.0959810741543921, "percentage": 9.6, "elapsed_time": "1:16:16", "remaining_time": "11:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 4438, "loss": 0.1928, "learning_rate": 4.970888030136335e-06, "epoch": 0.09620638184020053, "percentage": 9.62, "elapsed_time": "1:16:27", "remaining_time": "11:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 4438, "loss": 0.212, "learning_rate": 4.970603877460367e-06, "epoch": 0.09643168952600896, "percentage": 9.64, "elapsed_time": "1:16:37", "remaining_time": "11:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 4438, "loss": 0.2203, "learning_rate": 4.970318352950155e-06, "epoch": 0.09665699721181739, "percentage": 9.67, "elapsed_time": "1:16:47", "remaining_time": "11:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 4438, "loss": 0.2109, "learning_rate": 4.970031456764242e-06, "epoch": 0.09688230489762582, "percentage": 9.69, "elapsed_time": "1:16:58", "remaining_time": "11:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 4438, "loss": 0.1989, "learning_rate": 4.9697431890619265e-06, "epoch": 0.09710761258343426, "percentage": 9.71, "elapsed_time": "1:17:08", "remaining_time": "11:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 4438, "loss": 0.1925, "learning_rate": 4.969453550003277e-06, "epoch": 0.09733292026924269, "percentage": 9.73, "elapsed_time": "1:17:18", "remaining_time": "11:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 4438, "loss": 0.2022, "learning_rate": 4.969162539749117e-06, "epoch": 0.09755822795505112, "percentage": 9.76, "elapsed_time": "1:17:28", "remaining_time": "11:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 4438, "loss": 0.1842, "learning_rate": 4.9688701584610345e-06, "epoch": 0.09778353564085955, "percentage": 9.78, "elapsed_time": "1:17:39", "remaining_time": "11:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 4438, "loss": 0.1914, "learning_rate": 4.968576406301377e-06, "epoch": 0.09800884332666798, "percentage": 9.8, "elapsed_time": "1:17:50", "remaining_time": "11:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 4438, "loss": 0.1934, "learning_rate": 4.968281283433256e-06, "epoch": 0.09823415101247641, "percentage": 9.82, "elapsed_time": "1:18:01", "remaining_time": "11:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 4438, "loss": 0.1887, "learning_rate": 4.96798479002054e-06, "epoch": 0.09845945869828485, "percentage": 9.85, "elapsed_time": "1:18:13", "remaining_time": "11:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 4438, "loss": 0.1959, "learning_rate": 4.967686926227862e-06, "epoch": 0.09868476638409328, "percentage": 9.87, "elapsed_time": "1:18:24", "remaining_time": "11:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 4438, "loss": 0.2149, "learning_rate": 4.967387692220615e-06, "epoch": 0.09891007406990171, "percentage": 9.89, "elapsed_time": "1:18:34", "remaining_time": "11:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 4438, "loss": 0.1925, "learning_rate": 4.967087088164951e-06, "epoch": 0.09913538175571014, "percentage": 9.91, "elapsed_time": "1:18:44", "remaining_time": "11:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 4438, "loss": 0.1931, "learning_rate": 4.966785114227785e-06, "epoch": 0.09936068944151857, "percentage": 9.94, "elapsed_time": "1:18:54", "remaining_time": "11:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 4438, "loss": 0.2061, "learning_rate": 4.966481770576793e-06, "epoch": 0.099585997127327, "percentage": 9.96, "elapsed_time": "1:19:06", "remaining_time": "11:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 4438, "loss": 0.1853, "learning_rate": 4.966177057380409e-06, "epoch": 0.09981130481313544, "percentage": 9.98, "elapsed_time": "1:19:15", "remaining_time": "11:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 4438, "loss": 0.1972, "learning_rate": 4.965870974807829e-06, "epoch": 0.10003661249894387, "percentage": 10.0, "elapsed_time": "1:19:26", "remaining_time": "11:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 4438, "loss": 0.2147, "learning_rate": 4.96556352302901e-06, "epoch": 0.1002619201847523, "percentage": 10.03, "elapsed_time": "1:19:38", "remaining_time": "11:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 4438, "loss": 0.2011, "learning_rate": 4.965254702214668e-06, "epoch": 0.10048722787056073, "percentage": 10.05, "elapsed_time": "1:19:49", "remaining_time": "11:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 4438, "loss": 0.1946, "learning_rate": 4.96494451253628e-06, "epoch": 0.10071253555636916, "percentage": 10.07, "elapsed_time": "1:20:00", "remaining_time": "11:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 4438, "loss": 0.2197, "learning_rate": 4.964632954166081e-06, "epoch": 0.1009378432421776, "percentage": 10.09, "elapsed_time": "1:20:12", "remaining_time": "11:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 4438, "loss": 0.1691, "learning_rate": 4.964320027277071e-06, "epoch": 0.10116315092798603, "percentage": 10.12, "elapsed_time": "1:20:22", "remaining_time": "11:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 4438, "loss": 0.2015, "learning_rate": 4.964005732043003e-06, "epoch": 0.10138845861379446, "percentage": 10.14, "elapsed_time": "1:20:34", "remaining_time": "11:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 4438, "loss": 0.1953, "learning_rate": 4.963690068638397e-06, "epoch": 0.10161376629960289, "percentage": 10.16, "elapsed_time": "1:20:44", "remaining_time": "11:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 4438, "loss": 0.2014, "learning_rate": 4.963373037238527e-06, "epoch": 0.10183907398541132, "percentage": 10.18, "elapsed_time": "1:20:54", "remaining_time": "11:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 4438, "loss": 0.1957, "learning_rate": 4.963054638019429e-06, "epoch": 0.10206438167121976, "percentage": 10.21, "elapsed_time": "1:21:06", "remaining_time": "11:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 4438, "loss": 0.1875, "learning_rate": 4.9627348711578996e-06, "epoch": 0.10228968935702819, "percentage": 10.23, "elapsed_time": "1:21:17", "remaining_time": "11:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 4438, "loss": 0.2103, "learning_rate": 4.962413736831491e-06, "epoch": 0.10251499704283662, "percentage": 10.25, "elapsed_time": "1:21:28", "remaining_time": "11:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 4438, "loss": 0.207, "learning_rate": 4.962091235218518e-06, "epoch": 0.10274030472864505, "percentage": 10.27, "elapsed_time": "1:21:38", "remaining_time": "11:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 4438, "loss": 0.2063, "learning_rate": 4.961767366498055e-06, "epoch": 0.10296561241445348, "percentage": 10.3, "elapsed_time": "1:21:49", "remaining_time": "11:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 4438, "loss": 0.1943, "learning_rate": 4.961442130849933e-06, "epoch": 0.10319092010026192, "percentage": 10.32, "elapsed_time": "1:21:59", "remaining_time": "11:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 4438, "loss": 0.2184, "learning_rate": 4.961115528454743e-06, "epoch": 0.10341622778607035, "percentage": 10.34, "elapsed_time": "1:22:09", "remaining_time": "11:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 4438, "loss": 0.1928, "learning_rate": 4.960787559493836e-06, "epoch": 0.10364153547187878, "percentage": 10.37, "elapsed_time": "1:22:19", "remaining_time": "11:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 4438, "loss": 0.205, "learning_rate": 4.96045822414932e-06, "epoch": 0.10386684315768721, "percentage": 10.39, "elapsed_time": "1:22:30", "remaining_time": "11:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.960127522604065e-06, "epoch": 0.10409215084349564, "percentage": 10.41, "elapsed_time": "1:22:41", "remaining_time": "11:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.959795455041694e-06, "epoch": 0.10431745852930407, "percentage": 10.43, "elapsed_time": "1:22:53", "remaining_time": "11:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 4438, "loss": 0.1999, "learning_rate": 4.959462021646593e-06, "epoch": 0.1045427662151125, "percentage": 10.46, "elapsed_time": "1:23:04", "remaining_time": "11:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.959127222603905e-06, "epoch": 0.10476807390092094, "percentage": 10.48, "elapsed_time": "1:23:15", "remaining_time": "11:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 4438, "loss": 0.203, "learning_rate": 4.958791058099533e-06, "epoch": 0.10499338158672938, "percentage": 10.5, "elapsed_time": "1:23:27", "remaining_time": "11:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 4438, "loss": 0.1858, "learning_rate": 4.958453528320135e-06, "epoch": 0.10521868927253782, "percentage": 10.52, "elapsed_time": "1:23:38", "remaining_time": "11:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 4438, "loss": 0.1999, "learning_rate": 4.95811463345313e-06, "epoch": 0.10544399695834625, "percentage": 10.55, "elapsed_time": "1:23:48", "remaining_time": "11:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 4438, "loss": 0.2144, "learning_rate": 4.957774373686692e-06, "epoch": 0.10566930464415468, "percentage": 10.57, "elapsed_time": "1:24:01", "remaining_time": "11:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 4438, "loss": 0.2077, "learning_rate": 4.957432749209755e-06, "epoch": 0.10589461232996311, "percentage": 10.59, "elapsed_time": "1:24:12", "remaining_time": "11:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 4438, "loss": 0.1986, "learning_rate": 4.95708976021201e-06, "epoch": 0.10611992001577154, "percentage": 10.61, "elapsed_time": "1:24:22", "remaining_time": "11:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 4438, "loss": 0.1942, "learning_rate": 4.956745406883909e-06, "epoch": 0.10634522770157998, "percentage": 10.64, "elapsed_time": "1:24:33", "remaining_time": "11:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 4438, "loss": 0.1851, "learning_rate": 4.956399689416654e-06, "epoch": 0.10657053538738841, "percentage": 10.66, "elapsed_time": "1:24:42", "remaining_time": "11:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 4438, "loss": 0.2055, "learning_rate": 4.956052608002212e-06, "epoch": 0.10679584307319684, "percentage": 10.68, "elapsed_time": "1:24:54", "remaining_time": "11:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 4438, "loss": 0.2107, "learning_rate": 4.9557041628333046e-06, "epoch": 0.10702115075900527, "percentage": 10.7, "elapsed_time": "1:25:05", "remaining_time": "11:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.9553543541034086e-06, "epoch": 0.1072464584448137, "percentage": 10.73, "elapsed_time": "1:25:17", "remaining_time": "11:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 4438, "loss": 0.1892, "learning_rate": 4.955003182006761e-06, "epoch": 0.10747176613062213, "percentage": 10.75, "elapsed_time": "1:25:28", "remaining_time": "11:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 4438, "loss": 0.2048, "learning_rate": 4.954650646738354e-06, "epoch": 0.10769707381643057, "percentage": 10.77, "elapsed_time": "1:25:38", "remaining_time": "11:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 4438, "loss": 0.199, "learning_rate": 4.954296748493938e-06, "epoch": 0.107922381502239, "percentage": 10.79, "elapsed_time": "1:25:49", "remaining_time": "11:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 4438, "loss": 0.1925, "learning_rate": 4.953941487470017e-06, "epoch": 0.10814768918804743, "percentage": 10.82, "elapsed_time": "1:25:58", "remaining_time": "11:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 4438, "loss": 0.1965, "learning_rate": 4.9535848638638586e-06, "epoch": 0.10837299687385586, "percentage": 10.84, "elapsed_time": "1:26:09", "remaining_time": "11:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 4438, "loss": 0.2186, "learning_rate": 4.953226877873479e-06, "epoch": 0.1085983045596643, "percentage": 10.86, "elapsed_time": "1:26:20", "remaining_time": "11:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 4438, "loss": 0.1975, "learning_rate": 4.952867529697656e-06, "epoch": 0.10882361224547273, "percentage": 10.88, "elapsed_time": "1:26:30", "remaining_time": "11:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 4438, "loss": 0.2, "learning_rate": 4.952506819535922e-06, "epoch": 0.10904891993128116, "percentage": 10.91, "elapsed_time": "1:26:41", "remaining_time": "11:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 4438, "loss": 0.2106, "learning_rate": 4.952144747588566e-06, "epoch": 0.10927422761708959, "percentage": 10.93, "elapsed_time": "1:26:52", "remaining_time": "11:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 4438, "loss": 0.2, "learning_rate": 4.951781314056633e-06, "epoch": 0.10949953530289802, "percentage": 10.95, "elapsed_time": "1:27:02", "remaining_time": "11:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 4438, "loss": 0.2018, "learning_rate": 4.951416519141923e-06, "epoch": 0.10972484298870645, "percentage": 10.97, "elapsed_time": "1:27:12", "remaining_time": "11:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 4438, "loss": 0.1877, "learning_rate": 4.951050363046995e-06, "epoch": 0.10995015067451488, "percentage": 11.0, "elapsed_time": "1:27:23", "remaining_time": "11:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 4438, "loss": 0.2161, "learning_rate": 4.95068284597516e-06, "epoch": 0.11017545836032332, "percentage": 11.02, "elapsed_time": "1:27:34", "remaining_time": "11:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 4438, "loss": 0.212, "learning_rate": 4.950313968130488e-06, "epoch": 0.11040076604613175, "percentage": 11.04, "elapsed_time": "1:27:45", "remaining_time": "11:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 4438, "loss": 0.2014, "learning_rate": 4.949943729717802e-06, "epoch": 0.11062607373194018, "percentage": 11.06, "elapsed_time": "1:27:56", "remaining_time": "11:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 4438, "loss": 0.1949, "learning_rate": 4.949572130942683e-06, "epoch": 0.11085138141774861, "percentage": 11.09, "elapsed_time": "1:28:06", "remaining_time": "11:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 4438, "loss": 0.1995, "learning_rate": 4.949199172011464e-06, "epoch": 0.11107668910355704, "percentage": 11.11, "elapsed_time": "1:28:16", "remaining_time": "11:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 4438, "loss": 0.2122, "learning_rate": 4.948824853131237e-06, "epoch": 0.11130199678936548, "percentage": 11.13, "elapsed_time": "1:28:27", "remaining_time": "11:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 4438, "loss": 0.203, "learning_rate": 4.948449174509846e-06, "epoch": 0.11152730447517391, "percentage": 11.15, "elapsed_time": "1:28:39", "remaining_time": "11:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 4438, "loss": 0.1931, "learning_rate": 4.948072136355892e-06, "epoch": 0.11175261216098234, "percentage": 11.18, "elapsed_time": "1:28:48", "remaining_time": "11:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 4438, "loss": 0.2079, "learning_rate": 4.94769373887873e-06, "epoch": 0.11197791984679077, "percentage": 11.2, "elapsed_time": "1:29:00", "remaining_time": "11:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 4438, "loss": 0.2071, "learning_rate": 4.94731398228847e-06, "epoch": 0.1122032275325992, "percentage": 11.22, "elapsed_time": "1:29:11", "remaining_time": "11:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 4438, "loss": 0.2018, "learning_rate": 4.946932866795977e-06, "epoch": 0.11242853521840764, "percentage": 11.24, "elapsed_time": "1:29:21", "remaining_time": "11:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 4438, "loss": 0.2014, "learning_rate": 4.94655039261287e-06, "epoch": 0.11265384290421607, "percentage": 11.27, "elapsed_time": "1:29:31", "remaining_time": "11:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 4438, "eval_loss": 0.19670069217681885, "epoch": 0.11265384290421607, "percentage": 11.27, "elapsed_time": "1:31:33", "remaining_time": "12:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 4438, "loss": 0.1869, "learning_rate": 4.946166559951523e-06, "epoch": 0.1128791505900245, "percentage": 11.29, "elapsed_time": "1:31:43", "remaining_time": "12:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 4438, "loss": 0.2047, "learning_rate": 4.9457813690250635e-06, "epoch": 0.11310445827583293, "percentage": 11.31, "elapsed_time": "1:31:53", "remaining_time": "12:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 4438, "loss": 0.1936, "learning_rate": 4.945394820047373e-06, "epoch": 0.11332976596164136, "percentage": 11.33, "elapsed_time": "1:32:04", "remaining_time": "12:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 4438, "loss": 0.1904, "learning_rate": 4.94500691323309e-06, "epoch": 0.1135550736474498, "percentage": 11.36, "elapsed_time": "1:32:15", "remaining_time": "12:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 4438, "loss": 0.2187, "learning_rate": 4.944617648797602e-06, "epoch": 0.11378038133325823, "percentage": 11.38, "elapsed_time": "1:32:26", "remaining_time": "11:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 4438, "loss": 0.1808, "learning_rate": 4.9442270269570545e-06, "epoch": 0.11400568901906666, "percentage": 11.4, "elapsed_time": "1:32:37", "remaining_time": "11:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 4438, "loss": 0.1702, "learning_rate": 4.943835047928346e-06, "epoch": 0.11423099670487509, "percentage": 11.42, "elapsed_time": "1:32:48", "remaining_time": "11:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 4438, "loss": 0.2109, "learning_rate": 4.943441711929126e-06, "epoch": 0.11445630439068352, "percentage": 11.45, "elapsed_time": "1:32:59", "remaining_time": "11:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 4438, "loss": 0.2074, "learning_rate": 4.9430470191778e-06, "epoch": 0.11468161207649195, "percentage": 11.47, "elapsed_time": "1:33:10", "remaining_time": "11:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 4438, "loss": 0.1966, "learning_rate": 4.942650969893527e-06, "epoch": 0.11490691976230039, "percentage": 11.49, "elapsed_time": "1:33:21", "remaining_time": "11:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 4438, "loss": 0.2072, "learning_rate": 4.942253564296217e-06, "epoch": 0.11513222744810882, "percentage": 11.51, "elapsed_time": "1:33:31", "remaining_time": "11:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 4438, "loss": 0.1953, "learning_rate": 4.941854802606537e-06, "epoch": 0.11535753513391725, "percentage": 11.54, "elapsed_time": "1:33:42", "remaining_time": "11:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 4438, "loss": 0.1757, "learning_rate": 4.9414546850459014e-06, "epoch": 0.11558284281972568, "percentage": 11.56, "elapsed_time": "1:33:53", "remaining_time": "11:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 4438, "loss": 0.1793, "learning_rate": 4.941053211836482e-06, "epoch": 0.11580815050553411, "percentage": 11.58, "elapsed_time": "1:34:03", "remaining_time": "11:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 4438, "loss": 0.1937, "learning_rate": 4.940650383201202e-06, "epoch": 0.11603345819134256, "percentage": 11.6, "elapsed_time": "1:34:13", "remaining_time": "11:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 4438, "loss": 0.1917, "learning_rate": 4.940246199363737e-06, "epoch": 0.11625876587715099, "percentage": 11.63, "elapsed_time": "1:34:24", "remaining_time": "11:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 4438, "loss": 0.1977, "learning_rate": 4.939840660548515e-06, "epoch": 0.11648407356295942, "percentage": 11.65, "elapsed_time": "1:34:34", "remaining_time": "11:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 4438, "loss": 0.1835, "learning_rate": 4.939433766980717e-06, "epoch": 0.11670938124876785, "percentage": 11.67, "elapsed_time": "1:34:44", "remaining_time": "11:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 4438, "loss": 0.2035, "learning_rate": 4.939025518886276e-06, "epoch": 0.11693468893457629, "percentage": 11.69, "elapsed_time": "1:34:55", "remaining_time": "11:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 4438, "loss": 0.1888, "learning_rate": 4.9386159164918764e-06, "epoch": 0.11715999662038472, "percentage": 11.72, "elapsed_time": "1:35:05", "remaining_time": "11:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 4438, "loss": 0.2058, "learning_rate": 4.938204960024955e-06, "epoch": 0.11738530430619315, "percentage": 11.74, "elapsed_time": "1:35:16", "remaining_time": "11:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 4438, "loss": 0.1912, "learning_rate": 4.937792649713701e-06, "epoch": 0.11761061199200158, "percentage": 11.76, "elapsed_time": "1:35:27", "remaining_time": "11:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 4438, "loss": 0.1839, "learning_rate": 4.937378985787055e-06, "epoch": 0.11783591967781001, "percentage": 11.78, "elapsed_time": "1:35:38", "remaining_time": "11:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 4438, "loss": 0.1879, "learning_rate": 4.9369639684747095e-06, "epoch": 0.11806122736361845, "percentage": 11.81, "elapsed_time": "1:35:50", "remaining_time": "11:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 4438, "loss": 0.2036, "learning_rate": 4.936547598007107e-06, "epoch": 0.11828653504942688, "percentage": 11.83, "elapsed_time": "1:36:02", "remaining_time": "11:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 4438, "loss": 0.1759, "learning_rate": 4.936129874615443e-06, "epoch": 0.11851184273523531, "percentage": 11.85, "elapsed_time": "1:36:12", "remaining_time": "11:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 4438, "loss": 0.1984, "learning_rate": 4.935710798531664e-06, "epoch": 0.11873715042104374, "percentage": 11.87, "elapsed_time": "1:36:22", "remaining_time": "11:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 4438, "loss": 0.207, "learning_rate": 4.935290369988468e-06, "epoch": 0.11896245810685217, "percentage": 11.9, "elapsed_time": "1:36:32", "remaining_time": "11:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 4438, "loss": 0.2081, "learning_rate": 4.934868589219302e-06, "epoch": 0.1191877657926606, "percentage": 11.92, "elapsed_time": "1:36:43", "remaining_time": "11:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 4438, "loss": 0.1899, "learning_rate": 4.934445456458366e-06, "epoch": 0.11941307347846904, "percentage": 11.94, "elapsed_time": "1:36:53", "remaining_time": "11:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 4438, "loss": 0.2124, "learning_rate": 4.934020971940609e-06, "epoch": 0.11963838116427747, "percentage": 11.96, "elapsed_time": "1:37:03", "remaining_time": "11:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.933595135901733e-06, "epoch": 0.1198636888500859, "percentage": 11.99, "elapsed_time": "1:37:13", "remaining_time": "11:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 4438, "loss": 0.1881, "learning_rate": 4.933167948578187e-06, "epoch": 0.12008899653589433, "percentage": 12.01, "elapsed_time": "1:37:24", "remaining_time": "11:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 4438, "loss": 0.2045, "learning_rate": 4.932739410207172e-06, "epoch": 0.12031430422170276, "percentage": 12.03, "elapsed_time": "1:37:33", "remaining_time": "11:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 4438, "loss": 0.1976, "learning_rate": 4.932309521026643e-06, "epoch": 0.1205396119075112, "percentage": 12.05, "elapsed_time": "1:37:43", "remaining_time": "11:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 4438, "loss": 0.1893, "learning_rate": 4.931878281275296e-06, "epoch": 0.12076491959331963, "percentage": 12.08, "elapsed_time": "1:37:54", "remaining_time": "11:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 4438, "loss": 0.1864, "learning_rate": 4.931445691192587e-06, "epoch": 0.12099022727912806, "percentage": 12.1, "elapsed_time": "1:38:06", "remaining_time": "11:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 4438, "loss": 0.195, "learning_rate": 4.931011751018715e-06, "epoch": 0.12121553496493649, "percentage": 12.12, "elapsed_time": "1:38:15", "remaining_time": "11:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 4438, "loss": 0.1782, "learning_rate": 4.930576460994631e-06, "epoch": 0.12144084265074492, "percentage": 12.15, "elapsed_time": "1:38:25", "remaining_time": "11:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 4438, "loss": 0.2007, "learning_rate": 4.930139821362036e-06, "epoch": 0.12166615033655336, "percentage": 12.17, "elapsed_time": "1:38:37", "remaining_time": "11:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 4438, "loss": 0.2006, "learning_rate": 4.929701832363379e-06, "epoch": 0.12189145802236179, "percentage": 12.19, "elapsed_time": "1:38:46", "remaining_time": "11:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.929262494241859e-06, "epoch": 0.12211676570817022, "percentage": 12.21, "elapsed_time": "1:38:56", "remaining_time": "11:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 4438, "loss": 0.1903, "learning_rate": 4.928821807241425e-06, "epoch": 0.12234207339397865, "percentage": 12.24, "elapsed_time": "1:39:06", "remaining_time": "11:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 4438, "loss": 0.1887, "learning_rate": 4.928379771606773e-06, "epoch": 0.12256738107978708, "percentage": 12.26, "elapsed_time": "1:39:15", "remaining_time": "11:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 4438, "loss": 0.2071, "learning_rate": 4.927936387583348e-06, "epoch": 0.12279268876559551, "percentage": 12.28, "elapsed_time": "1:39:26", "remaining_time": "11:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 4438, "loss": 0.1823, "learning_rate": 4.927491655417347e-06, "epoch": 0.12301799645140395, "percentage": 12.3, "elapsed_time": "1:39:36", "remaining_time": "11:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 4438, "loss": 0.2031, "learning_rate": 4.927045575355712e-06, "epoch": 0.12324330413721238, "percentage": 12.33, "elapsed_time": "1:39:46", "remaining_time": "11:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 4438, "loss": 0.1941, "learning_rate": 4.926598147646134e-06, "epoch": 0.12346861182302081, "percentage": 12.35, "elapsed_time": "1:39:57", "remaining_time": "11:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 4438, "loss": 0.1748, "learning_rate": 4.9261493725370546e-06, "epoch": 0.12369391950882924, "percentage": 12.37, "elapsed_time": "1:40:08", "remaining_time": "11:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 4438, "loss": 0.1956, "learning_rate": 4.9256992502776605e-06, "epoch": 0.12391922719463767, "percentage": 12.39, "elapsed_time": "1:40:18", "remaining_time": "11:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 4438, "loss": 0.1791, "learning_rate": 4.925247781117888e-06, "epoch": 0.1241445348804461, "percentage": 12.42, "elapsed_time": "1:40:29", "remaining_time": "11:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 4438, "loss": 0.1788, "learning_rate": 4.924794965308421e-06, "epoch": 0.12436984256625454, "percentage": 12.44, "elapsed_time": "1:40:39", "remaining_time": "11:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 4438, "loss": 0.2084, "learning_rate": 4.924340803100692e-06, "epoch": 0.12459515025206297, "percentage": 12.46, "elapsed_time": "1:40:49", "remaining_time": "11:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 4438, "loss": 0.1937, "learning_rate": 4.9238852947468796e-06, "epoch": 0.1248204579378714, "percentage": 12.48, "elapsed_time": "1:40:58", "remaining_time": "11:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 4438, "loss": 0.1937, "learning_rate": 4.923428440499912e-06, "epoch": 0.12504576562367983, "percentage": 12.51, "elapsed_time": "1:41:09", "remaining_time": "11:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 4438, "loss": 0.1976, "learning_rate": 4.922970240613461e-06, "epoch": 0.12527107330948828, "percentage": 12.53, "elapsed_time": "1:41:20", "remaining_time": "11:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 4438, "loss": 0.1964, "learning_rate": 4.92251069534195e-06, "epoch": 0.1254963809952967, "percentage": 12.55, "elapsed_time": "1:41:31", "remaining_time": "11:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 4438, "loss": 0.2018, "learning_rate": 4.922049804940546e-06, "epoch": 0.12572168868110514, "percentage": 12.57, "elapsed_time": "1:41:41", "remaining_time": "11:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.9215875696651645e-06, "epoch": 0.12594699636691356, "percentage": 12.6, "elapsed_time": "1:41:51", "remaining_time": "11:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 4438, "loss": 0.2022, "learning_rate": 4.9211239897724685e-06, "epoch": 0.126172304052722, "percentage": 12.62, "elapsed_time": "1:42:01", "remaining_time": "11:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 4438, "loss": 0.2059, "learning_rate": 4.920659065519866e-06, "epoch": 0.12639761173853042, "percentage": 12.64, "elapsed_time": "1:42:12", "remaining_time": "11:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 4438, "loss": 0.1913, "learning_rate": 4.920192797165511e-06, "epoch": 0.12662291942433887, "percentage": 12.66, "elapsed_time": "1:42:23", "remaining_time": "11:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 4438, "loss": 0.2029, "learning_rate": 4.919725184968307e-06, "epoch": 0.1268482271101473, "percentage": 12.69, "elapsed_time": "1:42:34", "remaining_time": "11:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 4438, "loss": 0.1858, "learning_rate": 4.9192562291879e-06, "epoch": 0.12707353479595573, "percentage": 12.71, "elapsed_time": "1:42:43", "remaining_time": "11:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 4438, "loss": 0.1881, "learning_rate": 4.9187859300846845e-06, "epoch": 0.12729884248176415, "percentage": 12.73, "elapsed_time": "1:42:54", "remaining_time": "11:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 4438, "loss": 0.2066, "learning_rate": 4.9183142879198e-06, "epoch": 0.1275241501675726, "percentage": 12.75, "elapsed_time": "1:43:04", "remaining_time": "11:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 4438, "loss": 0.1961, "learning_rate": 4.917841302955132e-06, "epoch": 0.12774945785338102, "percentage": 12.78, "elapsed_time": "1:43:14", "remaining_time": "11:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 4438, "loss": 0.1927, "learning_rate": 4.917366975453311e-06, "epoch": 0.12797476553918946, "percentage": 12.8, "elapsed_time": "1:43:24", "remaining_time": "11:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.916891305677712e-06, "epoch": 0.12820007322499788, "percentage": 12.82, "elapsed_time": "1:43:33", "remaining_time": "11:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 4438, "loss": 0.2036, "learning_rate": 4.9164142938924595e-06, "epoch": 0.12842538091080632, "percentage": 12.84, "elapsed_time": "1:43:46", "remaining_time": "11:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 4438, "loss": 0.1992, "learning_rate": 4.9159359403624185e-06, "epoch": 0.12865068859661474, "percentage": 12.87, "elapsed_time": "1:43:56", "remaining_time": "11:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.915456245353202e-06, "epoch": 0.1288759962824232, "percentage": 12.89, "elapsed_time": "1:44:07", "remaining_time": "11:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 4438, "loss": 0.2014, "learning_rate": 4.914975209131165e-06, "epoch": 0.1291013039682316, "percentage": 12.91, "elapsed_time": "1:44:18", "remaining_time": "11:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 4438, "loss": 0.2001, "learning_rate": 4.914492831963411e-06, "epoch": 0.12932661165404005, "percentage": 12.93, "elapsed_time": "1:44:30", "remaining_time": "11:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 4438, "loss": 0.204, "learning_rate": 4.9140091141177856e-06, "epoch": 0.12955191933984847, "percentage": 12.96, "elapsed_time": "1:44:39", "remaining_time": "11:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 4438, "loss": 0.2023, "learning_rate": 4.9135240558628786e-06, "epoch": 0.12977722702565692, "percentage": 12.98, "elapsed_time": "1:44:50", "remaining_time": "11:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.913037657468025e-06, "epoch": 0.13000253471146533, "percentage": 13.0, "elapsed_time": "1:45:01", "remaining_time": "11:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 4438, "loss": 0.1855, "learning_rate": 4.9125499192033035e-06, "epoch": 0.13022784239727378, "percentage": 13.02, "elapsed_time": "1:45:12", "remaining_time": "11:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.912060841339536e-06, "epoch": 0.1304531500830822, "percentage": 13.05, "elapsed_time": "1:45:23", "remaining_time": "11:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 4438, "loss": 0.1824, "learning_rate": 4.911570424148293e-06, "epoch": 0.13067845776889064, "percentage": 13.07, "elapsed_time": "1:45:33", "remaining_time": "11:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.911078667901881e-06, "epoch": 0.13090376545469906, "percentage": 13.09, "elapsed_time": "1:45:45", "remaining_time": "11:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 4438, "loss": 0.1874, "learning_rate": 4.910585572873355e-06, "epoch": 0.1311290731405075, "percentage": 13.11, "elapsed_time": "1:45:55", "remaining_time": "11:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 4438, "loss": 0.1692, "learning_rate": 4.9100911393365134e-06, "epoch": 0.13135438082631593, "percentage": 13.14, "elapsed_time": "1:46:05", "remaining_time": "11:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 4438, "loss": 0.2037, "learning_rate": 4.9095953675658945e-06, "epoch": 0.13157968851212437, "percentage": 13.16, "elapsed_time": "1:46:17", "remaining_time": "11:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 4438, "loss": 0.1754, "learning_rate": 4.909098257836784e-06, "epoch": 0.1318049961979328, "percentage": 13.18, "elapsed_time": "1:46:28", "remaining_time": "11:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 4438, "loss": 0.2, "learning_rate": 4.908599810425208e-06, "epoch": 0.13203030388374123, "percentage": 13.2, "elapsed_time": "1:46:39", "remaining_time": "11:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 4438, "loss": 0.1893, "learning_rate": 4.908100025607935e-06, "epoch": 0.13225561156954965, "percentage": 13.23, "elapsed_time": "1:46:50", "remaining_time": "11:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 4438, "loss": 0.1801, "learning_rate": 4.907598903662477e-06, "epoch": 0.1324809192553581, "percentage": 13.25, "elapsed_time": "1:47:00", "remaining_time": "11:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 4438, "loss": 0.2093, "learning_rate": 4.90709644486709e-06, "epoch": 0.13270622694116654, "percentage": 13.27, "elapsed_time": "1:47:11", "remaining_time": "11:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 4438, "loss": 0.1893, "learning_rate": 4.906592649500767e-06, "epoch": 0.13293153462697496, "percentage": 13.29, "elapsed_time": "1:47:21", "remaining_time": "11:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.906087517843251e-06, "epoch": 0.1331568423127834, "percentage": 13.32, "elapsed_time": "1:47:31", "remaining_time": "11:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 4438, "loss": 0.1885, "learning_rate": 4.9055810501750205e-06, "epoch": 0.13338214999859183, "percentage": 13.34, "elapsed_time": "1:47:41", "remaining_time": "11:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 4438, "loss": 0.1897, "learning_rate": 4.905073246777298e-06, "epoch": 0.13360745768440027, "percentage": 13.36, "elapsed_time": "1:47:52", "remaining_time": "11:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 4438, "loss": 0.1769, "learning_rate": 4.904564107932048e-06, "epoch": 0.1338327653702087, "percentage": 13.38, "elapsed_time": "1:48:04", "remaining_time": "11:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 4438, "loss": 0.1903, "learning_rate": 4.904053633921977e-06, "epoch": 0.13405807305601714, "percentage": 13.41, "elapsed_time": "1:48:14", "remaining_time": "11:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 4438, "loss": 0.1997, "learning_rate": 4.9035418250305314e-06, "epoch": 0.13428338074182555, "percentage": 13.43, "elapsed_time": "1:48:23", "remaining_time": "11:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 4438, "loss": 0.1818, "learning_rate": 4.9030286815419e-06, "epoch": 0.134508688427634, "percentage": 13.45, "elapsed_time": "1:48:33", "remaining_time": "11:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.902514203741013e-06, "epoch": 0.13473399611344242, "percentage": 13.47, "elapsed_time": "1:48:44", "remaining_time": "11:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 4438, "loss": 0.1835, "learning_rate": 4.901998391913539e-06, "epoch": 0.13495930379925086, "percentage": 13.5, "elapsed_time": "1:48:55", "remaining_time": "11:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 4438, "loss": 0.1846, "learning_rate": 4.9014812463458905e-06, "epoch": 0.13518461148505928, "percentage": 13.52, "elapsed_time": "1:49:05", "remaining_time": "11:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 4438, "loss": 0.193, "learning_rate": 4.9009627673252195e-06, "epoch": 0.13540991917086773, "percentage": 13.54, "elapsed_time": "1:49:16", "remaining_time": "11:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 4438, "loss": 0.1983, "learning_rate": 4.9004429551394155e-06, "epoch": 0.13563522685667614, "percentage": 13.56, "elapsed_time": "1:49:28", "remaining_time": "11:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 4438, "loss": 0.2019, "learning_rate": 4.899921810077114e-06, "epoch": 0.1358605345424846, "percentage": 13.59, "elapsed_time": "1:49:38", "remaining_time": "11:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 4438, "loss": 0.1885, "learning_rate": 4.899399332427685e-06, "epoch": 0.136085842228293, "percentage": 13.61, "elapsed_time": "1:49:49", "remaining_time": "11:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 4438, "loss": 0.1885, "learning_rate": 4.898875522481242e-06, "epoch": 0.13631114991410145, "percentage": 13.63, "elapsed_time": "1:49:59", "remaining_time": "11:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 4438, "loss": 0.1942, "learning_rate": 4.898350380528638e-06, "epoch": 0.13653645759990987, "percentage": 13.65, "elapsed_time": "1:50:09", "remaining_time": "11:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 4438, "loss": 0.2017, "learning_rate": 4.897823906861463e-06, "epoch": 0.13676176528571832, "percentage": 13.68, "elapsed_time": "1:50:19", "remaining_time": "11:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 4438, "loss": 0.1924, "learning_rate": 4.89729610177205e-06, "epoch": 0.13698707297152674, "percentage": 13.7, "elapsed_time": "1:50:30", "remaining_time": "11:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 4438, "loss": 0.2164, "learning_rate": 4.896766965553467e-06, "epoch": 0.13721238065733518, "percentage": 13.72, "elapsed_time": "1:50:41", "remaining_time": "11:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 4438, "loss": 0.2049, "learning_rate": 4.896236498499526e-06, "epoch": 0.1374376883431436, "percentage": 13.74, "elapsed_time": "1:50:52", "remaining_time": "11:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 4438, "loss": 0.1805, "learning_rate": 4.8957047009047744e-06, "epoch": 0.13766299602895204, "percentage": 13.77, "elapsed_time": "1:51:02", "remaining_time": "11:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 4438, "loss": 0.1904, "learning_rate": 4.8951715730645e-06, "epoch": 0.13788830371476046, "percentage": 13.79, "elapsed_time": "1:51:14", "remaining_time": "11:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 4438, "loss": 0.1892, "learning_rate": 4.894637115274728e-06, "epoch": 0.1381136114005689, "percentage": 13.81, "elapsed_time": "1:51:24", "remaining_time": "11:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 4438, "loss": 0.2121, "learning_rate": 4.894101327832225e-06, "epoch": 0.13833891908637733, "percentage": 13.84, "elapsed_time": "1:51:35", "remaining_time": "11:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 4438, "loss": 0.1854, "learning_rate": 4.893564211034492e-06, "epoch": 0.13856422677218577, "percentage": 13.86, "elapsed_time": "1:51:48", "remaining_time": "11:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 4438, "loss": 0.196, "learning_rate": 4.89302576517977e-06, "epoch": 0.1387895344579942, "percentage": 13.88, "elapsed_time": "1:51:55", "remaining_time": "11:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.892485990567037e-06, "epoch": 0.13901484214380264, "percentage": 13.9, "elapsed_time": "1:52:07", "remaining_time": "11:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 4438, "loss": 0.206, "learning_rate": 4.891944887496013e-06, "epoch": 0.13924014982961105, "percentage": 13.93, "elapsed_time": "1:52:17", "remaining_time": "11:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 4438, "loss": 0.1984, "learning_rate": 4.891402456267149e-06, "epoch": 0.1394654575154195, "percentage": 13.95, "elapsed_time": "1:52:28", "remaining_time": "11:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 4438, "loss": 0.1986, "learning_rate": 4.890858697181638e-06, "epoch": 0.13969076520122792, "percentage": 13.97, "elapsed_time": "1:52:40", "remaining_time": "11:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 4438, "loss": 0.1971, "learning_rate": 4.89031361054141e-06, "epoch": 0.13991607288703636, "percentage": 13.99, "elapsed_time": "1:52:51", "remaining_time": "11:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 4438, "loss": 0.1813, "learning_rate": 4.8897671966491315e-06, "epoch": 0.14014138057284478, "percentage": 14.02, "elapsed_time": "1:53:01", "remaining_time": "11:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 4438, "loss": 0.1852, "learning_rate": 4.889219455808204e-06, "epoch": 0.14036668825865323, "percentage": 14.04, "elapsed_time": "1:53:12", "remaining_time": "11:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 4438, "loss": 0.2021, "learning_rate": 4.888670388322768e-06, "epoch": 0.14059199594446165, "percentage": 14.06, "elapsed_time": "1:53:24", "remaining_time": "11:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 4438, "loss": 0.1772, "learning_rate": 4.888119994497701e-06, "epoch": 0.1408173036302701, "percentage": 14.08, "elapsed_time": "1:53:34", "remaining_time": "11:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.887568274638616e-06, "epoch": 0.1410426113160785, "percentage": 14.11, "elapsed_time": "1:53:45", "remaining_time": "11:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 4438, "loss": 0.1982, "learning_rate": 4.887015229051861e-06, "epoch": 0.14126791900188695, "percentage": 14.13, "elapsed_time": "1:53:56", "remaining_time": "11:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 4438, "loss": 0.1922, "learning_rate": 4.886460858044524e-06, "epoch": 0.14149322668769537, "percentage": 14.15, "elapsed_time": "1:54:06", "remaining_time": "11:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 4438, "loss": 0.1917, "learning_rate": 4.885905161924426e-06, "epoch": 0.14171853437350382, "percentage": 14.17, "elapsed_time": "1:54:16", "remaining_time": "11:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 4438, "loss": 0.1862, "learning_rate": 4.8853481410001225e-06, "epoch": 0.14194384205931224, "percentage": 14.2, "elapsed_time": "1:54:28", "remaining_time": "11:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 4438, "loss": 0.194, "learning_rate": 4.8847897955809085e-06, "epoch": 0.14216914974512068, "percentage": 14.22, "elapsed_time": "1:54:40", "remaining_time": "11:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 4438, "loss": 0.1715, "learning_rate": 4.884230125976812e-06, "epoch": 0.1423944574309291, "percentage": 14.24, "elapsed_time": "1:54:51", "remaining_time": "11:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 4438, "loss": 0.1992, "learning_rate": 4.8836691324985955e-06, "epoch": 0.14261976511673755, "percentage": 14.26, "elapsed_time": "1:55:02", "remaining_time": "11:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 4438, "loss": 0.1983, "learning_rate": 4.883106815457758e-06, "epoch": 0.14284507280254596, "percentage": 14.29, "elapsed_time": "1:55:13", "remaining_time": "11:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 4438, "loss": 0.1865, "learning_rate": 4.882543175166535e-06, "epoch": 0.1430703804883544, "percentage": 14.31, "elapsed_time": "1:55:23", "remaining_time": "11:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 4438, "loss": 0.2045, "learning_rate": 4.881978211937895e-06, "epoch": 0.14329568817416283, "percentage": 14.33, "elapsed_time": "1:55:33", "remaining_time": "11:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 4438, "loss": 0.1955, "learning_rate": 4.8814119260855374e-06, "epoch": 0.14352099585997127, "percentage": 14.35, "elapsed_time": "1:55:43", "remaining_time": "11:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 4438, "loss": 0.1829, "learning_rate": 4.8808443179239025e-06, "epoch": 0.14374630354577972, "percentage": 14.38, "elapsed_time": "1:55:53", "remaining_time": "11:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.880275387768162e-06, "epoch": 0.14397161123158814, "percentage": 14.4, "elapsed_time": "1:56:04", "remaining_time": "11:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.87970513593422e-06, "epoch": 0.14419691891739658, "percentage": 14.42, "elapsed_time": "1:56:14", "remaining_time": "11:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 4438, "loss": 0.2228, "learning_rate": 4.879133562738719e-06, "epoch": 0.144422226603205, "percentage": 14.44, "elapsed_time": "1:56:25", "remaining_time": "11:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 4438, "loss": 0.1982, "learning_rate": 4.878560668499029e-06, "epoch": 0.14464753428901345, "percentage": 14.47, "elapsed_time": "1:56:35", "remaining_time": "11:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 4438, "loss": 0.18, "learning_rate": 4.8779864535332585e-06, "epoch": 0.14487284197482186, "percentage": 14.49, "elapsed_time": "1:56:46", "remaining_time": "11:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 4438, "loss": 0.186, "learning_rate": 4.877410918160247e-06, "epoch": 0.1450981496606303, "percentage": 14.51, "elapsed_time": "1:56:54", "remaining_time": "11:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 4438, "loss": 0.2101, "learning_rate": 4.876834062699569e-06, "epoch": 0.14532345734643873, "percentage": 14.53, "elapsed_time": "1:57:06", "remaining_time": "11:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 4438, "loss": 0.1989, "learning_rate": 4.87625588747153e-06, "epoch": 0.14554876503224717, "percentage": 14.56, "elapsed_time": "1:57:17", "remaining_time": "11:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 4438, "loss": 0.1878, "learning_rate": 4.875676392797169e-06, "epoch": 0.1457740727180556, "percentage": 14.58, "elapsed_time": "1:57:29", "remaining_time": "11:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 4438, "loss": 0.2025, "learning_rate": 4.875095578998258e-06, "epoch": 0.14599938040386404, "percentage": 14.6, "elapsed_time": "1:57:40", "remaining_time": "11:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 4438, "loss": 0.1793, "learning_rate": 4.874513446397301e-06, "epoch": 0.14622468808967246, "percentage": 14.62, "elapsed_time": "1:57:49", "remaining_time": "11:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 4438, "loss": 0.1864, "learning_rate": 4.873929995317535e-06, "epoch": 0.1464499957754809, "percentage": 14.65, "elapsed_time": "1:57:59", "remaining_time": "11:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 4438, "loss": 0.1941, "learning_rate": 4.873345226082929e-06, "epoch": 0.14667530346128932, "percentage": 14.67, "elapsed_time": "1:58:09", "remaining_time": "11:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 4438, "loss": 0.1912, "learning_rate": 4.872759139018183e-06, "epoch": 0.14690061114709776, "percentage": 14.69, "elapsed_time": "1:58:18", "remaining_time": "11:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 4438, "loss": 0.2075, "learning_rate": 4.872171734448728e-06, "epoch": 0.14712591883290618, "percentage": 14.71, "elapsed_time": "1:58:28", "remaining_time": "11:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 4438, "loss": 0.1832, "learning_rate": 4.87158301270073e-06, "epoch": 0.14735122651871463, "percentage": 14.74, "elapsed_time": "1:58:39", "remaining_time": "11:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 4438, "loss": 0.1829, "learning_rate": 4.870992974101084e-06, "epoch": 0.14757653420452305, "percentage": 14.76, "elapsed_time": "1:58:51", "remaining_time": "11:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 4438, "loss": 0.2091, "learning_rate": 4.870401618977415e-06, "epoch": 0.1478018418903315, "percentage": 14.78, "elapsed_time": "1:59:01", "remaining_time": "11:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 4438, "loss": 0.1946, "learning_rate": 4.869808947658082e-06, "epoch": 0.1480271495761399, "percentage": 14.8, "elapsed_time": "1:59:13", "remaining_time": "11:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 4438, "loss": 0.1989, "learning_rate": 4.869214960472172e-06, "epoch": 0.14825245726194836, "percentage": 14.83, "elapsed_time": "1:59:25", "remaining_time": "11:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 4438, "loss": 0.2007, "learning_rate": 4.868619657749505e-06, "epoch": 0.14847776494775677, "percentage": 14.85, "elapsed_time": "1:59:37", "remaining_time": "11:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 4438, "loss": 0.2015, "learning_rate": 4.868023039820629e-06, "epoch": 0.14870307263356522, "percentage": 14.87, "elapsed_time": "1:59:49", "remaining_time": "11:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 4438, "loss": 0.1796, "learning_rate": 4.867425107016826e-06, "epoch": 0.14892838031937364, "percentage": 14.89, "elapsed_time": "1:59:58", "remaining_time": "11:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 4438, "loss": 0.171, "learning_rate": 4.8668258596701035e-06, "epoch": 0.14915368800518208, "percentage": 14.92, "elapsed_time": "2:00:09", "remaining_time": "11:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 4438, "loss": 0.1783, "learning_rate": 4.866225298113203e-06, "epoch": 0.1493789956909905, "percentage": 14.94, "elapsed_time": "2:00:19", "remaining_time": "11:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 4438, "loss": 0.2031, "learning_rate": 4.865623422679593e-06, "epoch": 0.14960430337679895, "percentage": 14.96, "elapsed_time": "2:00:30", "remaining_time": "11:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 4438, "loss": 0.207, "learning_rate": 4.865020233703472e-06, "epoch": 0.14982961106260737, "percentage": 14.98, "elapsed_time": "2:00:41", "remaining_time": "11:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 4438, "loss": 0.1875, "learning_rate": 4.864415731519769e-06, "epoch": 0.1500549187484158, "percentage": 15.01, "elapsed_time": "2:00:53", "remaining_time": "11:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 4438, "loss": 0.1943, "learning_rate": 4.863809916464142e-06, "epoch": 0.15028022643422423, "percentage": 15.03, "elapsed_time": "2:01:02", "remaining_time": "11:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 4438, "loss": 0.1933, "learning_rate": 4.8632027888729765e-06, "epoch": 0.15050553412003267, "percentage": 15.05, "elapsed_time": "2:01:12", "remaining_time": "11:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 4438, "loss": 0.1679, "learning_rate": 4.862594349083389e-06, "epoch": 0.1507308418058411, "percentage": 15.07, "elapsed_time": "2:01:23", "remaining_time": "11:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 4438, "loss": 0.1932, "learning_rate": 4.861984597433223e-06, "epoch": 0.15095614949164954, "percentage": 15.1, "elapsed_time": "2:01:34", "remaining_time": "11:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 4438, "loss": 0.1736, "learning_rate": 4.861373534261049e-06, "epoch": 0.15118145717745796, "percentage": 15.12, "elapsed_time": "2:01:44", "remaining_time": "11:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 4438, "loss": 0.2005, "learning_rate": 4.860761159906171e-06, "epoch": 0.1514067648632664, "percentage": 15.14, "elapsed_time": "2:01:56", "remaining_time": "11:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 4438, "loss": 0.1747, "learning_rate": 4.8601474747086145e-06, "epoch": 0.15163207254907482, "percentage": 15.16, "elapsed_time": "2:02:07", "remaining_time": "11:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 4438, "loss": 0.1982, "learning_rate": 4.859532479009138e-06, "epoch": 0.15185738023488327, "percentage": 15.19, "elapsed_time": "2:02:17", "remaining_time": "11:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 4438, "loss": 0.182, "learning_rate": 4.8589161731492255e-06, "epoch": 0.15208268792069168, "percentage": 15.21, "elapsed_time": "2:02:28", "remaining_time": "11:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 4438, "loss": 0.1898, "learning_rate": 4.858298557471089e-06, "epoch": 0.15230799560650013, "percentage": 15.23, "elapsed_time": "2:02:39", "remaining_time": "11:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 4438, "loss": 0.1972, "learning_rate": 4.857679632317664e-06, "epoch": 0.15253330329230855, "percentage": 15.25, "elapsed_time": "2:02:50", "remaining_time": "11:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 4438, "loss": 0.183, "learning_rate": 4.857059398032622e-06, "epoch": 0.152758610978117, "percentage": 15.28, "elapsed_time": "2:03:02", "remaining_time": "11:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 4438, "loss": 0.1921, "learning_rate": 4.856437854960352e-06, "epoch": 0.1529839186639254, "percentage": 15.3, "elapsed_time": "2:03:13", "remaining_time": "11:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 4438, "loss": 0.2011, "learning_rate": 4.855815003445975e-06, "epoch": 0.15320922634973386, "percentage": 15.32, "elapsed_time": "2:03:24", "remaining_time": "11:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.855190843835338e-06, "epoch": 0.15343453403554227, "percentage": 15.34, "elapsed_time": "2:03:34", "remaining_time": "11:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 4438, "loss": 0.2077, "learning_rate": 4.8545653764750125e-06, "epoch": 0.15365984172135072, "percentage": 15.37, "elapsed_time": "2:03:45", "remaining_time": "11:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 4438, "loss": 0.1867, "learning_rate": 4.853938601712297e-06, "epoch": 0.15388514940715914, "percentage": 15.39, "elapsed_time": "2:03:56", "remaining_time": "11:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 4438, "loss": 0.191, "learning_rate": 4.853310519895217e-06, "epoch": 0.15411045709296758, "percentage": 15.41, "elapsed_time": "2:04:07", "remaining_time": "11:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 4438, "loss": 0.1976, "learning_rate": 4.852681131372522e-06, "epoch": 0.154335764778776, "percentage": 15.43, "elapsed_time": "2:04:17", "remaining_time": "11:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 4438, "loss": 0.1966, "learning_rate": 4.85205043649369e-06, "epoch": 0.15456107246458445, "percentage": 15.46, "elapsed_time": "2:04:29", "remaining_time": "11:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 4438, "loss": 0.1849, "learning_rate": 4.851418435608919e-06, "epoch": 0.1547863801503929, "percentage": 15.48, "elapsed_time": "2:04:39", "remaining_time": "11:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 4438, "loss": 0.1862, "learning_rate": 4.850785129069139e-06, "epoch": 0.1550116878362013, "percentage": 15.5, "elapsed_time": "2:04:49", "remaining_time": "11:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 4438, "loss": 0.1864, "learning_rate": 4.850150517225999e-06, "epoch": 0.15523699552200976, "percentage": 15.53, "elapsed_time": "2:05:00", "remaining_time": "11:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 4438, "loss": 0.1795, "learning_rate": 4.849514600431877e-06, "epoch": 0.15546230320781818, "percentage": 15.55, "elapsed_time": "2:05:13", "remaining_time": "11:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 4438, "loss": 0.1991, "learning_rate": 4.848877379039874e-06, "epoch": 0.15568761089362662, "percentage": 15.57, "elapsed_time": "2:05:24", "remaining_time": "11:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 4438, "loss": 0.1843, "learning_rate": 4.848238853403813e-06, "epoch": 0.15591291857943504, "percentage": 15.59, "elapsed_time": "2:05:35", "remaining_time": "11:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 4438, "loss": 0.1951, "learning_rate": 4.847599023878245e-06, "epoch": 0.15613822626524348, "percentage": 15.62, "elapsed_time": "2:05:46", "remaining_time": "11:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 4438, "loss": 0.1942, "learning_rate": 4.846957890818444e-06, "epoch": 0.1563635339510519, "percentage": 15.64, "elapsed_time": "2:05:57", "remaining_time": "11:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 4438, "loss": 0.184, "learning_rate": 4.846315454580406e-06, "epoch": 0.15658884163686035, "percentage": 15.66, "elapsed_time": "2:06:08", "remaining_time": "11:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 4438, "loss": 0.1827, "learning_rate": 4.845671715520853e-06, "epoch": 0.15681414932266877, "percentage": 15.68, "elapsed_time": "2:06:19", "remaining_time": "11:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 4438, "loss": 0.1771, "learning_rate": 4.845026673997229e-06, "epoch": 0.1570394570084772, "percentage": 15.71, "elapsed_time": "2:06:29", "remaining_time": "11:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.844380330367701e-06, "epoch": 0.15726476469428563, "percentage": 15.73, "elapsed_time": "2:06:41", "remaining_time": "11:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 4438, "loss": 0.1892, "learning_rate": 4.843732684991161e-06, "epoch": 0.15749007238009408, "percentage": 15.75, "elapsed_time": "2:06:51", "remaining_time": "11:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 4438, "loss": 0.2068, "learning_rate": 4.84308373822722e-06, "epoch": 0.1577153800659025, "percentage": 15.77, "elapsed_time": "2:07:02", "remaining_time": "11:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.842433490436217e-06, "epoch": 0.15794068775171094, "percentage": 15.8, "elapsed_time": "2:07:11", "remaining_time": "11:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 4438, "loss": 0.1981, "learning_rate": 4.841781941979207e-06, "epoch": 0.15816599543751936, "percentage": 15.82, "elapsed_time": "2:07:22", "remaining_time": "11:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 4438, "loss": 0.1883, "learning_rate": 4.8411290932179734e-06, "epoch": 0.1583913031233278, "percentage": 15.84, "elapsed_time": "2:07:31", "remaining_time": "11:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 4438, "loss": 0.1947, "learning_rate": 4.840474944515017e-06, "epoch": 0.15861661080913622, "percentage": 15.86, "elapsed_time": "2:07:42", "remaining_time": "11:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 4438, "loss": 0.1949, "learning_rate": 4.839819496233562e-06, "epoch": 0.15884191849494467, "percentage": 15.89, "elapsed_time": "2:07:52", "remaining_time": "11:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 4438, "loss": 0.1862, "learning_rate": 4.839162748737556e-06, "epoch": 0.15906722618075309, "percentage": 15.91, "elapsed_time": "2:08:02", "remaining_time": "11:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 4438, "loss": 0.1897, "learning_rate": 4.838504702391665e-06, "epoch": 0.15929253386656153, "percentage": 15.93, "elapsed_time": "2:08:13", "remaining_time": "11:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 4438, "loss": 0.2044, "learning_rate": 4.8378453575612785e-06, "epoch": 0.15951784155236995, "percentage": 15.95, "elapsed_time": "2:08:23", "remaining_time": "11:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 4438, "loss": 0.1799, "learning_rate": 4.837184714612506e-06, "epoch": 0.1597431492381784, "percentage": 15.98, "elapsed_time": "2:08:32", "remaining_time": "11:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 4438, "loss": 0.1776, "learning_rate": 4.836522773912178e-06, "epoch": 0.1599684569239868, "percentage": 16.0, "elapsed_time": "2:08:42", "remaining_time": "11:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.835859535827844e-06, "epoch": 0.16019376460979526, "percentage": 16.02, "elapsed_time": "2:08:53", "remaining_time": "11:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 4438, "loss": 0.1989, "learning_rate": 4.835195000727778e-06, "epoch": 0.16041907229560368, "percentage": 16.04, "elapsed_time": "2:09:04", "remaining_time": "11:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 4438, "loss": 0.1972, "learning_rate": 4.834529168980969e-06, "epoch": 0.16064437998141212, "percentage": 16.07, "elapsed_time": "2:09:14", "remaining_time": "11:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 4438, "loss": 0.1868, "learning_rate": 4.83386204095713e-06, "epoch": 0.16086968766722054, "percentage": 16.09, "elapsed_time": "2:09:26", "remaining_time": "11:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 4438, "loss": 0.1902, "learning_rate": 4.833193617026692e-06, "epoch": 0.16109499535302899, "percentage": 16.11, "elapsed_time": "2:09:37", "remaining_time": "11:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 4438, "loss": 0.1814, "learning_rate": 4.832523897560806e-06, "epoch": 0.1613203030388374, "percentage": 16.13, "elapsed_time": "2:09:48", "remaining_time": "11:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 4438, "loss": 0.1896, "learning_rate": 4.831852882931342e-06, "epoch": 0.16154561072464585, "percentage": 16.16, "elapsed_time": "2:09:59", "remaining_time": "11:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 4438, "loss": 0.1958, "learning_rate": 4.83118057351089e-06, "epoch": 0.16177091841045427, "percentage": 16.18, "elapsed_time": "2:10:09", "remaining_time": "11:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 4438, "loss": 0.1821, "learning_rate": 4.830506969672758e-06, "epoch": 0.1619962260962627, "percentage": 16.2, "elapsed_time": "2:10:20", "remaining_time": "11:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 4438, "loss": 0.2017, "learning_rate": 4.829832071790972e-06, "epoch": 0.16222153378207113, "percentage": 16.22, "elapsed_time": "2:10:31", "remaining_time": "11:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 4438, "loss": 0.1979, "learning_rate": 4.829155880240279e-06, "epoch": 0.16244684146787958, "percentage": 16.25, "elapsed_time": "2:10:42", "remaining_time": "11:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 4438, "loss": 0.1821, "learning_rate": 4.828478395396143e-06, "epoch": 0.162672149153688, "percentage": 16.27, "elapsed_time": "2:10:51", "remaining_time": "11:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 4438, "loss": 0.1787, "learning_rate": 4.8277996176347465e-06, "epoch": 0.16289745683949644, "percentage": 16.29, "elapsed_time": "2:11:01", "remaining_time": "11:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.827119547332988e-06, "epoch": 0.16312276452530486, "percentage": 16.31, "elapsed_time": "2:11:12", "remaining_time": "11:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 4438, "loss": 0.1831, "learning_rate": 4.826438184868486e-06, "epoch": 0.1633480722111133, "percentage": 16.34, "elapsed_time": "2:11:24", "remaining_time": "11:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 4438, "loss": 0.1856, "learning_rate": 4.825755530619576e-06, "epoch": 0.16357337989692172, "percentage": 16.36, "elapsed_time": "2:11:35", "remaining_time": "11:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.825071584965308e-06, "epoch": 0.16379868758273017, "percentage": 16.38, "elapsed_time": "2:11:46", "remaining_time": "11:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 4438, "loss": 0.1974, "learning_rate": 4.824386348285456e-06, "epoch": 0.16402399526853859, "percentage": 16.4, "elapsed_time": "2:11:59", "remaining_time": "11:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 4438, "loss": 0.1943, "learning_rate": 4.823699820960502e-06, "epoch": 0.16424930295434703, "percentage": 16.43, "elapsed_time": "2:12:10", "remaining_time": "11:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 4438, "loss": 0.185, "learning_rate": 4.8230120033716525e-06, "epoch": 0.16447461064015545, "percentage": 16.45, "elapsed_time": "2:12:19", "remaining_time": "11:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 4438, "loss": 0.1761, "learning_rate": 4.822322895900825e-06, "epoch": 0.1646999183259639, "percentage": 16.47, "elapsed_time": "2:12:30", "remaining_time": "11:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 4438, "loss": 0.1772, "learning_rate": 4.821632498930656e-06, "epoch": 0.1649252260117723, "percentage": 16.49, "elapsed_time": "2:12:41", "remaining_time": "11:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 4438, "loss": 0.1797, "learning_rate": 4.820940812844496e-06, "epoch": 0.16515053369758076, "percentage": 16.52, "elapsed_time": "2:12:51", "remaining_time": "11:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 4438, "loss": 0.1853, "learning_rate": 4.820247838026414e-06, "epoch": 0.16537584138338918, "percentage": 16.54, "elapsed_time": "2:13:02", "remaining_time": "11:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.819553574861192e-06, "epoch": 0.16560114906919762, "percentage": 16.56, "elapsed_time": "2:13:13", "remaining_time": "11:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 4438, "loss": 0.1774, "learning_rate": 4.81885802373433e-06, "epoch": 0.16582645675500607, "percentage": 16.58, "elapsed_time": "2:13:24", "remaining_time": "11:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 4438, "loss": 0.2033, "learning_rate": 4.818161185032039e-06, "epoch": 0.1660517644408145, "percentage": 16.61, "elapsed_time": "2:13:34", "remaining_time": "11:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 4438, "loss": 0.2032, "learning_rate": 4.8174630591412495e-06, "epoch": 0.16627707212662293, "percentage": 16.63, "elapsed_time": "2:13:45", "remaining_time": "11:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 4438, "loss": 0.1965, "learning_rate": 4.816763646449605e-06, "epoch": 0.16650237981243135, "percentage": 16.65, "elapsed_time": "2:13:57", "remaining_time": "11:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 4438, "loss": 0.1826, "learning_rate": 4.816062947345462e-06, "epoch": 0.1667276874982398, "percentage": 16.67, "elapsed_time": "2:14:07", "remaining_time": "11:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 4438, "loss": 0.2072, "learning_rate": 4.815360962217894e-06, "epoch": 0.16695299518404821, "percentage": 16.7, "elapsed_time": "2:14:19", "remaining_time": "11:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 4438, "loss": 0.1865, "learning_rate": 4.814657691456685e-06, "epoch": 0.16717830286985666, "percentage": 16.72, "elapsed_time": "2:14:28", "remaining_time": "11:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 4438, "loss": 0.1976, "learning_rate": 4.813953135452338e-06, "epoch": 0.16740361055566508, "percentage": 16.74, "elapsed_time": "2:14:39", "remaining_time": "11:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 4438, "loss": 0.1905, "learning_rate": 4.813247294596065e-06, "epoch": 0.16762891824147352, "percentage": 16.76, "elapsed_time": "2:14:49", "remaining_time": "11:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 4438, "loss": 0.1876, "learning_rate": 4.812540169279793e-06, "epoch": 0.16785422592728194, "percentage": 16.79, "elapsed_time": "2:15:02", "remaining_time": "11:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 4438, "loss": 0.1856, "learning_rate": 4.8118317598961625e-06, "epoch": 0.1680795336130904, "percentage": 16.81, "elapsed_time": "2:15:12", "remaining_time": "11:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 4438, "loss": 0.1807, "learning_rate": 4.811122066838527e-06, "epoch": 0.1683048412988988, "percentage": 16.83, "elapsed_time": "2:15:23", "remaining_time": "11:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 4438, "loss": 0.1826, "learning_rate": 4.810411090500952e-06, "epoch": 0.16853014898470725, "percentage": 16.85, "elapsed_time": "2:15:33", "remaining_time": "11:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 4438, "loss": 0.1755, "learning_rate": 4.809698831278217e-06, "epoch": 0.16875545667051567, "percentage": 16.88, "elapsed_time": "2:15:44", "remaining_time": "11:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 4438, "loss": 0.2149, "learning_rate": 4.808985289565813e-06, "epoch": 0.16898076435632411, "percentage": 16.9, "elapsed_time": "2:15:55", "remaining_time": "11:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 4438, "loss": 0.1962, "learning_rate": 4.808270465759943e-06, "epoch": 0.16920607204213253, "percentage": 16.92, "elapsed_time": "2:16:05", "remaining_time": "11:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 4438, "loss": 0.2046, "learning_rate": 4.807554360257522e-06, "epoch": 0.16943137972794098, "percentage": 16.94, "elapsed_time": "2:16:15", "remaining_time": "11:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 4438, "loss": 0.1921, "learning_rate": 4.806836973456175e-06, "epoch": 0.1696566874137494, "percentage": 16.97, "elapsed_time": "2:16:25", "remaining_time": "11:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 4438, "loss": 0.1759, "learning_rate": 4.8061183057542424e-06, "epoch": 0.16988199509955784, "percentage": 16.99, "elapsed_time": "2:16:36", "remaining_time": "11:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 4438, "loss": 0.1796, "learning_rate": 4.8053983575507735e-06, "epoch": 0.17010730278536626, "percentage": 17.01, "elapsed_time": "2:16:45", "remaining_time": "11:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 4438, "loss": 0.189, "learning_rate": 4.804677129245527e-06, "epoch": 0.1703326104711747, "percentage": 17.03, "elapsed_time": "2:16:56", "remaining_time": "11:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 4438, "loss": 0.176, "learning_rate": 4.8039546212389765e-06, "epoch": 0.17055791815698312, "percentage": 17.06, "elapsed_time": "2:17:07", "remaining_time": "11:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.803230833932302e-06, "epoch": 0.17078322584279157, "percentage": 17.08, "elapsed_time": "2:17:18", "remaining_time": "11:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 4438, "loss": 0.1807, "learning_rate": 4.802505767727395e-06, "epoch": 0.1710085335286, "percentage": 17.1, "elapsed_time": "2:17:27", "remaining_time": "11:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 4438, "loss": 0.1971, "learning_rate": 4.80177942302686e-06, "epoch": 0.17123384121440843, "percentage": 17.12, "elapsed_time": "2:17:39", "remaining_time": "11:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 4438, "loss": 0.1786, "learning_rate": 4.8010518002340065e-06, "epoch": 0.17145914890021685, "percentage": 17.15, "elapsed_time": "2:17:49", "remaining_time": "11:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 4438, "loss": 0.1711, "learning_rate": 4.800322899752859e-06, "epoch": 0.1716844565860253, "percentage": 17.17, "elapsed_time": "2:17:59", "remaining_time": "11:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 4438, "loss": 0.1981, "learning_rate": 4.799592721988147e-06, "epoch": 0.17190976427183371, "percentage": 17.19, "elapsed_time": "2:18:10", "remaining_time": "11:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 4438, "loss": 0.176, "learning_rate": 4.798861267345312e-06, "epoch": 0.17213507195764216, "percentage": 17.21, "elapsed_time": "2:18:22", "remaining_time": "11:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 4438, "loss": 0.1901, "learning_rate": 4.798128536230502e-06, "epoch": 0.17236037964345058, "percentage": 17.24, "elapsed_time": "2:18:33", "remaining_time": "11:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 4438, "loss": 0.191, "learning_rate": 4.797394529050577e-06, "epoch": 0.17258568732925902, "percentage": 17.26, "elapsed_time": "2:18:45", "remaining_time": "11:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 4438, "loss": 0.183, "learning_rate": 4.796659246213103e-06, "epoch": 0.17281099501506744, "percentage": 17.28, "elapsed_time": "2:18:55", "remaining_time": "11:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 4438, "loss": 0.1714, "learning_rate": 4.795922688126355e-06, "epoch": 0.1730363027008759, "percentage": 17.31, "elapsed_time": "2:19:07", "remaining_time": "11:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 4438, "loss": 0.2035, "learning_rate": 4.795184855199316e-06, "epoch": 0.1732616103866843, "percentage": 17.33, "elapsed_time": "2:19:18", "remaining_time": "11:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 4438, "loss": 0.1964, "learning_rate": 4.794445747841679e-06, "epoch": 0.17348691807249275, "percentage": 17.35, "elapsed_time": "2:19:28", "remaining_time": "11:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 4438, "loss": 0.194, "learning_rate": 4.79370536646384e-06, "epoch": 0.17371222575830117, "percentage": 17.37, "elapsed_time": "2:19:39", "remaining_time": "11:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 4438, "loss": 0.1822, "learning_rate": 4.792963711476908e-06, "epoch": 0.17393753344410962, "percentage": 17.4, "elapsed_time": "2:19:50", "remaining_time": "11:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 4438, "loss": 0.1776, "learning_rate": 4.792220783292694e-06, "epoch": 0.17416284112991803, "percentage": 17.42, "elapsed_time": "2:20:01", "remaining_time": "11:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 4438, "loss": 0.1872, "learning_rate": 4.791476582323719e-06, "epoch": 0.17438814881572648, "percentage": 17.44, "elapsed_time": "2:20:12", "remaining_time": "11:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 4438, "loss": 0.1906, "learning_rate": 4.790731108983211e-06, "epoch": 0.1746134565015349, "percentage": 17.46, "elapsed_time": "2:20:23", "remaining_time": "11:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.7899843636851014e-06, "epoch": 0.17483876418734334, "percentage": 17.49, "elapsed_time": "2:20:34", "remaining_time": "11:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.789236346844034e-06, "epoch": 0.17506407187315176, "percentage": 17.51, "elapsed_time": "2:20:44", "remaining_time": "11:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 4438, "loss": 0.1873, "learning_rate": 4.78848705887535e-06, "epoch": 0.1752893795589602, "percentage": 17.53, "elapsed_time": "2:20:55", "remaining_time": "11:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 4438, "loss": 0.1862, "learning_rate": 4.7877365001951045e-06, "epoch": 0.17551468724476862, "percentage": 17.55, "elapsed_time": "2:21:06", "remaining_time": "11:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 4438, "loss": 0.1706, "learning_rate": 4.786984671220053e-06, "epoch": 0.17573999493057707, "percentage": 17.58, "elapsed_time": "2:21:16", "remaining_time": "11:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 4438, "loss": 0.1959, "learning_rate": 4.786231572367659e-06, "epoch": 0.1759653026163855, "percentage": 17.6, "elapsed_time": "2:21:28", "remaining_time": "11:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 4438, "loss": 0.1828, "learning_rate": 4.785477204056089e-06, "epoch": 0.17619061030219393, "percentage": 17.62, "elapsed_time": "2:21:38", "remaining_time": "11:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 4438, "loss": 0.1914, "learning_rate": 4.784721566704217e-06, "epoch": 0.17641591798800235, "percentage": 17.64, "elapsed_time": "2:21:48", "remaining_time": "11:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 4438, "loss": 0.1867, "learning_rate": 4.78396466073162e-06, "epoch": 0.1766412256738108, "percentage": 17.67, "elapsed_time": "2:21:59", "remaining_time": "11:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 4438, "loss": 0.1845, "learning_rate": 4.7832064865585795e-06, "epoch": 0.17686653335961924, "percentage": 17.69, "elapsed_time": "2:22:10", "remaining_time": "11:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 4438, "loss": 0.1798, "learning_rate": 4.78244704460608e-06, "epoch": 0.17709184104542766, "percentage": 17.71, "elapsed_time": "2:22:19", "remaining_time": "11:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 4438, "loss": 0.1799, "learning_rate": 4.781686335295813e-06, "epoch": 0.1773171487312361, "percentage": 17.73, "elapsed_time": "2:22:30", "remaining_time": "11:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 4438, "loss": 0.1852, "learning_rate": 4.7809243590501725e-06, "epoch": 0.17754245641704453, "percentage": 17.76, "elapsed_time": "2:22:40", "remaining_time": "11:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 4438, "loss": 0.1891, "learning_rate": 4.780161116292254e-06, "epoch": 0.17776776410285297, "percentage": 17.78, "elapsed_time": "2:22:51", "remaining_time": "11:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 4438, "loss": 0.1896, "learning_rate": 4.779396607445858e-06, "epoch": 0.1779930717886614, "percentage": 17.8, "elapsed_time": "2:23:03", "remaining_time": "11:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 4438, "loss": 0.1873, "learning_rate": 4.778630832935489e-06, "epoch": 0.17821837947446983, "percentage": 17.82, "elapsed_time": "2:23:13", "remaining_time": "11:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 4438, "loss": 0.1792, "learning_rate": 4.777863793186351e-06, "epoch": 0.17844368716027825, "percentage": 17.85, "elapsed_time": "2:23:24", "remaining_time": "11:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.777095488624355e-06, "epoch": 0.1786689948460867, "percentage": 17.87, "elapsed_time": "2:23:34", "remaining_time": "10:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 4438, "loss": 0.2033, "learning_rate": 4.776325919676109e-06, "epoch": 0.17889430253189512, "percentage": 17.89, "elapsed_time": "2:23:45", "remaining_time": "10:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 4438, "loss": 0.1792, "learning_rate": 4.775555086768929e-06, "epoch": 0.17911961021770356, "percentage": 17.91, "elapsed_time": "2:23:54", "remaining_time": "10:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 4438, "loss": 0.1764, "learning_rate": 4.774782990330828e-06, "epoch": 0.17934491790351198, "percentage": 17.94, "elapsed_time": "2:24:05", "remaining_time": "10:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 4438, "loss": 0.1987, "learning_rate": 4.774009630790522e-06, "epoch": 0.17957022558932043, "percentage": 17.96, "elapsed_time": "2:24:16", "remaining_time": "10:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 4438, "loss": 0.1646, "learning_rate": 4.77323500857743e-06, "epoch": 0.17979553327512884, "percentage": 17.98, "elapsed_time": "2:24:26", "remaining_time": "10:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 4438, "loss": 0.1894, "learning_rate": 4.77245912412167e-06, "epoch": 0.1800208409609373, "percentage": 18.0, "elapsed_time": "2:24:36", "remaining_time": "10:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 4438, "loss": 0.1812, "learning_rate": 4.771681977854062e-06, "epoch": 0.1802461486467457, "percentage": 18.03, "elapsed_time": "2:24:49", "remaining_time": "10:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 4438, "loss": 0.1834, "learning_rate": 4.7709035702061275e-06, "epoch": 0.18047145633255415, "percentage": 18.05, "elapsed_time": "2:24:59", "remaining_time": "10:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 4438, "loss": 0.1882, "learning_rate": 4.770123901610085e-06, "epoch": 0.18069676401836257, "percentage": 18.07, "elapsed_time": "2:25:10", "remaining_time": "10:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 4438, "loss": 0.1823, "learning_rate": 4.7693429724988565e-06, "epoch": 0.18092207170417102, "percentage": 18.09, "elapsed_time": "2:25:19", "remaining_time": "10:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 4438, "loss": 0.193, "learning_rate": 4.768560783306064e-06, "epoch": 0.18114737938997943, "percentage": 18.12, "elapsed_time": "2:25:28", "remaining_time": "10:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 4438, "loss": 0.1768, "learning_rate": 4.767777334466025e-06, "epoch": 0.18137268707578788, "percentage": 18.14, "elapsed_time": "2:25:39", "remaining_time": "10:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 4438, "loss": 0.1843, "learning_rate": 4.7669926264137625e-06, "epoch": 0.1815979947615963, "percentage": 18.16, "elapsed_time": "2:25:50", "remaining_time": "10:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 4438, "loss": 0.1675, "learning_rate": 4.766206659584994e-06, "epoch": 0.18182330244740474, "percentage": 18.18, "elapsed_time": "2:26:01", "remaining_time": "10:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 4438, "loss": 0.1899, "learning_rate": 4.765419434416138e-06, "epoch": 0.18204861013321316, "percentage": 18.21, "elapsed_time": "2:26:12", "remaining_time": "10:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 4438, "loss": 0.2051, "learning_rate": 4.7646309513443115e-06, "epoch": 0.1822739178190216, "percentage": 18.23, "elapsed_time": "2:26:24", "remaining_time": "10:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 4438, "loss": 0.1792, "learning_rate": 4.763841210807329e-06, "epoch": 0.18249922550483003, "percentage": 18.25, "elapsed_time": "2:26:34", "remaining_time": "10:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 4438, "loss": 0.1863, "learning_rate": 4.763050213243705e-06, "epoch": 0.18272453319063847, "percentage": 18.27, "elapsed_time": "2:26:45", "remaining_time": "10:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 4438, "loss": 0.199, "learning_rate": 4.762257959092651e-06, "epoch": 0.1829498408764469, "percentage": 18.3, "elapsed_time": "2:26:56", "remaining_time": "10:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 4438, "loss": 0.1917, "learning_rate": 4.7614644487940755e-06, "epoch": 0.18317514856225534, "percentage": 18.32, "elapsed_time": "2:27:07", "remaining_time": "10:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 4438, "loss": 0.1946, "learning_rate": 4.760669682788584e-06, "epoch": 0.18340045624806375, "percentage": 18.34, "elapsed_time": "2:27:18", "remaining_time": "10:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 4438, "loss": 0.1999, "learning_rate": 4.759873661517484e-06, "epoch": 0.1836257639338722, "percentage": 18.36, "elapsed_time": "2:27:28", "remaining_time": "10:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 4438, "loss": 0.1691, "learning_rate": 4.759076385422773e-06, "epoch": 0.18385107161968062, "percentage": 18.39, "elapsed_time": "2:27:39", "remaining_time": "10:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 4438, "loss": 0.1863, "learning_rate": 4.75827785494715e-06, "epoch": 0.18407637930548906, "percentage": 18.41, "elapsed_time": "2:27:50", "remaining_time": "10:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 4438, "loss": 0.1705, "learning_rate": 4.7574780705340094e-06, "epoch": 0.18430168699129748, "percentage": 18.43, "elapsed_time": "2:28:00", "remaining_time": "10:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 4438, "loss": 0.1949, "learning_rate": 4.756677032627442e-06, "epoch": 0.18452699467710593, "percentage": 18.45, "elapsed_time": "2:28:13", "remaining_time": "10:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 4438, "loss": 0.1827, "learning_rate": 4.755874741672233e-06, "epoch": 0.18475230236291434, "percentage": 18.48, "elapsed_time": "2:28:22", "remaining_time": "10:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 4438, "loss": 0.1781, "learning_rate": 4.755071198113865e-06, "epoch": 0.1849776100487228, "percentage": 18.5, "elapsed_time": "2:28:35", "remaining_time": "10:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 4438, "loss": 0.1909, "learning_rate": 4.754266402398517e-06, "epoch": 0.1852029177345312, "percentage": 18.52, "elapsed_time": "2:28:47", "remaining_time": "10:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 4438, "loss": 0.1966, "learning_rate": 4.753460354973061e-06, "epoch": 0.18542822542033965, "percentage": 18.54, "elapsed_time": "2:28:58", "remaining_time": "10:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 4438, "loss": 0.1749, "learning_rate": 4.752653056285066e-06, "epoch": 0.18565353310614807, "percentage": 18.57, "elapsed_time": "2:29:08", "remaining_time": "10:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 4438, "loss": 0.1878, "learning_rate": 4.751844506782793e-06, "epoch": 0.18587884079195652, "percentage": 18.59, "elapsed_time": "2:29:18", "remaining_time": "10:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 4438, "loss": 0.1717, "learning_rate": 4.7510347069152015e-06, "epoch": 0.18610414847776494, "percentage": 18.61, "elapsed_time": "2:29:28", "remaining_time": "10:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 4438, "loss": 0.1863, "learning_rate": 4.750223657131942e-06, "epoch": 0.18632945616357338, "percentage": 18.63, "elapsed_time": "2:29:40", "remaining_time": "10:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 4438, "loss": 0.1786, "learning_rate": 4.74941135788336e-06, "epoch": 0.1865547638493818, "percentage": 18.66, "elapsed_time": "2:29:49", "remaining_time": "10:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 4438, "loss": 0.1611, "learning_rate": 4.748597809620496e-06, "epoch": 0.18678007153519025, "percentage": 18.68, "elapsed_time": "2:30:01", "remaining_time": "10:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 4438, "loss": 0.2032, "learning_rate": 4.747783012795083e-06, "epoch": 0.18700537922099866, "percentage": 18.7, "elapsed_time": "2:30:12", "remaining_time": "10:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 4438, "loss": 0.2007, "learning_rate": 4.746966967859547e-06, "epoch": 0.1872306869068071, "percentage": 18.72, "elapsed_time": "2:30:23", "remaining_time": "10:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.746149675267005e-06, "epoch": 0.18745599459261553, "percentage": 18.75, "elapsed_time": "2:30:33", "remaining_time": "10:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 4438, "loss": 0.1622, "learning_rate": 4.745331135471274e-06, "epoch": 0.18768130227842397, "percentage": 18.77, "elapsed_time": "2:30:44", "remaining_time": "10:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 4438, "loss": 0.1797, "learning_rate": 4.744511348926855e-06, "epoch": 0.18790660996423242, "percentage": 18.79, "elapsed_time": "2:30:54", "remaining_time": "10:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 4438, "loss": 0.1847, "learning_rate": 4.743690316088945e-06, "epoch": 0.18813191765004084, "percentage": 18.81, "elapsed_time": "2:31:05", "remaining_time": "10:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 4438, "loss": 0.1987, "learning_rate": 4.742868037413435e-06, "epoch": 0.18835722533584928, "percentage": 18.84, "elapsed_time": "2:31:15", "remaining_time": "10:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 4438, "loss": 0.1834, "learning_rate": 4.742044513356904e-06, "epoch": 0.1885825330216577, "percentage": 18.86, "elapsed_time": "2:31:25", "remaining_time": "10:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 4438, "loss": 0.1743, "learning_rate": 4.741219744376624e-06, "epoch": 0.18880784070746615, "percentage": 18.88, "elapsed_time": "2:31:36", "remaining_time": "10:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 4438, "loss": 0.2052, "learning_rate": 4.74039373093056e-06, "epoch": 0.18903314839327456, "percentage": 18.9, "elapsed_time": "2:31:47", "remaining_time": "10:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.739566473477365e-06, "epoch": 0.189258456079083, "percentage": 18.93, "elapsed_time": "2:31:58", "remaining_time": "10:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 4438, "loss": 0.1672, "learning_rate": 4.738737972476385e-06, "epoch": 0.18948376376489143, "percentage": 18.95, "elapsed_time": "2:32:10", "remaining_time": "10:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.737908228387656e-06, "epoch": 0.18970907145069987, "percentage": 18.97, "elapsed_time": "2:32:20", "remaining_time": "10:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 4438, "loss": 0.2027, "learning_rate": 4.737077241671904e-06, "epoch": 0.1899343791365083, "percentage": 19.0, "elapsed_time": "2:32:31", "remaining_time": "10:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 4438, "loss": 0.1826, "learning_rate": 4.736245012790543e-06, "epoch": 0.19015968682231674, "percentage": 19.02, "elapsed_time": "2:32:41", "remaining_time": "10:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 4438, "loss": 0.1958, "learning_rate": 4.735411542205681e-06, "epoch": 0.19038499450812515, "percentage": 19.04, "elapsed_time": "2:32:52", "remaining_time": "10:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 4438, "loss": 0.1788, "learning_rate": 4.734576830380113e-06, "epoch": 0.1906103021939336, "percentage": 19.06, "elapsed_time": "2:33:02", "remaining_time": "10:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 4438, "loss": 0.1736, "learning_rate": 4.733740877777322e-06, "epoch": 0.19083560987974202, "percentage": 19.09, "elapsed_time": "2:33:12", "remaining_time": "10:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 4438, "loss": 0.1917, "learning_rate": 4.732903684861482e-06, "epoch": 0.19106091756555046, "percentage": 19.11, "elapsed_time": "2:33:21", "remaining_time": "10:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 4438, "loss": 0.1876, "learning_rate": 4.732065252097455e-06, "epoch": 0.19128622525135888, "percentage": 19.13, "elapsed_time": "2:33:30", "remaining_time": "10:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.731225579950791e-06, "epoch": 0.19151153293716733, "percentage": 19.15, "elapsed_time": "2:33:41", "remaining_time": "10:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 4438, "loss": 0.1878, "learning_rate": 4.730384668887731e-06, "epoch": 0.19173684062297575, "percentage": 19.18, "elapsed_time": "2:33:53", "remaining_time": "10:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 4438, "loss": 0.1697, "learning_rate": 4.7295425193751974e-06, "epoch": 0.1919621483087842, "percentage": 19.2, "elapsed_time": "2:34:03", "remaining_time": "10:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 4438, "loss": 0.1987, "learning_rate": 4.728699131880808e-06, "epoch": 0.1921874559945926, "percentage": 19.22, "elapsed_time": "2:34:14", "remaining_time": "10:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 4438, "loss": 0.1657, "learning_rate": 4.727854506872863e-06, "epoch": 0.19241276368040106, "percentage": 19.24, "elapsed_time": "2:34:25", "remaining_time": "10:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 4438, "loss": 0.193, "learning_rate": 4.727008644820351e-06, "epoch": 0.19263807136620947, "percentage": 19.27, "elapsed_time": "2:34:35", "remaining_time": "10:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 4438, "loss": 0.172, "learning_rate": 4.726161546192949e-06, "epoch": 0.19286337905201792, "percentage": 19.29, "elapsed_time": "2:34:47", "remaining_time": "10:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 4438, "loss": 0.1962, "learning_rate": 4.725313211461018e-06, "epoch": 0.19308868673782634, "percentage": 19.31, "elapsed_time": "2:34:58", "remaining_time": "10:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 4438, "loss": 0.1835, "learning_rate": 4.724463641095606e-06, "epoch": 0.19331399442363478, "percentage": 19.33, "elapsed_time": "2:35:08", "remaining_time": "10:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 4438, "loss": 0.186, "learning_rate": 4.72361283556845e-06, "epoch": 0.1935393021094432, "percentage": 19.36, "elapsed_time": "2:35:19", "remaining_time": "10:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 4438, "loss": 0.1823, "learning_rate": 4.7227607953519686e-06, "epoch": 0.19376460979525165, "percentage": 19.38, "elapsed_time": "2:35:30", "remaining_time": "10:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 4438, "loss": 0.1848, "learning_rate": 4.7219075209192686e-06, "epoch": 0.19398991748106006, "percentage": 19.4, "elapsed_time": "2:35:40", "remaining_time": "10:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 4438, "loss": 0.1744, "learning_rate": 4.721053012744142e-06, "epoch": 0.1942152251668685, "percentage": 19.42, "elapsed_time": "2:35:50", "remaining_time": "10:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 4438, "loss": 0.1861, "learning_rate": 4.720197271301064e-06, "epoch": 0.19444053285267693, "percentage": 19.45, "elapsed_time": "2:36:02", "remaining_time": "10:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 4438, "loss": 0.1767, "learning_rate": 4.719340297065198e-06, "epoch": 0.19466584053848537, "percentage": 19.47, "elapsed_time": "2:36:15", "remaining_time": "10:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 4438, "loss": 0.1892, "learning_rate": 4.718482090512389e-06, "epoch": 0.1948911482242938, "percentage": 19.49, "elapsed_time": "2:36:26", "remaining_time": "10:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 4438, "loss": 0.1634, "learning_rate": 4.717622652119166e-06, "epoch": 0.19511645591010224, "percentage": 19.51, "elapsed_time": "2:36:36", "remaining_time": "10:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 4438, "loss": 0.1858, "learning_rate": 4.716761982362744e-06, "epoch": 0.19534176359591066, "percentage": 19.54, "elapsed_time": "2:36:48", "remaining_time": "10:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 4438, "loss": 0.1845, "learning_rate": 4.715900081721021e-06, "epoch": 0.1955670712817191, "percentage": 19.56, "elapsed_time": "2:37:00", "remaining_time": "10:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 4438, "loss": 0.1804, "learning_rate": 4.715036950672578e-06, "epoch": 0.19579237896752752, "percentage": 19.58, "elapsed_time": "2:37:11", "remaining_time": "10:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 4438, "loss": 0.1884, "learning_rate": 4.71417258969668e-06, "epoch": 0.19601768665333597, "percentage": 19.6, "elapsed_time": "2:37:22", "remaining_time": "10:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.713306999273273e-06, "epoch": 0.19624299433914438, "percentage": 19.63, "elapsed_time": "2:37:31", "remaining_time": "10:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 4438, "loss": 0.1602, "learning_rate": 4.712440179882989e-06, "epoch": 0.19646830202495283, "percentage": 19.65, "elapsed_time": "2:37:42", "remaining_time": "10:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 4438, "loss": 0.1819, "learning_rate": 4.711572132007139e-06, "epoch": 0.19669360971076125, "percentage": 19.67, "elapsed_time": "2:37:54", "remaining_time": "10:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 4438, "loss": 0.1699, "learning_rate": 4.710702856127718e-06, "epoch": 0.1969189173965697, "percentage": 19.69, "elapsed_time": "2:38:05", "remaining_time": "10:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 4438, "loss": 0.166, "learning_rate": 4.709832352727404e-06, "epoch": 0.1971442250823781, "percentage": 19.72, "elapsed_time": "2:38:16", "remaining_time": "10:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 4438, "loss": 0.2012, "learning_rate": 4.708960622289552e-06, "epoch": 0.19736953276818656, "percentage": 19.74, "elapsed_time": "2:38:26", "remaining_time": "10:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 4438, "loss": 0.1913, "learning_rate": 4.708087665298204e-06, "epoch": 0.19759484045399497, "percentage": 19.76, "elapsed_time": "2:38:38", "remaining_time": "10:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 4438, "loss": 0.1863, "learning_rate": 4.70721348223808e-06, "epoch": 0.19782014813980342, "percentage": 19.78, "elapsed_time": "2:38:49", "remaining_time": "10:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 4438, "loss": 0.1779, "learning_rate": 4.706338073594581e-06, "epoch": 0.19804545582561184, "percentage": 19.81, "elapsed_time": "2:39:00", "remaining_time": "10:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 4438, "loss": 0.1966, "learning_rate": 4.705461439853789e-06, "epoch": 0.19827076351142028, "percentage": 19.83, "elapsed_time": "2:39:11", "remaining_time": "10:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 4438, "loss": 0.1745, "learning_rate": 4.704583581502465e-06, "epoch": 0.1984960711972287, "percentage": 19.85, "elapsed_time": "2:39:22", "remaining_time": "10:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 4438, "loss": 0.202, "learning_rate": 4.703704499028052e-06, "epoch": 0.19872137888303715, "percentage": 19.87, "elapsed_time": "2:39:33", "remaining_time": "10:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 4438, "loss": 0.1739, "learning_rate": 4.702824192918672e-06, "epoch": 0.1989466865688456, "percentage": 19.9, "elapsed_time": "2:39:43", "remaining_time": "10:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 4438, "loss": 0.1787, "learning_rate": 4.701942663663126e-06, "epoch": 0.199171994254654, "percentage": 19.92, "elapsed_time": "2:39:55", "remaining_time": "10:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 4438, "loss": 0.178, "learning_rate": 4.7010599117508936e-06, "epoch": 0.19939730194046246, "percentage": 19.94, "elapsed_time": "2:40:04", "remaining_time": "10:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 4438, "loss": 0.1904, "learning_rate": 4.700175937672134e-06, "epoch": 0.19962260962627087, "percentage": 19.96, "elapsed_time": "2:40:15", "remaining_time": "10:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 4438, "loss": 0.1787, "learning_rate": 4.699290741917686e-06, "epoch": 0.19984791731207932, "percentage": 19.99, "elapsed_time": "2:40:25", "remaining_time": "10:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 4438, "loss": 0.1806, "learning_rate": 4.698404324979066e-06, "epoch": 0.20007322499788774, "percentage": 20.01, "elapsed_time": "2:40:35", "remaining_time": "10:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.697516687348466e-06, "epoch": 0.20029853268369618, "percentage": 20.03, "elapsed_time": "2:40:45", "remaining_time": "10:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 4438, "loss": 0.1929, "learning_rate": 4.696627829518761e-06, "epoch": 0.2005238403695046, "percentage": 20.05, "elapsed_time": "2:40:57", "remaining_time": "10:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 4438, "loss": 0.1808, "learning_rate": 4.695737751983499e-06, "epoch": 0.20074914805531305, "percentage": 20.08, "elapsed_time": "2:41:07", "remaining_time": "10:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 4438, "loss": 0.1819, "learning_rate": 4.6948464552369075e-06, "epoch": 0.20097445574112147, "percentage": 20.1, "elapsed_time": "2:41:17", "remaining_time": "10:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 4438, "loss": 0.1766, "learning_rate": 4.69395393977389e-06, "epoch": 0.2011997634269299, "percentage": 20.12, "elapsed_time": "2:41:27", "remaining_time": "10:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 4438, "loss": 0.1771, "learning_rate": 4.693060206090028e-06, "epoch": 0.20142507111273833, "percentage": 20.14, "elapsed_time": "2:41:38", "remaining_time": "10:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 4438, "loss": 0.1876, "learning_rate": 4.692165254681576e-06, "epoch": 0.20165037879854678, "percentage": 20.17, "elapsed_time": "2:41:48", "remaining_time": "10:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 4438, "loss": 0.1789, "learning_rate": 4.69126908604547e-06, "epoch": 0.2018756864843552, "percentage": 20.19, "elapsed_time": "2:41:58", "remaining_time": "10:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 4438, "loss": 0.1907, "learning_rate": 4.690371700679317e-06, "epoch": 0.20210099417016364, "percentage": 20.21, "elapsed_time": "2:42:08", "remaining_time": "10:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 4438, "loss": 0.1878, "learning_rate": 4.689473099081403e-06, "epoch": 0.20232630185597206, "percentage": 20.23, "elapsed_time": "2:42:19", "remaining_time": "10:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 4438, "loss": 0.1636, "learning_rate": 4.688573281750688e-06, "epoch": 0.2025516095417805, "percentage": 20.26, "elapsed_time": "2:42:29", "remaining_time": "10:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 4438, "loss": 0.179, "learning_rate": 4.687672249186805e-06, "epoch": 0.20277691722758892, "percentage": 20.28, "elapsed_time": "2:42:39", "remaining_time": "10:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 4438, "loss": 0.1698, "learning_rate": 4.686770001890067e-06, "epoch": 0.20300222491339737, "percentage": 20.3, "elapsed_time": "2:42:49", "remaining_time": "10:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 4438, "loss": 0.1911, "learning_rate": 4.685866540361456e-06, "epoch": 0.20322753259920578, "percentage": 20.32, "elapsed_time": "2:42:59", "remaining_time": "10:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.684961865102631e-06, "epoch": 0.20345284028501423, "percentage": 20.35, "elapsed_time": "2:43:11", "remaining_time": "10:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 4438, "loss": 0.1669, "learning_rate": 4.684055976615924e-06, "epoch": 0.20367814797082265, "percentage": 20.37, "elapsed_time": "2:43:20", "remaining_time": "10:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 4438, "loss": 0.1836, "learning_rate": 4.683148875404343e-06, "epoch": 0.2039034556566311, "percentage": 20.39, "elapsed_time": "2:43:30", "remaining_time": "10:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 4438, "loss": 0.1843, "learning_rate": 4.682240561971565e-06, "epoch": 0.2041287633424395, "percentage": 20.41, "elapsed_time": "2:43:42", "remaining_time": "10:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 4438, "loss": 0.1886, "learning_rate": 4.681331036821945e-06, "epoch": 0.20435407102824796, "percentage": 20.44, "elapsed_time": "2:43:53", "remaining_time": "10:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 4438, "loss": 0.1927, "learning_rate": 4.680420300460505e-06, "epoch": 0.20457937871405638, "percentage": 20.46, "elapsed_time": "2:44:05", "remaining_time": "10:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 4438, "loss": 0.1687, "learning_rate": 4.679508353392946e-06, "epoch": 0.20480468639986482, "percentage": 20.48, "elapsed_time": "2:44:16", "remaining_time": "10:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 4438, "loss": 0.1672, "learning_rate": 4.678595196125638e-06, "epoch": 0.20502999408567324, "percentage": 20.5, "elapsed_time": "2:44:26", "remaining_time": "10:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.677680829165623e-06, "epoch": 0.20525530177148169, "percentage": 20.53, "elapsed_time": "2:44:36", "remaining_time": "10:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 4438, "loss": 0.1743, "learning_rate": 4.676765253020613e-06, "epoch": 0.2054806094572901, "percentage": 20.55, "elapsed_time": "2:44:46", "remaining_time": "10:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 4438, "loss": 0.2006, "learning_rate": 4.675848468198995e-06, "epoch": 0.20570591714309855, "percentage": 20.57, "elapsed_time": "2:44:58", "remaining_time": "10:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 4438, "loss": 0.1762, "learning_rate": 4.674930475209827e-06, "epoch": 0.20593122482890697, "percentage": 20.59, "elapsed_time": "2:45:07", "remaining_time": "10:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 4438, "loss": 0.1684, "learning_rate": 4.674011274562833e-06, "epoch": 0.2061565325147154, "percentage": 20.62, "elapsed_time": "2:45:19", "remaining_time": "10:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 4438, "loss": 0.182, "learning_rate": 4.673090866768412e-06, "epoch": 0.20638184020052383, "percentage": 20.64, "elapsed_time": "2:45:29", "remaining_time": "10:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 4438, "loss": 0.1649, "learning_rate": 4.672169252337633e-06, "epoch": 0.20660714788633228, "percentage": 20.66, "elapsed_time": "2:45:39", "remaining_time": "10:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 4438, "loss": 0.1817, "learning_rate": 4.671246431782234e-06, "epoch": 0.2068324555721407, "percentage": 20.68, "elapsed_time": "2:45:50", "remaining_time": "10:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 4438, "loss": 0.1723, "learning_rate": 4.670322405614621e-06, "epoch": 0.20705776325794914, "percentage": 20.71, "elapsed_time": "2:46:00", "remaining_time": "10:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 4438, "loss": 0.2042, "learning_rate": 4.669397174347874e-06, "epoch": 0.20728307094375756, "percentage": 20.73, "elapsed_time": "2:46:11", "remaining_time": "10:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 4438, "loss": 0.1862, "learning_rate": 4.668470738495738e-06, "epoch": 0.207508378629566, "percentage": 20.75, "elapsed_time": "2:46:22", "remaining_time": "10:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 4438, "loss": 0.1884, "learning_rate": 4.667543098572627e-06, "epoch": 0.20773368631537442, "percentage": 20.78, "elapsed_time": "2:46:32", "remaining_time": "10:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 4438, "loss": 0.1711, "learning_rate": 4.6666142550936286e-06, "epoch": 0.20795899400118287, "percentage": 20.8, "elapsed_time": "2:46:43", "remaining_time": "10:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 4438, "loss": 0.19, "learning_rate": 4.665684208574492e-06, "epoch": 0.20818430168699129, "percentage": 20.82, "elapsed_time": "2:46:54", "remaining_time": "10:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 4438, "loss": 0.1742, "learning_rate": 4.664752959531638e-06, "epoch": 0.20840960937279973, "percentage": 20.84, "elapsed_time": "2:47:05", "remaining_time": "10:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 4438, "loss": 0.1783, "learning_rate": 4.6638205084821544e-06, "epoch": 0.20863491705860815, "percentage": 20.87, "elapsed_time": "2:47:15", "remaining_time": "10:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 4438, "loss": 0.1802, "learning_rate": 4.6628868559437964e-06, "epoch": 0.2088602247444166, "percentage": 20.89, "elapsed_time": "2:47:26", "remaining_time": "10:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 4438, "loss": 0.2069, "learning_rate": 4.661952002434988e-06, "epoch": 0.209085532430225, "percentage": 20.91, "elapsed_time": "2:47:38", "remaining_time": "10:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 4438, "loss": 0.189, "learning_rate": 4.661015948474815e-06, "epoch": 0.20931084011603346, "percentage": 20.93, "elapsed_time": "2:47:48", "remaining_time": "10:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 4438, "loss": 0.1798, "learning_rate": 4.660078694583037e-06, "epoch": 0.20953614780184188, "percentage": 20.96, "elapsed_time": "2:47:59", "remaining_time": "10:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 4438, "loss": 0.1813, "learning_rate": 4.659140241280075e-06, "epoch": 0.20976145548765032, "percentage": 20.98, "elapsed_time": "2:48:10", "remaining_time": "10:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 4438, "loss": 0.1841, "learning_rate": 4.658200589087016e-06, "epoch": 0.20998676317345877, "percentage": 21.0, "elapsed_time": "2:48:20", "remaining_time": "10:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 4438, "loss": 0.1905, "learning_rate": 4.657259738525615e-06, "epoch": 0.21021207085926719, "percentage": 21.02, "elapsed_time": "2:48:30", "remaining_time": "10:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 4438, "loss": 0.1702, "learning_rate": 4.656317690118291e-06, "epoch": 0.21043737854507563, "percentage": 21.05, "elapsed_time": "2:48:42", "remaining_time": "10:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 4438, "loss": 0.1758, "learning_rate": 4.655374444388127e-06, "epoch": 0.21066268623088405, "percentage": 21.07, "elapsed_time": "2:48:52", "remaining_time": "10:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 4438, "loss": 0.1898, "learning_rate": 4.654430001858874e-06, "epoch": 0.2108879939166925, "percentage": 21.09, "elapsed_time": "2:49:02", "remaining_time": "10:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 4438, "loss": 0.1893, "learning_rate": 4.653484363054947e-06, "epoch": 0.2111133016025009, "percentage": 21.11, "elapsed_time": "2:49:14", "remaining_time": "10:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.6525375285014195e-06, "epoch": 0.21133860928830936, "percentage": 21.14, "elapsed_time": "2:49:26", "remaining_time": "10:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.651589498724037e-06, "epoch": 0.21156391697411778, "percentage": 21.16, "elapsed_time": "2:49:37", "remaining_time": "10:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 4438, "loss": 0.194, "learning_rate": 4.650640274249205e-06, "epoch": 0.21178922465992622, "percentage": 21.18, "elapsed_time": "2:49:47", "remaining_time": "10:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 4438, "loss": 0.1748, "learning_rate": 4.649689855603992e-06, "epoch": 0.21201453234573464, "percentage": 21.2, "elapsed_time": "2:49:58", "remaining_time": "10:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 4438, "loss": 0.1824, "learning_rate": 4.648738243316128e-06, "epoch": 0.2122398400315431, "percentage": 21.23, "elapsed_time": "2:50:08", "remaining_time": "10:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 4438, "loss": 0.1787, "learning_rate": 4.647785437914011e-06, "epoch": 0.2124651477173515, "percentage": 21.25, "elapsed_time": "2:50:19", "remaining_time": "10:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 4438, "loss": 0.1721, "learning_rate": 4.646831439926696e-06, "epoch": 0.21269045540315995, "percentage": 21.27, "elapsed_time": "2:50:30", "remaining_time": "10:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.645876249883903e-06, "epoch": 0.21291576308896837, "percentage": 21.29, "elapsed_time": "2:50:39", "remaining_time": "10:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 4438, "loss": 0.1609, "learning_rate": 4.644919868316014e-06, "epoch": 0.21314107077477681, "percentage": 21.32, "elapsed_time": "2:50:50", "remaining_time": "10:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 4438, "loss": 0.203, "learning_rate": 4.643962295754073e-06, "epoch": 0.21336637846058523, "percentage": 21.34, "elapsed_time": "2:51:01", "remaining_time": "10:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 4438, "loss": 0.1719, "learning_rate": 4.643003532729783e-06, "epoch": 0.21359168614639368, "percentage": 21.36, "elapsed_time": "2:51:12", "remaining_time": "10:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 4438, "loss": 0.1795, "learning_rate": 4.642043579775509e-06, "epoch": 0.2138169938322021, "percentage": 21.38, "elapsed_time": "2:51:23", "remaining_time": "10:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 4438, "loss": 0.1797, "learning_rate": 4.641082437424277e-06, "epoch": 0.21404230151801054, "percentage": 21.41, "elapsed_time": "2:51:35", "remaining_time": "10:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.640120106209776e-06, "epoch": 0.21426760920381896, "percentage": 21.43, "elapsed_time": "2:51:45", "remaining_time": "10:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 4438, "loss": 0.1879, "learning_rate": 4.639156586666349e-06, "epoch": 0.2144929168896274, "percentage": 21.45, "elapsed_time": "2:51:55", "remaining_time": "10:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 4438, "loss": 0.2032, "learning_rate": 4.638191879329005e-06, "epoch": 0.21471822457543582, "percentage": 21.47, "elapsed_time": "2:52:07", "remaining_time": "10:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 4438, "loss": 0.1737, "learning_rate": 4.63722598473341e-06, "epoch": 0.21494353226124427, "percentage": 21.5, "elapsed_time": "2:52:16", "remaining_time": "10:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 4438, "loss": 0.179, "learning_rate": 4.636258903415888e-06, "epoch": 0.2151688399470527, "percentage": 21.52, "elapsed_time": "2:52:26", "remaining_time": "10:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 4438, "loss": 0.1827, "learning_rate": 4.635290635913425e-06, "epoch": 0.21539414763286113, "percentage": 21.54, "elapsed_time": "2:52:36", "remaining_time": "10:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 4438, "loss": 0.199, "learning_rate": 4.63432118276366e-06, "epoch": 0.21561945531866955, "percentage": 21.56, "elapsed_time": "2:52:47", "remaining_time": "10:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 4438, "loss": 0.1866, "learning_rate": 4.633350544504899e-06, "epoch": 0.215844763004478, "percentage": 21.59, "elapsed_time": "2:52:58", "remaining_time": "10:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 4438, "loss": 0.1826, "learning_rate": 4.632378721676098e-06, "epoch": 0.21607007069028641, "percentage": 21.61, "elapsed_time": "2:53:08", "remaining_time": "10:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 4438, "loss": 0.1761, "learning_rate": 4.6314057148168765e-06, "epoch": 0.21629537837609486, "percentage": 21.63, "elapsed_time": "2:53:18", "remaining_time": "10:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 4438, "loss": 0.1825, "learning_rate": 4.6304315244675065e-06, "epoch": 0.21652068606190328, "percentage": 21.65, "elapsed_time": "2:53:27", "remaining_time": "10:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 4438, "loss": 0.1895, "learning_rate": 4.629456151168921e-06, "epoch": 0.21674599374771172, "percentage": 21.68, "elapsed_time": "2:53:38", "remaining_time": "10:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 4438, "loss": 0.1809, "learning_rate": 4.628479595462708e-06, "epoch": 0.21697130143352014, "percentage": 21.7, "elapsed_time": "2:53:48", "remaining_time": "10:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 4438, "loss": 0.1777, "learning_rate": 4.627501857891113e-06, "epoch": 0.2171966091193286, "percentage": 21.72, "elapsed_time": "2:54:01", "remaining_time": "10:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 4438, "loss": 0.1947, "learning_rate": 4.626522938997037e-06, "epoch": 0.217421916805137, "percentage": 21.74, "elapsed_time": "2:54:12", "remaining_time": "10:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 4438, "loss": 0.1919, "learning_rate": 4.625542839324036e-06, "epoch": 0.21764722449094545, "percentage": 21.77, "elapsed_time": "2:54:23", "remaining_time": "10:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 4438, "loss": 0.1734, "learning_rate": 4.624561559416324e-06, "epoch": 0.21787253217675387, "percentage": 21.79, "elapsed_time": "2:54:34", "remaining_time": "10:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 4438, "loss": 0.1866, "learning_rate": 4.623579099818769e-06, "epoch": 0.21809783986256231, "percentage": 21.81, "elapsed_time": "2:54:43", "remaining_time": "10:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 4438, "loss": 0.1667, "learning_rate": 4.6225954610768945e-06, "epoch": 0.21832314754837073, "percentage": 21.83, "elapsed_time": "2:54:55", "remaining_time": "10:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 4438, "loss": 0.1848, "learning_rate": 4.621610643736878e-06, "epoch": 0.21854845523417918, "percentage": 21.86, "elapsed_time": "2:55:05", "remaining_time": "10:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 4438, "loss": 0.1771, "learning_rate": 4.620624648345552e-06, "epoch": 0.2187737629199876, "percentage": 21.88, "elapsed_time": "2:55:16", "remaining_time": "10:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 4438, "loss": 0.185, "learning_rate": 4.6196374754504024e-06, "epoch": 0.21899907060579604, "percentage": 21.9, "elapsed_time": "2:55:27", "remaining_time": "10:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 4438, "loss": 0.1973, "learning_rate": 4.61864912559957e-06, "epoch": 0.21922437829160446, "percentage": 21.92, "elapsed_time": "2:55:39", "remaining_time": "10:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 4438, "loss": 0.1659, "learning_rate": 4.617659599341849e-06, "epoch": 0.2194496859774129, "percentage": 21.95, "elapsed_time": "2:55:49", "remaining_time": "10:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 4438, "loss": 0.1817, "learning_rate": 4.616668897226686e-06, "epoch": 0.21967499366322132, "percentage": 21.97, "elapsed_time": "2:55:59", "remaining_time": "10:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 4438, "loss": 0.1819, "learning_rate": 4.615677019804182e-06, "epoch": 0.21990030134902977, "percentage": 21.99, "elapsed_time": "2:56:10", "remaining_time": "10:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 4438, "loss": 0.171, "learning_rate": 4.6146839676250875e-06, "epoch": 0.2201256090348382, "percentage": 22.01, "elapsed_time": "2:56:20", "remaining_time": "10:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 4438, "loss": 0.1912, "learning_rate": 4.6136897412408084e-06, "epoch": 0.22035091672064663, "percentage": 22.04, "elapsed_time": "2:56:30", "remaining_time": "10:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 4438, "loss": 0.1776, "learning_rate": 4.612694341203403e-06, "epoch": 0.22057622440645505, "percentage": 22.06, "elapsed_time": "2:56:41", "remaining_time": "10:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 4438, "loss": 0.1971, "learning_rate": 4.611697768065577e-06, "epoch": 0.2208015320922635, "percentage": 22.08, "elapsed_time": "2:56:53", "remaining_time": "10:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 4438, "loss": 0.1718, "learning_rate": 4.610700022380692e-06, "epoch": 0.22102683977807194, "percentage": 22.1, "elapsed_time": "2:57:03", "remaining_time": "10:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 4438, "loss": 0.1586, "learning_rate": 4.609701104702759e-06, "epoch": 0.22125214746388036, "percentage": 22.13, "elapsed_time": "2:57:14", "remaining_time": "10:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 4438, "loss": 0.16, "learning_rate": 4.6087010155864394e-06, "epoch": 0.2214774551496888, "percentage": 22.15, "elapsed_time": "2:57:24", "remaining_time": "10:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 4438, "loss": 0.1886, "learning_rate": 4.607699755587046e-06, "epoch": 0.22170276283549722, "percentage": 22.17, "elapsed_time": "2:57:35", "remaining_time": "10:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 4438, "loss": 0.2008, "learning_rate": 4.60669732526054e-06, "epoch": 0.22192807052130567, "percentage": 22.19, "elapsed_time": "2:57:47", "remaining_time": "10:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 4438, "loss": 0.1897, "learning_rate": 4.605693725163536e-06, "epoch": 0.2221533782071141, "percentage": 22.22, "elapsed_time": "2:57:58", "remaining_time": "10:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 4438, "loss": 0.1866, "learning_rate": 4.6046889558532925e-06, "epoch": 0.22237868589292253, "percentage": 22.24, "elapsed_time": "2:58:09", "remaining_time": "10:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 4438, "loss": 0.1753, "learning_rate": 4.603683017887722e-06, "epoch": 0.22260399357873095, "percentage": 22.26, "elapsed_time": "2:58:19", "remaining_time": "10:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 4438, "loss": 0.1772, "learning_rate": 4.602675911825386e-06, "epoch": 0.2228293012645394, "percentage": 22.28, "elapsed_time": "2:58:31", "remaining_time": "10:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.6016676382254895e-06, "epoch": 0.22305460895034782, "percentage": 22.31, "elapsed_time": "2:58:41", "remaining_time": "10:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 4438, "loss": 0.1718, "learning_rate": 4.600658197647892e-06, "epoch": 0.22327991663615626, "percentage": 22.33, "elapsed_time": "2:58:53", "remaining_time": "10:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 4438, "loss": 0.1871, "learning_rate": 4.5996475906530955e-06, "epoch": 0.22350522432196468, "percentage": 22.35, "elapsed_time": "2:59:03", "remaining_time": "10:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 4438, "loss": 0.1764, "learning_rate": 4.598635817802256e-06, "epoch": 0.22373053200777313, "percentage": 22.37, "elapsed_time": "2:59:14", "remaining_time": "10:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 4438, "loss": 0.1725, "learning_rate": 4.597622879657171e-06, "epoch": 0.22395583969358154, "percentage": 22.4, "elapsed_time": "2:59:24", "remaining_time": "10:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 4438, "loss": 0.1728, "learning_rate": 4.596608776780287e-06, "epoch": 0.22418114737939, "percentage": 22.42, "elapsed_time": "2:59:35", "remaining_time": "10:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 4438, "loss": 0.1811, "learning_rate": 4.595593509734699e-06, "epoch": 0.2244064550651984, "percentage": 22.44, "elapsed_time": "2:59:45", "remaining_time": "10:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 4438, "loss": 0.1695, "learning_rate": 4.594577079084146e-06, "epoch": 0.22463176275100685, "percentage": 22.47, "elapsed_time": "2:59:54", "remaining_time": "10:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 4438, "loss": 0.1799, "learning_rate": 4.593559485393015e-06, "epoch": 0.22485707043681527, "percentage": 22.49, "elapsed_time": "3:00:04", "remaining_time": "10:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 4438, "loss": 0.1886, "learning_rate": 4.592540729226336e-06, "epoch": 0.22508237812262372, "percentage": 22.51, "elapsed_time": "3:00:14", "remaining_time": "10:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 4438, "loss": 0.1775, "learning_rate": 4.591520811149787e-06, "epoch": 0.22530768580843213, "percentage": 22.53, "elapsed_time": "3:00:25", "remaining_time": "10:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 4438, "eval_loss": 0.1791670173406601, "epoch": 0.22530768580843213, "percentage": 22.53, "elapsed_time": "3:02:28", "remaining_time": "10:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 4438, "loss": 0.1732, "learning_rate": 4.590499731729692e-06, "epoch": 0.22553299349424058, "percentage": 22.56, "elapsed_time": "3:02:39", "remaining_time": "10:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 4438, "loss": 0.1599, "learning_rate": 4.589477491533016e-06, "epoch": 0.225758301180049, "percentage": 22.58, "elapsed_time": "3:02:50", "remaining_time": "10:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 4438, "loss": 0.1815, "learning_rate": 4.588454091127373e-06, "epoch": 0.22598360886585744, "percentage": 22.6, "elapsed_time": "3:03:02", "remaining_time": "10:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 4438, "loss": 0.1893, "learning_rate": 4.587429531081019e-06, "epoch": 0.22620891655166586, "percentage": 22.62, "elapsed_time": "3:03:15", "remaining_time": "10:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 4438, "loss": 0.1652, "learning_rate": 4.586403811962852e-06, "epoch": 0.2264342242374743, "percentage": 22.65, "elapsed_time": "3:03:27", "remaining_time": "10:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 4438, "loss": 0.1687, "learning_rate": 4.585376934342418e-06, "epoch": 0.22665953192328273, "percentage": 22.67, "elapsed_time": "3:03:38", "remaining_time": "10:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 4438, "loss": 0.1722, "learning_rate": 4.584348898789901e-06, "epoch": 0.22688483960909117, "percentage": 22.69, "elapsed_time": "3:03:48", "remaining_time": "10:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 4438, "loss": 0.1821, "learning_rate": 4.583319705876133e-06, "epoch": 0.2271101472948996, "percentage": 22.71, "elapsed_time": "3:03:59", "remaining_time": "10:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.5822893561725864e-06, "epoch": 0.22733545498070803, "percentage": 22.74, "elapsed_time": "3:04:08", "remaining_time": "10:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 4438, "loss": 0.1933, "learning_rate": 4.581257850251376e-06, "epoch": 0.22756076266651645, "percentage": 22.76, "elapsed_time": "3:04:19", "remaining_time": "10:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 4438, "loss": 0.1733, "learning_rate": 4.580225188685257e-06, "epoch": 0.2277860703523249, "percentage": 22.78, "elapsed_time": "3:04:30", "remaining_time": "10:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 4438, "loss": 0.1685, "learning_rate": 4.579191372047631e-06, "epoch": 0.22801137803813332, "percentage": 22.8, "elapsed_time": "3:04:40", "remaining_time": "10:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 4438, "loss": 0.2105, "learning_rate": 4.578156400912535e-06, "epoch": 0.22823668572394176, "percentage": 22.83, "elapsed_time": "3:04:51", "remaining_time": "10:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 4438, "loss": 0.1802, "learning_rate": 4.577120275854649e-06, "epoch": 0.22846199340975018, "percentage": 22.85, "elapsed_time": "3:05:02", "remaining_time": "10:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 4438, "loss": 0.183, "learning_rate": 4.576082997449298e-06, "epoch": 0.22868730109555863, "percentage": 22.87, "elapsed_time": "3:05:11", "remaining_time": "10:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 4438, "loss": 0.1868, "learning_rate": 4.5750445662724426e-06, "epoch": 0.22891260878136704, "percentage": 22.89, "elapsed_time": "3:05:21", "remaining_time": "10:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 4438, "loss": 0.1744, "learning_rate": 4.574004982900684e-06, "epoch": 0.2291379164671755, "percentage": 22.92, "elapsed_time": "3:05:31", "remaining_time": "10:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 4438, "loss": 0.1854, "learning_rate": 4.572964247911265e-06, "epoch": 0.2293632241529839, "percentage": 22.94, "elapsed_time": "3:05:42", "remaining_time": "10:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 4438, "loss": 0.1884, "learning_rate": 4.5719223618820666e-06, "epoch": 0.22958853183879235, "percentage": 22.96, "elapsed_time": "3:05:54", "remaining_time": "10:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 4438, "loss": 0.1766, "learning_rate": 4.5708793253916104e-06, "epoch": 0.22981383952460077, "percentage": 22.98, "elapsed_time": "3:06:03", "remaining_time": "10:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 4438, "loss": 0.1648, "learning_rate": 4.569835139019054e-06, "epoch": 0.23003914721040922, "percentage": 23.01, "elapsed_time": "3:06:13", "remaining_time": "10:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 4438, "loss": 0.1898, "learning_rate": 4.568789803344196e-06, "epoch": 0.23026445489621764, "percentage": 23.03, "elapsed_time": "3:06:24", "remaining_time": "10:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 4438, "loss": 0.1772, "learning_rate": 4.567743318947472e-06, "epoch": 0.23048976258202608, "percentage": 23.05, "elapsed_time": "3:06:33", "remaining_time": "10:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 4438, "loss": 0.198, "learning_rate": 4.566695686409957e-06, "epoch": 0.2307150702678345, "percentage": 23.07, "elapsed_time": "3:06:44", "remaining_time": "10:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 4438, "loss": 0.1764, "learning_rate": 4.56564690631336e-06, "epoch": 0.23094037795364294, "percentage": 23.1, "elapsed_time": "3:06:54", "remaining_time": "10:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 4438, "loss": 0.167, "learning_rate": 4.564596979240031e-06, "epoch": 0.23116568563945136, "percentage": 23.12, "elapsed_time": "3:07:04", "remaining_time": "10:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 4438, "loss": 0.1704, "learning_rate": 4.563545905772956e-06, "epoch": 0.2313909933252598, "percentage": 23.14, "elapsed_time": "3:07:14", "remaining_time": "10:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 4438, "loss": 0.1714, "learning_rate": 4.562493686495756e-06, "epoch": 0.23161630101106823, "percentage": 23.16, "elapsed_time": "3:07:23", "remaining_time": "10:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 4438, "loss": 0.1623, "learning_rate": 4.56144032199269e-06, "epoch": 0.23184160869687667, "percentage": 23.19, "elapsed_time": "3:07:33", "remaining_time": "10:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 4438, "loss": 0.1668, "learning_rate": 4.56038581284865e-06, "epoch": 0.23206691638268512, "percentage": 23.21, "elapsed_time": "3:07:44", "remaining_time": "10:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 4438, "loss": 0.1743, "learning_rate": 4.559330159649166e-06, "epoch": 0.23229222406849354, "percentage": 23.23, "elapsed_time": "3:07:54", "remaining_time": "10:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 4438, "loss": 0.1693, "learning_rate": 4.558273362980406e-06, "epoch": 0.23251753175430198, "percentage": 23.25, "elapsed_time": "3:08:04", "remaining_time": "10:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 4438, "loss": 0.1724, "learning_rate": 4.557215423429167e-06, "epoch": 0.2327428394401104, "percentage": 23.28, "elapsed_time": "3:08:16", "remaining_time": "10:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.556156341582884e-06, "epoch": 0.23296814712591885, "percentage": 23.3, "elapsed_time": "3:08:26", "remaining_time": "10:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 4438, "loss": 0.169, "learning_rate": 4.555096118029625e-06, "epoch": 0.23319345481172726, "percentage": 23.32, "elapsed_time": "3:08:37", "remaining_time": "10:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 4438, "loss": 0.1757, "learning_rate": 4.5540347533580935e-06, "epoch": 0.2334187624975357, "percentage": 23.34, "elapsed_time": "3:08:48", "remaining_time": "10:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 4438, "loss": 0.1665, "learning_rate": 4.5529722481576265e-06, "epoch": 0.23364407018334413, "percentage": 23.37, "elapsed_time": "3:08:58", "remaining_time": "10:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 4438, "loss": 0.1734, "learning_rate": 4.551908603018191e-06, "epoch": 0.23386937786915257, "percentage": 23.39, "elapsed_time": "3:09:08", "remaining_time": "10:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 4438, "loss": 0.1797, "learning_rate": 4.550843818530392e-06, "epoch": 0.234094685554961, "percentage": 23.41, "elapsed_time": "3:09:18", "remaining_time": "10:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 4438, "loss": 0.1644, "learning_rate": 4.549777895285464e-06, "epoch": 0.23431999324076944, "percentage": 23.43, "elapsed_time": "3:09:29", "remaining_time": "10:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.548710833875273e-06, "epoch": 0.23454530092657785, "percentage": 23.46, "elapsed_time": "3:09:38", "remaining_time": "10:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 4438, "loss": 0.1733, "learning_rate": 4.547642634892321e-06, "epoch": 0.2347706086123863, "percentage": 23.48, "elapsed_time": "3:09:49", "remaining_time": "10:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.5465732989297365e-06, "epoch": 0.23499591629819472, "percentage": 23.5, "elapsed_time": "3:09:59", "remaining_time": "10:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 4438, "loss": 0.1843, "learning_rate": 4.545502826581284e-06, "epoch": 0.23522122398400316, "percentage": 23.52, "elapsed_time": "3:10:08", "remaining_time": "10:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 4438, "loss": 0.1914, "learning_rate": 4.5444312184413554e-06, "epoch": 0.23544653166981158, "percentage": 23.55, "elapsed_time": "3:10:20", "remaining_time": "10:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 4438, "loss": 0.176, "learning_rate": 4.543358475104975e-06, "epoch": 0.23567183935562003, "percentage": 23.57, "elapsed_time": "3:10:29", "remaining_time": "10:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.5422845971677985e-06, "epoch": 0.23589714704142845, "percentage": 23.59, "elapsed_time": "3:10:40", "remaining_time": "10:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 4438, "loss": 0.1665, "learning_rate": 4.541209585226109e-06, "epoch": 0.2361224547272369, "percentage": 23.61, "elapsed_time": "3:10:52", "remaining_time": "10:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 4438, "loss": 0.17, "learning_rate": 4.5401334398768195e-06, "epoch": 0.2363477624130453, "percentage": 23.64, "elapsed_time": "3:11:01", "remaining_time": "10:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 4438, "loss": 0.1735, "learning_rate": 4.539056161717477e-06, "epoch": 0.23657307009885375, "percentage": 23.66, "elapsed_time": "3:11:13", "remaining_time": "10:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.53797775134625e-06, "epoch": 0.23679837778466217, "percentage": 23.68, "elapsed_time": "3:11:23", "remaining_time": "10:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 4438, "loss": 0.1815, "learning_rate": 4.536898209361942e-06, "epoch": 0.23702368547047062, "percentage": 23.7, "elapsed_time": "3:11:33", "remaining_time": "10:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 4438, "loss": 0.1737, "learning_rate": 4.535817536363981e-06, "epoch": 0.23724899315627904, "percentage": 23.73, "elapsed_time": "3:11:45", "remaining_time": "10:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 4438, "loss": 0.161, "learning_rate": 4.5347357329524254e-06, "epoch": 0.23747430084208748, "percentage": 23.75, "elapsed_time": "3:11:54", "remaining_time": "10:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 4438, "loss": 0.1746, "learning_rate": 4.53365279972796e-06, "epoch": 0.2376996085278959, "percentage": 23.77, "elapsed_time": "3:12:03", "remaining_time": "10:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 4438, "loss": 0.1728, "learning_rate": 4.532568737291898e-06, "epoch": 0.23792491621370435, "percentage": 23.79, "elapsed_time": "3:12:13", "remaining_time": "10:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 4438, "loss": 0.1917, "learning_rate": 4.531483546246177e-06, "epoch": 0.23815022389951276, "percentage": 23.82, "elapsed_time": "3:12:24", "remaining_time": "10:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 4438, "loss": 0.1809, "learning_rate": 4.530397227193365e-06, "epoch": 0.2383755315853212, "percentage": 23.84, "elapsed_time": "3:12:37", "remaining_time": "10:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 4438, "loss": 0.1819, "learning_rate": 4.529309780736654e-06, "epoch": 0.23860083927112963, "percentage": 23.86, "elapsed_time": "3:12:47", "remaining_time": "10:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 4438, "loss": 0.1884, "learning_rate": 4.528221207479862e-06, "epoch": 0.23882614695693807, "percentage": 23.88, "elapsed_time": "3:12:59", "remaining_time": "10:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 4438, "loss": 0.1668, "learning_rate": 4.527131508027433e-06, "epoch": 0.2390514546427465, "percentage": 23.91, "elapsed_time": "3:13:09", "remaining_time": "10:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 4438, "loss": 0.1803, "learning_rate": 4.5260406829844364e-06, "epoch": 0.23927676232855494, "percentage": 23.93, "elapsed_time": "3:13:21", "remaining_time": "10:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 4438, "loss": 0.2003, "learning_rate": 4.524948732956568e-06, "epoch": 0.23950207001436336, "percentage": 23.95, "elapsed_time": "3:13:32", "remaining_time": "10:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 4438, "loss": 0.1808, "learning_rate": 4.523855658550146e-06, "epoch": 0.2397273777001718, "percentage": 23.97, "elapsed_time": "3:13:43", "remaining_time": "10:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 4438, "loss": 0.1817, "learning_rate": 4.522761460372114e-06, "epoch": 0.23995268538598022, "percentage": 24.0, "elapsed_time": "3:13:54", "remaining_time": "10:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 4438, "loss": 0.1735, "learning_rate": 4.521666139030039e-06, "epoch": 0.24017799307178866, "percentage": 24.02, "elapsed_time": "3:14:05", "remaining_time": "10:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 4438, "loss": 0.1532, "learning_rate": 4.520569695132113e-06, "epoch": 0.24040330075759708, "percentage": 24.04, "elapsed_time": "3:14:15", "remaining_time": "10:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 4438, "loss": 0.1842, "learning_rate": 4.51947212928715e-06, "epoch": 0.24062860844340553, "percentage": 24.06, "elapsed_time": "3:14:26", "remaining_time": "10:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 4438, "loss": 0.1838, "learning_rate": 4.518373442104587e-06, "epoch": 0.24085391612921395, "percentage": 24.09, "elapsed_time": "3:14:37", "remaining_time": "10:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 4438, "loss": 0.169, "learning_rate": 4.5172736341944845e-06, "epoch": 0.2410792238150224, "percentage": 24.11, "elapsed_time": "3:14:48", "remaining_time": "10:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 4438, "loss": 0.1745, "learning_rate": 4.516172706167525e-06, "epoch": 0.2413045315008308, "percentage": 24.13, "elapsed_time": "3:14:58", "remaining_time": "10:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 4438, "loss": 0.1781, "learning_rate": 4.515070658635013e-06, "epoch": 0.24152983918663926, "percentage": 24.16, "elapsed_time": "3:15:08", "remaining_time": "10:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 4438, "loss": 0.1725, "learning_rate": 4.513967492208874e-06, "epoch": 0.24175514687244767, "percentage": 24.18, "elapsed_time": "3:15:20", "remaining_time": "10:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 4438, "loss": 0.1968, "learning_rate": 4.512863207501654e-06, "epoch": 0.24198045455825612, "percentage": 24.2, "elapsed_time": "3:15:31", "remaining_time": "10:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 4438, "loss": 0.1715, "learning_rate": 4.511757805126523e-06, "epoch": 0.24220576224406454, "percentage": 24.22, "elapsed_time": "3:15:41", "remaining_time": "10:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 4438, "loss": 0.1737, "learning_rate": 4.510651285697269e-06, "epoch": 0.24243106992987298, "percentage": 24.25, "elapsed_time": "3:15:53", "remaining_time": "10:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 4438, "loss": 0.1723, "learning_rate": 4.509543649828302e-06, "epoch": 0.2426563776156814, "percentage": 24.27, "elapsed_time": "3:16:04", "remaining_time": "10:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 4438, "loss": 0.1742, "learning_rate": 4.5084348981346495e-06, "epoch": 0.24288168530148985, "percentage": 24.29, "elapsed_time": "3:16:14", "remaining_time": "10:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 4438, "loss": 0.181, "learning_rate": 4.507325031231959e-06, "epoch": 0.2431069929872983, "percentage": 24.31, "elapsed_time": "3:16:24", "remaining_time": "10:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 4438, "loss": 0.1771, "learning_rate": 4.506214049736502e-06, "epoch": 0.2433323006731067, "percentage": 24.34, "elapsed_time": "3:16:35", "remaining_time": "10:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 4438, "loss": 0.1942, "learning_rate": 4.505101954265161e-06, "epoch": 0.24355760835891516, "percentage": 24.36, "elapsed_time": "3:16:46", "remaining_time": "10:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 4438, "loss": 0.1635, "learning_rate": 4.503988745435443e-06, "epoch": 0.24378291604472357, "percentage": 24.38, "elapsed_time": "3:16:57", "remaining_time": "10:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 4438, "loss": 0.1834, "learning_rate": 4.502874423865473e-06, "epoch": 0.24400822373053202, "percentage": 24.4, "elapsed_time": "3:17:06", "remaining_time": "10:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 4438, "loss": 0.1711, "learning_rate": 4.5017589901739885e-06, "epoch": 0.24423353141634044, "percentage": 24.43, "elapsed_time": "3:17:17", "remaining_time": "10:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 4438, "loss": 0.1808, "learning_rate": 4.500642444980352e-06, "epoch": 0.24445883910214888, "percentage": 24.45, "elapsed_time": "3:17:26", "remaining_time": "10:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 4438, "loss": 0.1664, "learning_rate": 4.499524788904537e-06, "epoch": 0.2446841467879573, "percentage": 24.47, "elapsed_time": "3:17:36", "remaining_time": "10:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 4438, "loss": 0.1781, "learning_rate": 4.498406022567137e-06, "epoch": 0.24490945447376575, "percentage": 24.49, "elapsed_time": "3:17:47", "remaining_time": "10:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.497286146589361e-06, "epoch": 0.24513476215957417, "percentage": 24.52, "elapsed_time": "3:17:58", "remaining_time": "10:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 4438, "loss": 0.1705, "learning_rate": 4.4961651615930344e-06, "epoch": 0.2453600698453826, "percentage": 24.54, "elapsed_time": "3:18:09", "remaining_time": "10:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.4950430682005995e-06, "epoch": 0.24558537753119103, "percentage": 24.56, "elapsed_time": "3:18:20", "remaining_time": "10:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 4438, "loss": 0.1516, "learning_rate": 4.493919867035112e-06, "epoch": 0.24581068521699947, "percentage": 24.58, "elapsed_time": "3:18:30", "remaining_time": "10:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 4438, "loss": 0.1623, "learning_rate": 4.492795558720242e-06, "epoch": 0.2460359929028079, "percentage": 24.61, "elapsed_time": "3:18:40", "remaining_time": "10:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 4438, "loss": 0.1639, "learning_rate": 4.491670143880279e-06, "epoch": 0.24626130058861634, "percentage": 24.63, "elapsed_time": "3:18:52", "remaining_time": "10:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 4438, "loss": 0.1864, "learning_rate": 4.490543623140123e-06, "epoch": 0.24648660827442476, "percentage": 24.65, "elapsed_time": "3:19:02", "remaining_time": "10:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 4438, "loss": 0.1829, "learning_rate": 4.489415997125288e-06, "epoch": 0.2467119159602332, "percentage": 24.67, "elapsed_time": "3:19:13", "remaining_time": "10:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 4438, "loss": 0.1819, "learning_rate": 4.488287266461904e-06, "epoch": 0.24693722364604162, "percentage": 24.7, "elapsed_time": "3:19:24", "remaining_time": "10:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 4438, "loss": 0.1801, "learning_rate": 4.487157431776712e-06, "epoch": 0.24716253133185007, "percentage": 24.72, "elapsed_time": "3:19:34", "remaining_time": "10:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 4438, "loss": 0.1775, "learning_rate": 4.486026493697067e-06, "epoch": 0.24738783901765848, "percentage": 24.74, "elapsed_time": "3:19:45", "remaining_time": "10:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 4438, "loss": 0.1678, "learning_rate": 4.484894452850937e-06, "epoch": 0.24761314670346693, "percentage": 24.76, "elapsed_time": "3:19:55", "remaining_time": "10:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 4438, "loss": 0.1972, "learning_rate": 4.483761309866902e-06, "epoch": 0.24783845438927535, "percentage": 24.79, "elapsed_time": "3:20:06", "remaining_time": "10:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 4438, "loss": 0.1936, "learning_rate": 4.482627065374155e-06, "epoch": 0.2480637620750838, "percentage": 24.81, "elapsed_time": "3:20:16", "remaining_time": "10:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 4438, "loss": 0.1701, "learning_rate": 4.481491720002499e-06, "epoch": 0.2482890697608922, "percentage": 24.83, "elapsed_time": "3:20:27", "remaining_time": "10:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 4438, "loss": 0.1765, "learning_rate": 4.4803552743823495e-06, "epoch": 0.24851437744670066, "percentage": 24.85, "elapsed_time": "3:20:38", "remaining_time": "10:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 4438, "loss": 0.1802, "learning_rate": 4.479217729144731e-06, "epoch": 0.24873968513250908, "percentage": 24.88, "elapsed_time": "3:20:49", "remaining_time": "10:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 4438, "loss": 0.1606, "learning_rate": 4.478079084921282e-06, "epoch": 0.24896499281831752, "percentage": 24.9, "elapsed_time": "3:21:01", "remaining_time": "10:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 4438, "loss": 0.1704, "learning_rate": 4.476939342344246e-06, "epoch": 0.24919030050412594, "percentage": 24.92, "elapsed_time": "3:21:13", "remaining_time": "10:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 4438, "loss": 0.1755, "learning_rate": 4.475798502046484e-06, "epoch": 0.24941560818993438, "percentage": 24.94, "elapsed_time": "3:21:23", "remaining_time": "10:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 4438, "loss": 0.1641, "learning_rate": 4.474656564661458e-06, "epoch": 0.2496409158757428, "percentage": 24.97, "elapsed_time": "3:21:34", "remaining_time": "10:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 4438, "loss": 0.1869, "learning_rate": 4.473513530823246e-06, "epoch": 0.24986622356155125, "percentage": 24.99, "elapsed_time": "3:21:46", "remaining_time": "10:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 4438, "loss": 0.1786, "learning_rate": 4.472369401166531e-06, "epoch": 0.25009153124735967, "percentage": 25.01, "elapsed_time": "3:21:57", "remaining_time": "10:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 4438, "loss": 0.1703, "learning_rate": 4.471224176326605e-06, "epoch": 0.2503168389331681, "percentage": 25.03, "elapsed_time": "3:22:07", "remaining_time": "10:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 4438, "loss": 0.1834, "learning_rate": 4.47007785693937e-06, "epoch": 0.25054214661897656, "percentage": 25.06, "elapsed_time": "3:22:17", "remaining_time": "10:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 4438, "loss": 0.1782, "learning_rate": 4.468930443641333e-06, "epoch": 0.250767454304785, "percentage": 25.08, "elapsed_time": "3:22:27", "remaining_time": "10:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 4438, "loss": 0.1845, "learning_rate": 4.467781937069611e-06, "epoch": 0.2509927619905934, "percentage": 25.1, "elapsed_time": "3:22:37", "remaining_time": "10:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 4438, "loss": 0.1733, "learning_rate": 4.466632337861926e-06, "epoch": 0.2512180696764018, "percentage": 25.12, "elapsed_time": "3:22:48", "remaining_time": "10:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 4438, "loss": 0.1849, "learning_rate": 4.465481646656608e-06, "epoch": 0.2514433773622103, "percentage": 25.15, "elapsed_time": "3:22:59", "remaining_time": "10:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 4438, "loss": 0.1736, "learning_rate": 4.464329864092593e-06, "epoch": 0.2516686850480187, "percentage": 25.17, "elapsed_time": "3:23:10", "remaining_time": "10:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 4438, "loss": 0.1835, "learning_rate": 4.463176990809423e-06, "epoch": 0.2518939927338271, "percentage": 25.19, "elapsed_time": "3:23:22", "remaining_time": "10:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 4438, "loss": 0.177, "learning_rate": 4.462023027447246e-06, "epoch": 0.25211930041963554, "percentage": 25.21, "elapsed_time": "3:23:33", "remaining_time": "10:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 4438, "loss": 0.1671, "learning_rate": 4.460867974646814e-06, "epoch": 0.252344608105444, "percentage": 25.24, "elapsed_time": "3:23:44", "remaining_time": "10:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 4438, "loss": 0.1964, "learning_rate": 4.459711833049485e-06, "epoch": 0.25256991579125243, "percentage": 25.26, "elapsed_time": "3:23:54", "remaining_time": "10:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 4438, "loss": 0.1758, "learning_rate": 4.45855460329722e-06, "epoch": 0.25279522347706085, "percentage": 25.28, "elapsed_time": "3:24:05", "remaining_time": "10:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 4438, "loss": 0.181, "learning_rate": 4.457396286032589e-06, "epoch": 0.25302053116286927, "percentage": 25.3, "elapsed_time": "3:24:15", "remaining_time": "10:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 4438, "loss": 0.1728, "learning_rate": 4.45623688189876e-06, "epoch": 0.25324583884867774, "percentage": 25.33, "elapsed_time": "3:24:26", "remaining_time": "10:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 4438, "loss": 0.1854, "learning_rate": 4.455076391539507e-06, "epoch": 0.25347114653448616, "percentage": 25.35, "elapsed_time": "3:24:36", "remaining_time": "10:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 4438, "loss": 0.1673, "learning_rate": 4.453914815599206e-06, "epoch": 0.2536964542202946, "percentage": 25.37, "elapsed_time": "3:24:47", "remaining_time": "10:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 4438, "loss": 0.1743, "learning_rate": 4.45275215472284e-06, "epoch": 0.25392176190610305, "percentage": 25.39, "elapsed_time": "3:24:58", "remaining_time": "10:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 4438, "loss": 0.1656, "learning_rate": 4.451588409555988e-06, "epoch": 0.25414706959191147, "percentage": 25.42, "elapsed_time": "3:25:08", "remaining_time": "10:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 4438, "loss": 0.1703, "learning_rate": 4.450423580744837e-06, "epoch": 0.2543723772777199, "percentage": 25.44, "elapsed_time": "3:25:18", "remaining_time": "10:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 4438, "loss": 0.1654, "learning_rate": 4.4492576689361705e-06, "epoch": 0.2545976849635283, "percentage": 25.46, "elapsed_time": "3:25:28", "remaining_time": "10:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 4438, "loss": 0.179, "learning_rate": 4.448090674777377e-06, "epoch": 0.2548229926493368, "percentage": 25.48, "elapsed_time": "3:25:37", "remaining_time": "10:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 4438, "loss": 0.1657, "learning_rate": 4.446922598916445e-06, "epoch": 0.2550483003351452, "percentage": 25.51, "elapsed_time": "3:25:47", "remaining_time": "10:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 4438, "loss": 0.1662, "learning_rate": 4.4457534420019644e-06, "epoch": 0.2552736080209536, "percentage": 25.53, "elapsed_time": "3:25:57", "remaining_time": "10:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 4438, "loss": 0.1832, "learning_rate": 4.444583204683123e-06, "epoch": 0.25549891570676203, "percentage": 25.55, "elapsed_time": "3:26:09", "remaining_time": "10:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 4438, "loss": 0.1687, "learning_rate": 4.44341188760971e-06, "epoch": 0.2557242233925705, "percentage": 25.57, "elapsed_time": "3:26:20", "remaining_time": "10:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 4438, "loss": 0.1796, "learning_rate": 4.4422394914321145e-06, "epoch": 0.2559495310783789, "percentage": 25.6, "elapsed_time": "3:26:31", "remaining_time": "10:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 4438, "loss": 0.1723, "learning_rate": 4.4410660168013255e-06, "epoch": 0.25617483876418734, "percentage": 25.62, "elapsed_time": "3:26:41", "remaining_time": "10:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 4438, "loss": 0.1683, "learning_rate": 4.439891464368927e-06, "epoch": 0.25640014644999576, "percentage": 25.64, "elapsed_time": "3:26:52", "remaining_time": "9:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 4438, "loss": 0.1725, "learning_rate": 4.438715834787107e-06, "epoch": 0.25662545413580423, "percentage": 25.66, "elapsed_time": "3:27:03", "remaining_time": "9:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 4438, "loss": 0.1783, "learning_rate": 4.437539128708647e-06, "epoch": 0.25685076182161265, "percentage": 25.69, "elapsed_time": "3:27:15", "remaining_time": "9:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 4438, "loss": 0.1724, "learning_rate": 4.436361346786929e-06, "epoch": 0.25707606950742107, "percentage": 25.71, "elapsed_time": "3:27:24", "remaining_time": "9:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 4438, "loss": 0.1635, "learning_rate": 4.435182489675931e-06, "epoch": 0.2573013771932295, "percentage": 25.73, "elapsed_time": "3:27:35", "remaining_time": "9:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 4438, "loss": 0.1761, "learning_rate": 4.4340025580302285e-06, "epoch": 0.25752668487903796, "percentage": 25.75, "elapsed_time": "3:27:45", "remaining_time": "9:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 4438, "loss": 0.1608, "learning_rate": 4.432821552504994e-06, "epoch": 0.2577519925648464, "percentage": 25.78, "elapsed_time": "3:27:57", "remaining_time": "9:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 4438, "loss": 0.1685, "learning_rate": 4.431639473755994e-06, "epoch": 0.2579773002506548, "percentage": 25.8, "elapsed_time": "3:28:09", "remaining_time": "9:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.430456322439596e-06, "epoch": 0.2582026079364632, "percentage": 25.82, "elapsed_time": "3:28:19", "remaining_time": "9:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.429272099212757e-06, "epoch": 0.2584279156222717, "percentage": 25.84, "elapsed_time": "3:28:29", "remaining_time": "9:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 4438, "loss": 0.1644, "learning_rate": 4.4280868047330325e-06, "epoch": 0.2586532233080801, "percentage": 25.87, "elapsed_time": "3:28:39", "remaining_time": "9:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 4438, "loss": 0.176, "learning_rate": 4.4269004396585735e-06, "epoch": 0.2588785309938885, "percentage": 25.89, "elapsed_time": "3:28:49", "remaining_time": "9:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 4438, "loss": 0.1689, "learning_rate": 4.425713004648123e-06, "epoch": 0.25910383867969694, "percentage": 25.91, "elapsed_time": "3:29:00", "remaining_time": "9:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 4438, "loss": 0.1595, "learning_rate": 4.424524500361021e-06, "epoch": 0.2593291463655054, "percentage": 25.94, "elapsed_time": "3:29:10", "remaining_time": "9:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 4438, "loss": 0.1559, "learning_rate": 4.423334927457198e-06, "epoch": 0.25955445405131383, "percentage": 25.96, "elapsed_time": "3:29:20", "remaining_time": "9:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.42214428659718e-06, "epoch": 0.25977976173712225, "percentage": 25.98, "elapsed_time": "3:29:30", "remaining_time": "9:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.420952578442086e-06, "epoch": 0.26000506942293067, "percentage": 26.0, "elapsed_time": "3:29:41", "remaining_time": "9:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 4438, "loss": 0.1797, "learning_rate": 4.419759803653627e-06, "epoch": 0.26023037710873914, "percentage": 26.03, "elapsed_time": "3:29:52", "remaining_time": "9:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 4438, "loss": 0.1721, "learning_rate": 4.4185659628941054e-06, "epoch": 0.26045568479454756, "percentage": 26.05, "elapsed_time": "3:30:03", "remaining_time": "9:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 4438, "loss": 0.1537, "learning_rate": 4.417371056826417e-06, "epoch": 0.260680992480356, "percentage": 26.07, "elapsed_time": "3:30:15", "remaining_time": "9:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 4438, "loss": 0.1801, "learning_rate": 4.416175086114049e-06, "epoch": 0.2609063001661644, "percentage": 26.09, "elapsed_time": "3:30:26", "remaining_time": "9:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 4438, "loss": 0.1759, "learning_rate": 4.414978051421081e-06, "epoch": 0.26113160785197287, "percentage": 26.12, "elapsed_time": "3:30:36", "remaining_time": "9:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 4438, "loss": 0.1821, "learning_rate": 4.4137799534121785e-06, "epoch": 0.2613569155377813, "percentage": 26.14, "elapsed_time": "3:30:48", "remaining_time": "9:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 4438, "loss": 0.1719, "learning_rate": 4.412580792752601e-06, "epoch": 0.2615822232235897, "percentage": 26.16, "elapsed_time": "3:30:58", "remaining_time": "9:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 4438, "loss": 0.1726, "learning_rate": 4.4113805701082e-06, "epoch": 0.2618075309093981, "percentage": 26.18, "elapsed_time": "3:31:09", "remaining_time": "9:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 4438, "loss": 0.1615, "learning_rate": 4.410179286145414e-06, "epoch": 0.2620328385952066, "percentage": 26.21, "elapsed_time": "3:31:20", "remaining_time": "9:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 4438, "loss": 0.1757, "learning_rate": 4.408976941531269e-06, "epoch": 0.262258146281015, "percentage": 26.23, "elapsed_time": "3:31:30", "remaining_time": "9:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 4438, "loss": 0.1881, "learning_rate": 4.407773536933384e-06, "epoch": 0.26248345396682343, "percentage": 26.25, "elapsed_time": "3:31:42", "remaining_time": "9:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 4438, "loss": 0.1785, "learning_rate": 4.406569073019965e-06, "epoch": 0.26270876165263185, "percentage": 26.27, "elapsed_time": "3:31:54", "remaining_time": "9:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.4053635504598045e-06, "epoch": 0.2629340693384403, "percentage": 26.3, "elapsed_time": "3:32:04", "remaining_time": "9:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 4438, "loss": 0.1715, "learning_rate": 4.404156969922284e-06, "epoch": 0.26315937702424874, "percentage": 26.32, "elapsed_time": "3:32:14", "remaining_time": "9:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 4438, "loss": 0.1773, "learning_rate": 4.402949332077375e-06, "epoch": 0.26338468471005716, "percentage": 26.34, "elapsed_time": "3:32:26", "remaining_time": "9:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 4438, "loss": 0.1668, "learning_rate": 4.401740637595633e-06, "epoch": 0.2636099923958656, "percentage": 26.36, "elapsed_time": "3:32:38", "remaining_time": "9:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 4438, "loss": 0.1706, "learning_rate": 4.400530887148199e-06, "epoch": 0.26383530008167405, "percentage": 26.39, "elapsed_time": "3:32:49", "remaining_time": "9:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 4438, "loss": 0.161, "learning_rate": 4.3993200814068035e-06, "epoch": 0.26406060776748247, "percentage": 26.41, "elapsed_time": "3:32:59", "remaining_time": "9:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 4438, "loss": 0.1833, "learning_rate": 4.398108221043764e-06, "epoch": 0.2642859154532909, "percentage": 26.43, "elapsed_time": "3:33:11", "remaining_time": "9:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.396895306731978e-06, "epoch": 0.2645112231390993, "percentage": 26.45, "elapsed_time": "3:33:20", "remaining_time": "9:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 4438, "loss": 0.1883, "learning_rate": 4.395681339144933e-06, "epoch": 0.2647365308249078, "percentage": 26.48, "elapsed_time": "3:33:32", "remaining_time": "9:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 4438, "loss": 0.1723, "learning_rate": 4.394466318956701e-06, "epoch": 0.2649618385107162, "percentage": 26.5, "elapsed_time": "3:33:42", "remaining_time": "9:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 4438, "loss": 0.1725, "learning_rate": 4.393250246841935e-06, "epoch": 0.2651871461965246, "percentage": 26.52, "elapsed_time": "3:33:53", "remaining_time": "9:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 4438, "loss": 0.1689, "learning_rate": 4.392033123475876e-06, "epoch": 0.2654124538823331, "percentage": 26.54, "elapsed_time": "3:34:03", "remaining_time": "9:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 4438, "loss": 0.1735, "learning_rate": 4.390814949534348e-06, "epoch": 0.2656377615681415, "percentage": 26.57, "elapsed_time": "3:34:14", "remaining_time": "9:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 4438, "loss": 0.1728, "learning_rate": 4.389595725693756e-06, "epoch": 0.2658630692539499, "percentage": 26.59, "elapsed_time": "3:34:24", "remaining_time": "9:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 4438, "loss": 0.1648, "learning_rate": 4.388375452631091e-06, "epoch": 0.26608837693975834, "percentage": 26.61, "elapsed_time": "3:34:35", "remaining_time": "9:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 4438, "loss": 0.1567, "learning_rate": 4.387154131023924e-06, "epoch": 0.2663136846255668, "percentage": 26.63, "elapsed_time": "3:34:45", "remaining_time": "9:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.385931761550411e-06, "epoch": 0.26653899231137523, "percentage": 26.66, "elapsed_time": "3:34:55", "remaining_time": "9:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 4438, "loss": 0.1758, "learning_rate": 4.384708344889285e-06, "epoch": 0.26676429999718365, "percentage": 26.68, "elapsed_time": "3:35:06", "remaining_time": "9:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.383483881719867e-06, "epoch": 0.26698960768299207, "percentage": 26.7, "elapsed_time": "3:35:18", "remaining_time": "9:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 4438, "loss": 0.1725, "learning_rate": 4.382258372722054e-06, "epoch": 0.26721491536880054, "percentage": 26.72, "elapsed_time": "3:35:28", "remaining_time": "9:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 4438, "loss": 0.1618, "learning_rate": 4.381031818576326e-06, "epoch": 0.26744022305460896, "percentage": 26.75, "elapsed_time": "3:35:40", "remaining_time": "9:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.379804219963742e-06, "epoch": 0.2676655307404174, "percentage": 26.77, "elapsed_time": "3:35:50", "remaining_time": "9:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 4438, "loss": 0.1721, "learning_rate": 4.378575577565945e-06, "epoch": 0.2678908384262258, "percentage": 26.79, "elapsed_time": "3:36:00", "remaining_time": "9:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 4438, "loss": 0.1604, "learning_rate": 4.377345892065149e-06, "epoch": 0.26811614611203427, "percentage": 26.81, "elapsed_time": "3:36:11", "remaining_time": "9:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 4438, "loss": 0.1741, "learning_rate": 4.376115164144157e-06, "epoch": 0.2683414537978427, "percentage": 26.84, "elapsed_time": "3:36:22", "remaining_time": "9:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 4438, "loss": 0.1718, "learning_rate": 4.374883394486343e-06, "epoch": 0.2685667614836511, "percentage": 26.86, "elapsed_time": "3:36:34", "remaining_time": "9:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 4438, "loss": 0.1669, "learning_rate": 4.373650583775666e-06, "epoch": 0.2687920691694595, "percentage": 26.88, "elapsed_time": "3:36:44", "remaining_time": "9:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 4438, "loss": 0.1827, "learning_rate": 4.3724167326966575e-06, "epoch": 0.269017376855268, "percentage": 26.9, "elapsed_time": "3:36:55", "remaining_time": "9:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 4438, "loss": 0.1631, "learning_rate": 4.37118184193443e-06, "epoch": 0.2692426845410764, "percentage": 26.93, "elapsed_time": "3:37:06", "remaining_time": "9:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 4438, "loss": 0.178, "learning_rate": 4.3699459121746726e-06, "epoch": 0.26946799222688483, "percentage": 26.95, "elapsed_time": "3:37:15", "remaining_time": "9:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 4438, "loss": 0.1623, "learning_rate": 4.368708944103649e-06, "epoch": 0.26969329991269325, "percentage": 26.97, "elapsed_time": "3:37:25", "remaining_time": "9:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 4438, "loss": 0.167, "learning_rate": 4.367470938408204e-06, "epoch": 0.2699186075985017, "percentage": 26.99, "elapsed_time": "3:37:36", "remaining_time": "9:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.366231895775755e-06, "epoch": 0.27014391528431014, "percentage": 27.02, "elapsed_time": "3:37:46", "remaining_time": "9:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 4438, "loss": 0.1527, "learning_rate": 4.364991816894296e-06, "epoch": 0.27036922297011856, "percentage": 27.04, "elapsed_time": "3:37:56", "remaining_time": "9:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 4438, "loss": 0.1998, "learning_rate": 4.3637507024523975e-06, "epoch": 0.270594530655927, "percentage": 27.06, "elapsed_time": "3:38:06", "remaining_time": "9:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 4438, "loss": 0.184, "learning_rate": 4.362508553139203e-06, "epoch": 0.27081983834173545, "percentage": 27.08, "elapsed_time": "3:38:18", "remaining_time": "9:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 4438, "loss": 0.1693, "learning_rate": 4.361265369644432e-06, "epoch": 0.27104514602754387, "percentage": 27.11, "elapsed_time": "3:38:29", "remaining_time": "9:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 4438, "loss": 0.1805, "learning_rate": 4.360021152658378e-06, "epoch": 0.2712704537133523, "percentage": 27.13, "elapsed_time": "3:38:38", "remaining_time": "9:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 4438, "loss": 0.164, "learning_rate": 4.3587759028719075e-06, "epoch": 0.2714957613991607, "percentage": 27.15, "elapsed_time": "3:38:50", "remaining_time": "9:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 4438, "loss": 0.1672, "learning_rate": 4.357529620976463e-06, "epoch": 0.2717210690849692, "percentage": 27.17, "elapsed_time": "3:39:00", "remaining_time": "9:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.356282307664057e-06, "epoch": 0.2719463767707776, "percentage": 27.2, "elapsed_time": "3:39:10", "remaining_time": "9:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 4438, "loss": 0.1636, "learning_rate": 4.355033963627277e-06, "epoch": 0.272171684456586, "percentage": 27.22, "elapsed_time": "3:39:19", "remaining_time": "9:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 4438, "loss": 0.154, "learning_rate": 4.353784589559282e-06, "epoch": 0.27239699214239443, "percentage": 27.24, "elapsed_time": "3:39:30", "remaining_time": "9:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.352534186153802e-06, "epoch": 0.2726222998282029, "percentage": 27.26, "elapsed_time": "3:39:40", "remaining_time": "9:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 4438, "loss": 0.1683, "learning_rate": 4.35128275410514e-06, "epoch": 0.2728476075140113, "percentage": 27.29, "elapsed_time": "3:39:51", "remaining_time": "9:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 4438, "loss": 0.1804, "learning_rate": 4.3500302941081685e-06, "epoch": 0.27307291519981974, "percentage": 27.31, "elapsed_time": "3:40:02", "remaining_time": "9:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 4438, "loss": 0.1808, "learning_rate": 4.348776806858334e-06, "epoch": 0.27329822288562816, "percentage": 27.33, "elapsed_time": "3:40:13", "remaining_time": "9:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 4438, "loss": 0.1763, "learning_rate": 4.3475222930516484e-06, "epoch": 0.27352353057143663, "percentage": 27.35, "elapsed_time": "3:40:24", "remaining_time": "9:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 4438, "loss": 0.1681, "learning_rate": 4.346266753384699e-06, "epoch": 0.27374883825724505, "percentage": 27.38, "elapsed_time": "3:40:35", "remaining_time": "9:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 4438, "loss": 0.1624, "learning_rate": 4.345010188554638e-06, "epoch": 0.27397414594305347, "percentage": 27.4, "elapsed_time": "3:40:47", "remaining_time": "9:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 4438, "loss": 0.1792, "learning_rate": 4.343752599259192e-06, "epoch": 0.2741994536288619, "percentage": 27.42, "elapsed_time": "3:40:59", "remaining_time": "9:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 4438, "loss": 0.168, "learning_rate": 4.34249398619665e-06, "epoch": 0.27442476131467036, "percentage": 27.44, "elapsed_time": "3:41:08", "remaining_time": "9:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 4438, "loss": 0.1812, "learning_rate": 4.341234350065876e-06, "epoch": 0.2746500690004788, "percentage": 27.47, "elapsed_time": "3:41:19", "remaining_time": "9:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 4438, "loss": 0.163, "learning_rate": 4.339973691566297e-06, "epoch": 0.2748753766862872, "percentage": 27.49, "elapsed_time": "3:41:31", "remaining_time": "9:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 4438, "loss": 0.1616, "learning_rate": 4.33871201139791e-06, "epoch": 0.2751006843720956, "percentage": 27.51, "elapsed_time": "3:41:42", "remaining_time": "9:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 4438, "loss": 0.1666, "learning_rate": 4.337449310261279e-06, "epoch": 0.2753259920579041, "percentage": 27.53, "elapsed_time": "3:41:52", "remaining_time": "9:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 4438, "loss": 0.1825, "learning_rate": 4.336185588857535e-06, "epoch": 0.2755512997437125, "percentage": 27.56, "elapsed_time": "3:42:02", "remaining_time": "9:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 4438, "loss": 0.1731, "learning_rate": 4.334920847888376e-06, "epoch": 0.2757766074295209, "percentage": 27.58, "elapsed_time": "3:42:14", "remaining_time": "9:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 4438, "loss": 0.1794, "learning_rate": 4.333655088056065e-06, "epoch": 0.2760019151153294, "percentage": 27.6, "elapsed_time": "3:42:24", "remaining_time": "9:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 4438, "loss": 0.1875, "learning_rate": 4.332388310063431e-06, "epoch": 0.2762272228011378, "percentage": 27.63, "elapsed_time": "3:42:36", "remaining_time": "9:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 4438, "loss": 0.1714, "learning_rate": 4.331120514613869e-06, "epoch": 0.27645253048694624, "percentage": 27.65, "elapsed_time": "3:42:47", "remaining_time": "9:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 4438, "loss": 0.1686, "learning_rate": 4.329851702411339e-06, "epoch": 0.27667783817275465, "percentage": 27.67, "elapsed_time": "3:42:59", "remaining_time": "9:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 4438, "loss": 0.1576, "learning_rate": 4.328581874160363e-06, "epoch": 0.2769031458585631, "percentage": 27.69, "elapsed_time": "3:43:10", "remaining_time": "9:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 4438, "loss": 0.1566, "learning_rate": 4.327311030566033e-06, "epoch": 0.27712845354437154, "percentage": 27.72, "elapsed_time": "3:43:21", "remaining_time": "9:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 4438, "loss": 0.1761, "learning_rate": 4.326039172333997e-06, "epoch": 0.27735376123017996, "percentage": 27.74, "elapsed_time": "3:43:32", "remaining_time": "9:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 4438, "loss": 0.1751, "learning_rate": 4.324766300170473e-06, "epoch": 0.2775790689159884, "percentage": 27.76, "elapsed_time": "3:43:42", "remaining_time": "9:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 4438, "loss": 0.1668, "learning_rate": 4.323492414782239e-06, "epoch": 0.27780437660179685, "percentage": 27.78, "elapsed_time": "3:43:51", "remaining_time": "9:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 4438, "loss": 0.1616, "learning_rate": 4.322217516876635e-06, "epoch": 0.27802968428760527, "percentage": 27.81, "elapsed_time": "3:44:02", "remaining_time": "9:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 4438, "loss": 0.1827, "learning_rate": 4.320941607161567e-06, "epoch": 0.2782549919734137, "percentage": 27.83, "elapsed_time": "3:44:12", "remaining_time": "9:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.3196646863454975e-06, "epoch": 0.2784802996592221, "percentage": 27.85, "elapsed_time": "3:44:21", "remaining_time": "9:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.3183867551374535e-06, "epoch": 0.2787056073450306, "percentage": 27.87, "elapsed_time": "3:44:33", "remaining_time": "9:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 4438, "loss": 0.19, "learning_rate": 4.317107814247022e-06, "epoch": 0.278930915030839, "percentage": 27.9, "elapsed_time": "3:44:44", "remaining_time": "9:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 4438, "loss": 0.1756, "learning_rate": 4.3158278643843544e-06, "epoch": 0.2791562227166474, "percentage": 27.92, "elapsed_time": "3:44:54", "remaining_time": "9:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 4438, "loss": 0.1715, "learning_rate": 4.314546906260156e-06, "epoch": 0.27938153040245584, "percentage": 27.94, "elapsed_time": "3:45:05", "remaining_time": "9:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 4438, "loss": 0.1773, "learning_rate": 4.313264940585695e-06, "epoch": 0.2796068380882643, "percentage": 27.96, "elapsed_time": "3:45:17", "remaining_time": "9:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 4438, "loss": 0.1588, "learning_rate": 4.3119819680728e-06, "epoch": 0.2798321457740727, "percentage": 27.99, "elapsed_time": "3:45:28", "remaining_time": "9:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 4438, "loss": 0.1772, "learning_rate": 4.310697989433858e-06, "epoch": 0.28005745345988114, "percentage": 28.01, "elapsed_time": "3:45:39", "remaining_time": "9:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 4438, "loss": 0.1654, "learning_rate": 4.3094130053818164e-06, "epoch": 0.28028276114568956, "percentage": 28.03, "elapsed_time": "3:45:50", "remaining_time": "9:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 4438, "loss": 0.1692, "learning_rate": 4.308127016630176e-06, "epoch": 0.28050806883149804, "percentage": 28.05, "elapsed_time": "3:46:02", "remaining_time": "9:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 4438, "loss": 0.1695, "learning_rate": 4.306840023892998e-06, "epoch": 0.28073337651730645, "percentage": 28.08, "elapsed_time": "3:46:12", "remaining_time": "9:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 4438, "loss": 0.1654, "learning_rate": 4.305552027884904e-06, "epoch": 0.2809586842031149, "percentage": 28.1, "elapsed_time": "3:46:22", "remaining_time": "9:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 4438, "loss": 0.1721, "learning_rate": 4.304263029321069e-06, "epoch": 0.2811839918889233, "percentage": 28.12, "elapsed_time": "3:46:33", "remaining_time": "9:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 4438, "loss": 0.1793, "learning_rate": 4.302973028917226e-06, "epoch": 0.28140929957473176, "percentage": 28.14, "elapsed_time": "3:46:43", "remaining_time": "9:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 4438, "loss": 0.1781, "learning_rate": 4.301682027389663e-06, "epoch": 0.2816346072605402, "percentage": 28.17, "elapsed_time": "3:46:54", "remaining_time": "9:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 4438, "loss": 0.1714, "learning_rate": 4.300390025455227e-06, "epoch": 0.2818599149463486, "percentage": 28.19, "elapsed_time": "3:47:06", "remaining_time": "9:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 4438, "loss": 0.1695, "learning_rate": 4.299097023831318e-06, "epoch": 0.282085222632157, "percentage": 28.21, "elapsed_time": "3:47:16", "remaining_time": "9:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 4438, "loss": 0.1714, "learning_rate": 4.2978030232358904e-06, "epoch": 0.2823105303179655, "percentage": 28.23, "elapsed_time": "3:47:27", "remaining_time": "9:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 4438, "loss": 0.1557, "learning_rate": 4.2965080243874555e-06, "epoch": 0.2825358380037739, "percentage": 28.26, "elapsed_time": "3:47:37", "remaining_time": "9:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 4438, "loss": 0.1786, "learning_rate": 4.295212028005078e-06, "epoch": 0.2827611456895823, "percentage": 28.28, "elapsed_time": "3:47:48", "remaining_time": "9:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 4438, "loss": 0.1552, "learning_rate": 4.293915034808376e-06, "epoch": 0.28298645337539075, "percentage": 28.3, "elapsed_time": "3:47:58", "remaining_time": "9:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 4438, "loss": 0.1617, "learning_rate": 4.292617045517521e-06, "epoch": 0.2832117610611992, "percentage": 28.32, "elapsed_time": "3:48:07", "remaining_time": "9:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 4438, "loss": 0.1494, "learning_rate": 4.29131806085324e-06, "epoch": 0.28343706874700764, "percentage": 28.35, "elapsed_time": "3:48:17", "remaining_time": "9:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 4438, "loss": 0.1676, "learning_rate": 4.290018081536807e-06, "epoch": 0.28366237643281605, "percentage": 28.37, "elapsed_time": "3:48:27", "remaining_time": "9:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 4438, "loss": 0.1651, "learning_rate": 4.288717108290056e-06, "epoch": 0.2838876841186245, "percentage": 28.39, "elapsed_time": "3:48:37", "remaining_time": "9:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 4438, "loss": 0.1821, "learning_rate": 4.287415141835368e-06, "epoch": 0.28411299180443295, "percentage": 28.41, "elapsed_time": "3:48:49", "remaining_time": "9:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 4438, "loss": 0.1663, "learning_rate": 4.2861121828956745e-06, "epoch": 0.28433829949024136, "percentage": 28.44, "elapsed_time": "3:49:00", "remaining_time": "9:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 4438, "loss": 0.182, "learning_rate": 4.284808232194462e-06, "epoch": 0.2845636071760498, "percentage": 28.46, "elapsed_time": "3:49:10", "remaining_time": "9:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 4438, "loss": 0.1675, "learning_rate": 4.283503290455765e-06, "epoch": 0.2847889148618582, "percentage": 28.48, "elapsed_time": "3:49:20", "remaining_time": "9:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 4438, "loss": 0.1678, "learning_rate": 4.28219735840417e-06, "epoch": 0.2850142225476667, "percentage": 28.5, "elapsed_time": "3:49:30", "remaining_time": "9:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 4438, "loss": 0.172, "learning_rate": 4.28089043676481e-06, "epoch": 0.2852395302334751, "percentage": 28.53, "elapsed_time": "3:49:42", "remaining_time": "9:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 4438, "loss": 0.1816, "learning_rate": 4.279582526263371e-06, "epoch": 0.2854648379192835, "percentage": 28.55, "elapsed_time": "3:49:52", "remaining_time": "9:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 4438, "loss": 0.1888, "learning_rate": 4.27827362762609e-06, "epoch": 0.2856901456050919, "percentage": 28.57, "elapsed_time": "3:50:02", "remaining_time": "9:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 4438, "loss": 0.1733, "learning_rate": 4.276963741579745e-06, "epoch": 0.2859154532909004, "percentage": 28.59, "elapsed_time": "3:50:13", "remaining_time": "9:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 4438, "loss": 0.1663, "learning_rate": 4.275652868851669e-06, "epoch": 0.2861407609767088, "percentage": 28.62, "elapsed_time": "3:50:25", "remaining_time": "9:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 4438, "loss": 0.1799, "learning_rate": 4.2743410101697405e-06, "epoch": 0.28636606866251724, "percentage": 28.64, "elapsed_time": "3:50:35", "remaining_time": "9:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 4438, "loss": 0.1786, "learning_rate": 4.2730281662623866e-06, "epoch": 0.28659137634832565, "percentage": 28.66, "elapsed_time": "3:50:45", "remaining_time": "9:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 4438, "loss": 0.1707, "learning_rate": 4.271714337858579e-06, "epoch": 0.28681668403413413, "percentage": 28.68, "elapsed_time": "3:50:56", "remaining_time": "9:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 4438, "loss": 0.1645, "learning_rate": 4.270399525687839e-06, "epoch": 0.28704199171994255, "percentage": 28.71, "elapsed_time": "3:51:06", "remaining_time": "9:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 4438, "loss": 0.1825, "learning_rate": 4.269083730480232e-06, "epoch": 0.28726729940575096, "percentage": 28.73, "elapsed_time": "3:51:17", "remaining_time": "9:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 4438, "loss": 0.1686, "learning_rate": 4.267766952966369e-06, "epoch": 0.28749260709155944, "percentage": 28.75, "elapsed_time": "3:51:27", "remaining_time": "9:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 4438, "loss": 0.1712, "learning_rate": 4.26644919387741e-06, "epoch": 0.28771791477736786, "percentage": 28.77, "elapsed_time": "3:51:39", "remaining_time": "9:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 4438, "loss": 0.1576, "learning_rate": 4.265130453945056e-06, "epoch": 0.2879432224631763, "percentage": 28.8, "elapsed_time": "3:51:49", "remaining_time": "9:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 4438, "loss": 0.1852, "learning_rate": 4.263810733901554e-06, "epoch": 0.2881685301489847, "percentage": 28.82, "elapsed_time": "3:52:00", "remaining_time": "9:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 4438, "loss": 0.1678, "learning_rate": 4.262490034479697e-06, "epoch": 0.28839383783479317, "percentage": 28.84, "elapsed_time": "3:52:11", "remaining_time": "9:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 4438, "loss": 0.1675, "learning_rate": 4.261168356412818e-06, "epoch": 0.2886191455206016, "percentage": 28.86, "elapsed_time": "3:52:22", "remaining_time": "9:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 4438, "loss": 0.1515, "learning_rate": 4.259845700434797e-06, "epoch": 0.28884445320641, "percentage": 28.89, "elapsed_time": "3:52:34", "remaining_time": "9:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.258522067280055e-06, "epoch": 0.2890697608922184, "percentage": 28.91, "elapsed_time": "3:52:44", "remaining_time": "9:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 4438, "loss": 0.1577, "learning_rate": 4.257197457683556e-06, "epoch": 0.2892950685780269, "percentage": 28.93, "elapsed_time": "3:52:55", "remaining_time": "9:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 4438, "loss": 0.1833, "learning_rate": 4.2558718723808055e-06, "epoch": 0.2895203762638353, "percentage": 28.95, "elapsed_time": "3:53:07", "remaining_time": "9:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.254545312107854e-06, "epoch": 0.28974568394964373, "percentage": 28.98, "elapsed_time": "3:53:16", "remaining_time": "9:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 4438, "loss": 0.186, "learning_rate": 4.253217777601289e-06, "epoch": 0.28997099163545215, "percentage": 29.0, "elapsed_time": "3:53:28", "remaining_time": "9:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 4438, "loss": 0.1875, "learning_rate": 4.251889269598241e-06, "epoch": 0.2901962993212606, "percentage": 29.02, "elapsed_time": "3:53:38", "remaining_time": "9:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.250559788836382e-06, "epoch": 0.29042160700706904, "percentage": 29.04, "elapsed_time": "3:53:49", "remaining_time": "9:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 4438, "loss": 0.1743, "learning_rate": 4.249229336053924e-06, "epoch": 0.29064691469287746, "percentage": 29.07, "elapsed_time": "3:54:01", "remaining_time": "9:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 4438, "loss": 0.1659, "learning_rate": 4.247897911989615e-06, "epoch": 0.2908722223786859, "percentage": 29.09, "elapsed_time": "3:54:10", "remaining_time": "9:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.2465655173827465e-06, "epoch": 0.29109753006449435, "percentage": 29.11, "elapsed_time": "3:54:20", "remaining_time": "9:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 4438, "loss": 0.1583, "learning_rate": 4.245232152973148e-06, "epoch": 0.29132283775030277, "percentage": 29.13, "elapsed_time": "3:54:31", "remaining_time": "9:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 4438, "loss": 0.1605, "learning_rate": 4.243897819501187e-06, "epoch": 0.2915481454361112, "percentage": 29.16, "elapsed_time": "3:54:39", "remaining_time": "9:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 4438, "loss": 0.1626, "learning_rate": 4.242562517707768e-06, "epoch": 0.2917734531219196, "percentage": 29.18, "elapsed_time": "3:54:50", "remaining_time": "9:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.241226248334335e-06, "epoch": 0.2919987608077281, "percentage": 29.2, "elapsed_time": "3:55:01", "remaining_time": "9:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 4438, "loss": 0.1516, "learning_rate": 4.23988901212287e-06, "epoch": 0.2922240684935365, "percentage": 29.22, "elapsed_time": "3:55:10", "remaining_time": "9:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 4438, "loss": 0.1558, "learning_rate": 4.238550809815889e-06, "epoch": 0.2924493761793449, "percentage": 29.25, "elapsed_time": "3:55:21", "remaining_time": "9:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 4438, "loss": 0.1585, "learning_rate": 4.237211642156446e-06, "epoch": 0.29267468386515333, "percentage": 29.27, "elapsed_time": "3:55:31", "remaining_time": "9:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 4438, "loss": 0.1652, "learning_rate": 4.23587150988813e-06, "epoch": 0.2928999915509618, "percentage": 29.29, "elapsed_time": "3:55:41", "remaining_time": "9:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 4438, "loss": 0.1854, "learning_rate": 4.234530413755069e-06, "epoch": 0.2931252992367702, "percentage": 29.32, "elapsed_time": "3:55:52", "remaining_time": "9:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 4438, "loss": 0.169, "learning_rate": 4.233188354501921e-06, "epoch": 0.29335060692257864, "percentage": 29.34, "elapsed_time": "3:56:03", "remaining_time": "9:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 4438, "loss": 0.1668, "learning_rate": 4.231845332873883e-06, "epoch": 0.29357591460838706, "percentage": 29.36, "elapsed_time": "3:56:13", "remaining_time": "9:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 4438, "loss": 0.1606, "learning_rate": 4.230501349616683e-06, "epoch": 0.29380122229419553, "percentage": 29.38, "elapsed_time": "3:56:23", "remaining_time": "9:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 4438, "loss": 0.1731, "learning_rate": 4.2291564054765876e-06, "epoch": 0.29402652998000395, "percentage": 29.41, "elapsed_time": "3:56:34", "remaining_time": "9:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 4438, "loss": 0.1695, "learning_rate": 4.227810501200393e-06, "epoch": 0.29425183766581237, "percentage": 29.43, "elapsed_time": "3:56:46", "remaining_time": "9:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 4438, "loss": 0.1849, "learning_rate": 4.226463637535429e-06, "epoch": 0.2944771453516208, "percentage": 29.45, "elapsed_time": "3:56:57", "remaining_time": "9:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 4438, "loss": 0.1741, "learning_rate": 4.225115815229559e-06, "epoch": 0.29470245303742926, "percentage": 29.47, "elapsed_time": "3:57:06", "remaining_time": "9:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 4438, "loss": 0.1684, "learning_rate": 4.22376703503118e-06, "epoch": 0.2949277607232377, "percentage": 29.5, "elapsed_time": "3:57:18", "remaining_time": "9:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 4438, "loss": 0.1472, "learning_rate": 4.222417297689217e-06, "epoch": 0.2951530684090461, "percentage": 29.52, "elapsed_time": "3:57:29", "remaining_time": "9:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 4438, "loss": 0.1762, "learning_rate": 4.22106660395313e-06, "epoch": 0.2953783760948545, "percentage": 29.54, "elapsed_time": "3:57:39", "remaining_time": "9:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.219714954572909e-06, "epoch": 0.295603683780663, "percentage": 29.56, "elapsed_time": "3:57:50", "remaining_time": "9:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 4438, "loss": 0.1776, "learning_rate": 4.218362350299075e-06, "epoch": 0.2958289914664714, "percentage": 29.59, "elapsed_time": "3:58:01", "remaining_time": "9:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 4438, "loss": 0.1911, "learning_rate": 4.217008791882678e-06, "epoch": 0.2960542991522798, "percentage": 29.61, "elapsed_time": "3:58:12", "remaining_time": "9:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 4438, "loss": 0.1732, "learning_rate": 4.215654280075297e-06, "epoch": 0.29627960683808824, "percentage": 29.63, "elapsed_time": "3:58:21", "remaining_time": "9:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 4438, "loss": 0.1741, "learning_rate": 4.214298815629046e-06, "epoch": 0.2965049145238967, "percentage": 29.65, "elapsed_time": "3:58:31", "remaining_time": "9:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 4438, "loss": 0.1566, "learning_rate": 4.212942399296559e-06, "epoch": 0.29673022220970513, "percentage": 29.68, "elapsed_time": "3:58:42", "remaining_time": "9:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 4438, "loss": 0.1834, "learning_rate": 4.211585031831007e-06, "epoch": 0.29695552989551355, "percentage": 29.7, "elapsed_time": "3:58:53", "remaining_time": "9:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 4438, "loss": 0.1691, "learning_rate": 4.210226713986085e-06, "epoch": 0.29718083758132197, "percentage": 29.72, "elapsed_time": "3:59:05", "remaining_time": "9:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 4438, "loss": 0.1615, "learning_rate": 4.208867446516015e-06, "epoch": 0.29740614526713044, "percentage": 29.74, "elapsed_time": "3:59:16", "remaining_time": "9:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 4438, "loss": 0.1595, "learning_rate": 4.2075072301755486e-06, "epoch": 0.29763145295293886, "percentage": 29.77, "elapsed_time": "3:59:25", "remaining_time": "9:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 4438, "loss": 0.1667, "learning_rate": 4.206146065719963e-06, "epoch": 0.2978567606387473, "percentage": 29.79, "elapsed_time": "3:59:35", "remaining_time": "9:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 4438, "loss": 0.1799, "learning_rate": 4.204783953905062e-06, "epoch": 0.29808206832455575, "percentage": 29.81, "elapsed_time": "3:59:46", "remaining_time": "9:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 4438, "loss": 0.163, "learning_rate": 4.203420895487175e-06, "epoch": 0.29830737601036417, "percentage": 29.83, "elapsed_time": "3:59:58", "remaining_time": "9:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 4438, "loss": 0.1671, "learning_rate": 4.202056891223159e-06, "epoch": 0.2985326836961726, "percentage": 29.86, "elapsed_time": "4:00:08", "remaining_time": "9:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 4438, "loss": 0.1627, "learning_rate": 4.200691941870392e-06, "epoch": 0.298757991381981, "percentage": 29.88, "elapsed_time": "4:00:17", "remaining_time": "9:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 4438, "loss": 0.1547, "learning_rate": 4.199326048186783e-06, "epoch": 0.2989832990677895, "percentage": 29.9, "elapsed_time": "4:00:28", "remaining_time": "9:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 4438, "loss": 0.1768, "learning_rate": 4.197959210930759e-06, "epoch": 0.2992086067535979, "percentage": 29.92, "elapsed_time": "4:00:38", "remaining_time": "9:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.196591430861275e-06, "epoch": 0.2994339144394063, "percentage": 29.95, "elapsed_time": "4:00:48", "remaining_time": "9:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 4438, "loss": 0.1685, "learning_rate": 4.195222708737809e-06, "epoch": 0.29965922212521473, "percentage": 29.97, "elapsed_time": "4:00:58", "remaining_time": "9:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 4438, "loss": 0.19, "learning_rate": 4.193853045320359e-06, "epoch": 0.2998845298110232, "percentage": 29.99, "elapsed_time": "4:01:08", "remaining_time": "9:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 4438, "loss": 0.1579, "learning_rate": 4.192482441369451e-06, "epoch": 0.3001098374968316, "percentage": 30.01, "elapsed_time": "4:01:19", "remaining_time": "9:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 4438, "loss": 0.1665, "learning_rate": 4.191110897646129e-06, "epoch": 0.30033514518264004, "percentage": 30.04, "elapsed_time": "4:01:30", "remaining_time": "9:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 4438, "loss": 0.174, "learning_rate": 4.189738414911959e-06, "epoch": 0.30056045286844846, "percentage": 30.06, "elapsed_time": "4:01:41", "remaining_time": "9:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 4438, "loss": 0.1852, "learning_rate": 4.188364993929032e-06, "epoch": 0.30078576055425693, "percentage": 30.08, "elapsed_time": "4:01:52", "remaining_time": "9:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 4438, "loss": 0.1708, "learning_rate": 4.186990635459954e-06, "epoch": 0.30101106824006535, "percentage": 30.1, "elapsed_time": "4:02:01", "remaining_time": "9:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.185615340267858e-06, "epoch": 0.30123637592587377, "percentage": 30.13, "elapsed_time": "4:02:13", "remaining_time": "9:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 4438, "loss": 0.1891, "learning_rate": 4.184239109116393e-06, "epoch": 0.3014616836116822, "percentage": 30.15, "elapsed_time": "4:02:24", "remaining_time": "9:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 4438, "loss": 0.1632, "learning_rate": 4.182861942769729e-06, "epoch": 0.30168699129749066, "percentage": 30.17, "elapsed_time": "4:02:35", "remaining_time": "9:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 4438, "loss": 0.1679, "learning_rate": 4.181483841992556e-06, "epoch": 0.3019122989832991, "percentage": 30.19, "elapsed_time": "4:02:45", "remaining_time": "9:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 4438, "loss": 0.1643, "learning_rate": 4.18010480755008e-06, "epoch": 0.3021376066691075, "percentage": 30.22, "elapsed_time": "4:02:55", "remaining_time": "9:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 4438, "loss": 0.1665, "learning_rate": 4.178724840208029e-06, "epoch": 0.3023629143549159, "percentage": 30.24, "elapsed_time": "4:03:06", "remaining_time": "9:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.1773439407326474e-06, "epoch": 0.3025882220407244, "percentage": 30.26, "elapsed_time": "4:03:17", "remaining_time": "9:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 4438, "loss": 0.1581, "learning_rate": 4.175962109890697e-06, "epoch": 0.3028135297265328, "percentage": 30.28, "elapsed_time": "4:03:26", "remaining_time": "9:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 4438, "loss": 0.1732, "learning_rate": 4.174579348449456e-06, "epoch": 0.3030388374123412, "percentage": 30.31, "elapsed_time": "4:03:37", "remaining_time": "9:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 4438, "loss": 0.1617, "learning_rate": 4.1731956571767215e-06, "epoch": 0.30326414509814964, "percentage": 30.33, "elapsed_time": "4:03:46", "remaining_time": "9:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 4438, "loss": 0.1617, "learning_rate": 4.171811036840805e-06, "epoch": 0.3034894527839581, "percentage": 30.35, "elapsed_time": "4:03:57", "remaining_time": "9:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 4438, "loss": 0.1727, "learning_rate": 4.170425488210534e-06, "epoch": 0.30371476046976653, "percentage": 30.37, "elapsed_time": "4:04:07", "remaining_time": "9:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 4438, "loss": 0.1637, "learning_rate": 4.169039012055255e-06, "epoch": 0.30394006815557495, "percentage": 30.4, "elapsed_time": "4:04:18", "remaining_time": "9:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 4438, "loss": 0.1671, "learning_rate": 4.167651609144822e-06, "epoch": 0.30416537584138337, "percentage": 30.42, "elapsed_time": "4:04:29", "remaining_time": "9:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 4438, "loss": 0.1678, "learning_rate": 4.166263280249613e-06, "epoch": 0.30439068352719184, "percentage": 30.44, "elapsed_time": "4:04:39", "remaining_time": "9:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 4438, "loss": 0.1624, "learning_rate": 4.164874026140511e-06, "epoch": 0.30461599121300026, "percentage": 30.46, "elapsed_time": "4:04:49", "remaining_time": "9:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 4438, "loss": 0.155, "learning_rate": 4.163483847588919e-06, "epoch": 0.3048412988988087, "percentage": 30.49, "elapsed_time": "4:05:02", "remaining_time": "9:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 4438, "loss": 0.1693, "learning_rate": 4.1620927453667515e-06, "epoch": 0.3050666065846171, "percentage": 30.51, "elapsed_time": "4:05:12", "remaining_time": "9:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 4438, "loss": 0.1571, "learning_rate": 4.160700720246435e-06, "epoch": 0.30529191427042557, "percentage": 30.53, "elapsed_time": "4:05:23", "remaining_time": "9:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 4438, "loss": 0.1539, "learning_rate": 4.159307773000909e-06, "epoch": 0.305517221956234, "percentage": 30.55, "elapsed_time": "4:05:32", "remaining_time": "9:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 4438, "loss": 0.1651, "learning_rate": 4.1579139044036265e-06, "epoch": 0.3057425296420424, "percentage": 30.58, "elapsed_time": "4:05:42", "remaining_time": "9:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 4438, "loss": 0.1637, "learning_rate": 4.15651911522855e-06, "epoch": 0.3059678373278508, "percentage": 30.6, "elapsed_time": "4:05:53", "remaining_time": "9:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 4438, "loss": 0.1837, "learning_rate": 4.155123406250153e-06, "epoch": 0.3061931450136593, "percentage": 30.62, "elapsed_time": "4:06:03", "remaining_time": "9:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 4438, "loss": 0.1649, "learning_rate": 4.153726778243422e-06, "epoch": 0.3064184526994677, "percentage": 30.64, "elapsed_time": "4:06:13", "remaining_time": "9:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 4438, "loss": 0.1747, "learning_rate": 4.152329231983852e-06, "epoch": 0.30664376038527613, "percentage": 30.67, "elapsed_time": "4:06:23", "remaining_time": "9:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 4438, "loss": 0.1777, "learning_rate": 4.150930768247449e-06, "epoch": 0.30686906807108455, "percentage": 30.69, "elapsed_time": "4:06:34", "remaining_time": "9:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 4438, "loss": 0.1713, "learning_rate": 4.149531387810727e-06, "epoch": 0.307094375756893, "percentage": 30.71, "elapsed_time": "4:06:44", "remaining_time": "9:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 4438, "loss": 0.159, "learning_rate": 4.148131091450709e-06, "epoch": 0.30731968344270144, "percentage": 30.73, "elapsed_time": "4:06:53", "remaining_time": "9:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 4438, "loss": 0.1505, "learning_rate": 4.14672987994493e-06, "epoch": 0.30754499112850986, "percentage": 30.76, "elapsed_time": "4:07:04", "remaining_time": "9:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 4438, "loss": 0.1766, "learning_rate": 4.145327754071427e-06, "epoch": 0.3077702988143183, "percentage": 30.78, "elapsed_time": "4:07:15", "remaining_time": "9:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 4438, "loss": 0.1758, "learning_rate": 4.1439247146087515e-06, "epoch": 0.30799560650012675, "percentage": 30.8, "elapsed_time": "4:07:25", "remaining_time": "9:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 4438, "loss": 0.1514, "learning_rate": 4.142520762335957e-06, "epoch": 0.30822091418593517, "percentage": 30.82, "elapsed_time": "4:07:36", "remaining_time": "9:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 4438, "loss": 0.1632, "learning_rate": 4.141115898032607e-06, "epoch": 0.3084462218717436, "percentage": 30.85, "elapsed_time": "4:07:47", "remaining_time": "9:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 4438, "loss": 0.1613, "learning_rate": 4.13971012247877e-06, "epoch": 0.308671529557552, "percentage": 30.87, "elapsed_time": "4:07:57", "remaining_time": "9:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 4438, "loss": 0.1739, "learning_rate": 4.138303436455019e-06, "epoch": 0.3088968372433605, "percentage": 30.89, "elapsed_time": "4:08:08", "remaining_time": "9:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 4438, "loss": 0.1711, "learning_rate": 4.136895840742437e-06, "epoch": 0.3091221449291689, "percentage": 30.91, "elapsed_time": "4:08:18", "remaining_time": "9:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 4438, "loss": 0.1606, "learning_rate": 4.1354873361226074e-06, "epoch": 0.3093474526149773, "percentage": 30.94, "elapsed_time": "4:08:28", "remaining_time": "9:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 4438, "loss": 0.166, "learning_rate": 4.134077923377622e-06, "epoch": 0.3095727603007858, "percentage": 30.96, "elapsed_time": "4:08:39", "remaining_time": "9:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 4438, "loss": 0.1765, "learning_rate": 4.132667603290075e-06, "epoch": 0.3097980679865942, "percentage": 30.98, "elapsed_time": "4:08:50", "remaining_time": "9:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 4438, "loss": 0.1889, "learning_rate": 4.131256376643062e-06, "epoch": 0.3100233756724026, "percentage": 31.0, "elapsed_time": "4:09:00", "remaining_time": "9:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 4438, "loss": 0.1607, "learning_rate": 4.129844244220188e-06, "epoch": 0.31024868335821104, "percentage": 31.03, "elapsed_time": "4:09:11", "remaining_time": "9:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 4438, "loss": 0.1576, "learning_rate": 4.128431206805556e-06, "epoch": 0.3104739910440195, "percentage": 31.05, "elapsed_time": "4:09:22", "remaining_time": "9:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 4438, "loss": 0.1582, "learning_rate": 4.127017265183772e-06, "epoch": 0.31069929872982793, "percentage": 31.07, "elapsed_time": "4:09:32", "remaining_time": "9:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 4438, "loss": 0.1773, "learning_rate": 4.125602420139947e-06, "epoch": 0.31092460641563635, "percentage": 31.1, "elapsed_time": "4:09:43", "remaining_time": "9:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 4438, "loss": 0.1533, "learning_rate": 4.124186672459691e-06, "epoch": 0.31114991410144477, "percentage": 31.12, "elapsed_time": "4:09:53", "remaining_time": "9:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 4438, "loss": 0.1701, "learning_rate": 4.122770022929114e-06, "epoch": 0.31137522178725324, "percentage": 31.14, "elapsed_time": "4:10:05", "remaining_time": "9:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 4438, "loss": 0.1686, "learning_rate": 4.121352472334832e-06, "epoch": 0.31160052947306166, "percentage": 31.16, "elapsed_time": "4:10:14", "remaining_time": "9:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 4438, "loss": 0.171, "learning_rate": 4.119934021463956e-06, "epoch": 0.3118258371588701, "percentage": 31.19, "elapsed_time": "4:10:25", "remaining_time": "9:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 4438, "loss": 0.1693, "learning_rate": 4.1185146711040995e-06, "epoch": 0.3120511448446785, "percentage": 31.21, "elapsed_time": "4:10:36", "remaining_time": "9:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 4438, "loss": 0.1759, "learning_rate": 4.117094422043374e-06, "epoch": 0.31227645253048697, "percentage": 31.23, "elapsed_time": "4:10:48", "remaining_time": "9:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 4438, "loss": 0.1684, "learning_rate": 4.115673275070392e-06, "epoch": 0.3125017602162954, "percentage": 31.25, "elapsed_time": "4:10:57", "remaining_time": "9:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 4438, "loss": 0.1653, "learning_rate": 4.114251230974263e-06, "epoch": 0.3127270679021038, "percentage": 31.28, "elapsed_time": "4:11:07", "remaining_time": "9:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 4438, "loss": 0.1784, "learning_rate": 4.1128282905445945e-06, "epoch": 0.3129523755879122, "percentage": 31.3, "elapsed_time": "4:11:17", "remaining_time": "9:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 4438, "loss": 0.1776, "learning_rate": 4.1114044545714935e-06, "epoch": 0.3131776832737207, "percentage": 31.32, "elapsed_time": "4:11:28", "remaining_time": "9:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 4438, "loss": 0.1731, "learning_rate": 4.1099797238455615e-06, "epoch": 0.3134029909595291, "percentage": 31.34, "elapsed_time": "4:11:38", "remaining_time": "9:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 4438, "loss": 0.1582, "learning_rate": 4.1085540991579e-06, "epoch": 0.31362829864533753, "percentage": 31.37, "elapsed_time": "4:11:49", "remaining_time": "9:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 4438, "loss": 0.1873, "learning_rate": 4.107127581300105e-06, "epoch": 0.31385360633114595, "percentage": 31.39, "elapsed_time": "4:12:01", "remaining_time": "9:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 4438, "loss": 0.1669, "learning_rate": 4.105700171064267e-06, "epoch": 0.3140789140169544, "percentage": 31.41, "elapsed_time": "4:12:13", "remaining_time": "9:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 4438, "loss": 0.1613, "learning_rate": 4.104271869242975e-06, "epoch": 0.31430422170276284, "percentage": 31.43, "elapsed_time": "4:12:24", "remaining_time": "9:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 4438, "loss": 0.1806, "learning_rate": 4.102842676629313e-06, "epoch": 0.31452952938857126, "percentage": 31.46, "elapsed_time": "4:12:35", "remaining_time": "9:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.101412594016855e-06, "epoch": 0.3147548370743797, "percentage": 31.48, "elapsed_time": "4:12:46", "remaining_time": "9:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 4438, "loss": 0.1588, "learning_rate": 4.0999816221996755e-06, "epoch": 0.31498014476018815, "percentage": 31.5, "elapsed_time": "4:12:56", "remaining_time": "9:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 4438, "loss": 0.1696, "learning_rate": 4.098549761972339e-06, "epoch": 0.31520545244599657, "percentage": 31.52, "elapsed_time": "4:13:06", "remaining_time": "9:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.097117014129903e-06, "epoch": 0.315430760131805, "percentage": 31.55, "elapsed_time": "4:13:18", "remaining_time": "9:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 4438, "loss": 0.1762, "learning_rate": 4.095683379467922e-06, "epoch": 0.3156560678176134, "percentage": 31.57, "elapsed_time": "4:13:30", "remaining_time": "9:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 4438, "loss": 0.173, "learning_rate": 4.094248858782436e-06, "epoch": 0.3158813755034219, "percentage": 31.59, "elapsed_time": "4:13:40", "remaining_time": "9:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 4438, "loss": 0.1774, "learning_rate": 4.092813452869983e-06, "epoch": 0.3161066831892303, "percentage": 31.61, "elapsed_time": "4:13:51", "remaining_time": "9:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 4438, "loss": 0.1744, "learning_rate": 4.091377162527592e-06, "epoch": 0.3163319908750387, "percentage": 31.64, "elapsed_time": "4:14:02", "remaining_time": "9:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 4438, "loss": 0.1728, "learning_rate": 4.089939988552778e-06, "epoch": 0.31655729856084713, "percentage": 31.66, "elapsed_time": "4:14:13", "remaining_time": "9:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 4438, "loss": 0.1872, "learning_rate": 4.088501931743551e-06, "epoch": 0.3167826062466556, "percentage": 31.68, "elapsed_time": "4:14:26", "remaining_time": "9:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 4438, "loss": 0.1615, "learning_rate": 4.087062992898413e-06, "epoch": 0.317007913932464, "percentage": 31.7, "elapsed_time": "4:14:36", "remaining_time": "9:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 4438, "loss": 0.1758, "learning_rate": 4.08562317281635e-06, "epoch": 0.31723322161827244, "percentage": 31.73, "elapsed_time": "4:14:46", "remaining_time": "9:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 4438, "loss": 0.1715, "learning_rate": 4.084182472296842e-06, "epoch": 0.31745852930408086, "percentage": 31.75, "elapsed_time": "4:14:57", "remaining_time": "9:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 4438, "loss": 0.1721, "learning_rate": 4.082740892139856e-06, "epoch": 0.31768383698988933, "percentage": 31.77, "elapsed_time": "4:15:08", "remaining_time": "9:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 4438, "loss": 0.1602, "learning_rate": 4.081298433145847e-06, "epoch": 0.31790914467569775, "percentage": 31.79, "elapsed_time": "4:15:18", "remaining_time": "9:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 4438, "loss": 0.1729, "learning_rate": 4.07985509611576e-06, "epoch": 0.31813445236150617, "percentage": 31.82, "elapsed_time": "4:15:30", "remaining_time": "9:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 4438, "loss": 0.1671, "learning_rate": 4.078410881851026e-06, "epoch": 0.3183597600473146, "percentage": 31.84, "elapsed_time": "4:15:41", "remaining_time": "9:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 4438, "loss": 0.1667, "learning_rate": 4.076965791153562e-06, "epoch": 0.31858506773312306, "percentage": 31.86, "elapsed_time": "4:15:51", "remaining_time": "9:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 4438, "loss": 0.1836, "learning_rate": 4.075519824825775e-06, "epoch": 0.3188103754189315, "percentage": 31.88, "elapsed_time": "4:16:02", "remaining_time": "9:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 4438, "loss": 0.17, "learning_rate": 4.074072983670555e-06, "epoch": 0.3190356831047399, "percentage": 31.91, "elapsed_time": "4:16:13", "remaining_time": "9:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 4438, "loss": 0.1778, "learning_rate": 4.072625268491279e-06, "epoch": 0.3192609907905483, "percentage": 31.93, "elapsed_time": "4:16:22", "remaining_time": "9:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 4438, "loss": 0.1874, "learning_rate": 4.071176680091809e-06, "epoch": 0.3194862984763568, "percentage": 31.95, "elapsed_time": "4:16:32", "remaining_time": "9:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 4438, "loss": 0.1558, "learning_rate": 4.069727219276493e-06, "epoch": 0.3197116061621652, "percentage": 31.97, "elapsed_time": "4:16:44", "remaining_time": "9:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 4438, "loss": 0.1568, "learning_rate": 4.068276886850162e-06, "epoch": 0.3199369138479736, "percentage": 32.0, "elapsed_time": "4:16:54", "remaining_time": "9:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 4438, "loss": 0.1524, "learning_rate": 4.066825683618132e-06, "epoch": 0.3201622215337821, "percentage": 32.02, "elapsed_time": "4:17:04", "remaining_time": "9:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 4438, "loss": 0.1878, "learning_rate": 4.065373610386201e-06, "epoch": 0.3203875292195905, "percentage": 32.04, "elapsed_time": "4:17:16", "remaining_time": "9:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 4438, "loss": 0.1674, "learning_rate": 4.063920667960652e-06, "epoch": 0.32061283690539893, "percentage": 32.06, "elapsed_time": "4:17:27", "remaining_time": "9:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 4438, "loss": 0.1678, "learning_rate": 4.06246685714825e-06, "epoch": 0.32083814459120735, "percentage": 32.09, "elapsed_time": "4:17:38", "remaining_time": "9:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 4438, "loss": 0.1647, "learning_rate": 4.061012178756242e-06, "epoch": 0.3210634522770158, "percentage": 32.11, "elapsed_time": "4:17:48", "remaining_time": "9:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 4438, "loss": 0.1592, "learning_rate": 4.059556633592356e-06, "epoch": 0.32128875996282424, "percentage": 32.13, "elapsed_time": "4:17:59", "remaining_time": "9:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 4438, "loss": 0.1689, "learning_rate": 4.058100222464802e-06, "epoch": 0.32151406764863266, "percentage": 32.15, "elapsed_time": "4:18:09", "remaining_time": "9:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 4438, "loss": 0.1528, "learning_rate": 4.056642946182271e-06, "epoch": 0.3217393753344411, "percentage": 32.18, "elapsed_time": "4:18:20", "remaining_time": "9:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 4438, "loss": 0.1614, "learning_rate": 4.0551848055539345e-06, "epoch": 0.32196468302024955, "percentage": 32.2, "elapsed_time": "4:18:29", "remaining_time": "9:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 4438, "loss": 0.1737, "learning_rate": 4.0537258013894434e-06, "epoch": 0.32218999070605797, "percentage": 32.22, "elapsed_time": "4:18:41", "remaining_time": "9:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 4438, "loss": 0.1705, "learning_rate": 4.052265934498929e-06, "epoch": 0.3224152983918664, "percentage": 32.24, "elapsed_time": "4:18:51", "remaining_time": "9:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 4438, "loss": 0.1573, "learning_rate": 4.0508052056929995e-06, "epoch": 0.3226406060776748, "percentage": 32.27, "elapsed_time": "4:19:00", "remaining_time": "9:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 4438, "loss": 0.1609, "learning_rate": 4.049343615782744e-06, "epoch": 0.3228659137634833, "percentage": 32.29, "elapsed_time": "4:19:12", "remaining_time": "9:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 4438, "loss": 0.1734, "learning_rate": 4.047881165579729e-06, "epoch": 0.3230912214492917, "percentage": 32.31, "elapsed_time": "4:19:21", "remaining_time": "9:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 4438, "loss": 0.1648, "learning_rate": 4.046417855895999e-06, "epoch": 0.3233165291351001, "percentage": 32.33, "elapsed_time": "4:19:32", "remaining_time": "9:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 4438, "loss": 0.1674, "learning_rate": 4.044953687544074e-06, "epoch": 0.32354183682090853, "percentage": 32.36, "elapsed_time": "4:19:43", "remaining_time": "9:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 4438, "loss": 0.1494, "learning_rate": 4.043488661336953e-06, "epoch": 0.323767144506717, "percentage": 32.38, "elapsed_time": "4:19:53", "remaining_time": "9:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 4438, "loss": 0.1601, "learning_rate": 4.042022778088111e-06, "epoch": 0.3239924521925254, "percentage": 32.4, "elapsed_time": "4:20:03", "remaining_time": "9:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 4438, "loss": 0.1774, "learning_rate": 4.0405560386114975e-06, "epoch": 0.32421775987833384, "percentage": 32.42, "elapsed_time": "4:20:14", "remaining_time": "9:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 4438, "loss": 0.1444, "learning_rate": 4.039088443721538e-06, "epoch": 0.32444306756414226, "percentage": 32.45, "elapsed_time": "4:20:26", "remaining_time": "9:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 4438, "loss": 0.163, "learning_rate": 4.0376199942331335e-06, "epoch": 0.32466837524995074, "percentage": 32.47, "elapsed_time": "4:20:37", "remaining_time": "9:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 4438, "loss": 0.167, "learning_rate": 4.03615069096166e-06, "epoch": 0.32489368293575915, "percentage": 32.49, "elapsed_time": "4:20:47", "remaining_time": "9:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 4438, "loss": 0.1704, "learning_rate": 4.034680534722966e-06, "epoch": 0.32511899062156757, "percentage": 32.51, "elapsed_time": "4:20:57", "remaining_time": "9:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 4438, "loss": 0.1621, "learning_rate": 4.033209526333375e-06, "epoch": 0.325344298307376, "percentage": 32.54, "elapsed_time": "4:21:08", "remaining_time": "9:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 4438, "loss": 0.1791, "learning_rate": 4.0317376666096815e-06, "epoch": 0.32556960599318446, "percentage": 32.56, "elapsed_time": "4:21:18", "remaining_time": "9:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 4438, "loss": 0.1642, "learning_rate": 4.030264956369158e-06, "epoch": 0.3257949136789929, "percentage": 32.58, "elapsed_time": "4:21:28", "remaining_time": "9:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 4438, "loss": 0.1675, "learning_rate": 4.028791396429541e-06, "epoch": 0.3260202213648013, "percentage": 32.6, "elapsed_time": "4:21:39", "remaining_time": "9:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 4438, "loss": 0.1735, "learning_rate": 4.0273169876090475e-06, "epoch": 0.3262455290506097, "percentage": 32.63, "elapsed_time": "4:21:50", "remaining_time": "9:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 4438, "loss": 0.1563, "learning_rate": 4.02584173072636e-06, "epoch": 0.3264708367364182, "percentage": 32.65, "elapsed_time": "4:22:01", "remaining_time": "9:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 4438, "loss": 0.1555, "learning_rate": 4.024365626600632e-06, "epoch": 0.3266961444222266, "percentage": 32.67, "elapsed_time": "4:22:11", "remaining_time": "9:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 4438, "loss": 0.1667, "learning_rate": 4.022888676051492e-06, "epoch": 0.326921452108035, "percentage": 32.69, "elapsed_time": "4:22:24", "remaining_time": "9:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 4438, "loss": 0.1695, "learning_rate": 4.021410879899035e-06, "epoch": 0.32714675979384344, "percentage": 32.72, "elapsed_time": "4:22:34", "remaining_time": "8:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 4438, "loss": 0.1642, "learning_rate": 4.019932238963824e-06, "epoch": 0.3273720674796519, "percentage": 32.74, "elapsed_time": "4:22:46", "remaining_time": "8:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 4438, "loss": 0.1667, "learning_rate": 4.018452754066895e-06, "epoch": 0.32759737516546034, "percentage": 32.76, "elapsed_time": "4:22:56", "remaining_time": "8:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 4438, "loss": 0.1605, "learning_rate": 4.016972426029751e-06, "epoch": 0.32782268285126875, "percentage": 32.79, "elapsed_time": "4:23:07", "remaining_time": "8:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 4438, "loss": 0.1486, "learning_rate": 4.015491255674362e-06, "epoch": 0.32804799053707717, "percentage": 32.81, "elapsed_time": "4:23:18", "remaining_time": "8:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 4438, "loss": 0.1771, "learning_rate": 4.014009243823167e-06, "epoch": 0.32827329822288565, "percentage": 32.83, "elapsed_time": "4:23:27", "remaining_time": "8:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 4438, "loss": 0.1639, "learning_rate": 4.012526391299073e-06, "epoch": 0.32849860590869406, "percentage": 32.85, "elapsed_time": "4:23:38", "remaining_time": "8:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 4438, "loss": 0.1729, "learning_rate": 4.01104269892545e-06, "epoch": 0.3287239135945025, "percentage": 32.88, "elapsed_time": "4:23:49", "remaining_time": "8:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 4438, "loss": 0.1605, "learning_rate": 4.0095581675261405e-06, "epoch": 0.3289492212803109, "percentage": 32.9, "elapsed_time": "4:23:58", "remaining_time": "8:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 4438, "loss": 0.1731, "learning_rate": 4.008072797925447e-06, "epoch": 0.3291745289661194, "percentage": 32.92, "elapsed_time": "4:24:10", "remaining_time": "8:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 4438, "loss": 0.1583, "learning_rate": 4.006586590948141e-06, "epoch": 0.3293998366519278, "percentage": 32.94, "elapsed_time": "4:24:21", "remaining_time": "8:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 4438, "loss": 0.1839, "learning_rate": 4.005099547419458e-06, "epoch": 0.3296251443377362, "percentage": 32.97, "elapsed_time": "4:24:31", "remaining_time": "8:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 4438, "loss": 0.1689, "learning_rate": 4.003611668165097e-06, "epoch": 0.3298504520235446, "percentage": 32.99, "elapsed_time": "4:24:42", "remaining_time": "8:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 4438, "loss": 0.1656, "learning_rate": 4.0021229540112226e-06, "epoch": 0.3300757597093531, "percentage": 33.01, "elapsed_time": "4:24:52", "remaining_time": "8:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 4438, "loss": 0.1709, "learning_rate": 4.000633405784461e-06, "epoch": 0.3303010673951615, "percentage": 33.03, "elapsed_time": "4:25:03", "remaining_time": "8:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 4438, "loss": 0.1677, "learning_rate": 3.999143024311904e-06, "epoch": 0.33052637508096994, "percentage": 33.06, "elapsed_time": "4:25:14", "remaining_time": "8:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 4438, "loss": 0.1729, "learning_rate": 3.997651810421106e-06, "epoch": 0.33075168276677835, "percentage": 33.08, "elapsed_time": "4:25:24", "remaining_time": "8:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 4438, "loss": 0.166, "learning_rate": 3.99615976494008e-06, "epoch": 0.33097699045258683, "percentage": 33.1, "elapsed_time": "4:25:34", "remaining_time": "8:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 4438, "loss": 0.1855, "learning_rate": 3.994666888697304e-06, "epoch": 0.33120229813839525, "percentage": 33.12, "elapsed_time": "4:25:46", "remaining_time": "8:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 4438, "loss": 0.1603, "learning_rate": 3.993173182521718e-06, "epoch": 0.33142760582420366, "percentage": 33.15, "elapsed_time": "4:25:57", "remaining_time": "8:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 4438, "loss": 0.1749, "learning_rate": 3.991678647242719e-06, "epoch": 0.33165291351001214, "percentage": 33.17, "elapsed_time": "4:26:09", "remaining_time": "8:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 4438, "loss": 0.1619, "learning_rate": 3.990183283690169e-06, "epoch": 0.33187822119582056, "percentage": 33.19, "elapsed_time": "4:26:19", "remaining_time": "8:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 4438, "loss": 0.1623, "learning_rate": 3.988687092694386e-06, "epoch": 0.332103528881629, "percentage": 33.21, "elapsed_time": "4:26:30", "remaining_time": "8:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 4438, "loss": 0.1744, "learning_rate": 3.98719007508615e-06, "epoch": 0.3323288365674374, "percentage": 33.24, "elapsed_time": "4:26:41", "remaining_time": "8:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 4438, "loss": 0.1669, "learning_rate": 3.985692231696699e-06, "epoch": 0.33255414425324586, "percentage": 33.26, "elapsed_time": "4:26:52", "remaining_time": "8:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 4438, "loss": 0.1681, "learning_rate": 3.98419356335773e-06, "epoch": 0.3327794519390543, "percentage": 33.28, "elapsed_time": "4:27:04", "remaining_time": "8:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 4438, "loss": 0.1712, "learning_rate": 3.982694070901396e-06, "epoch": 0.3330047596248627, "percentage": 33.3, "elapsed_time": "4:27:14", "remaining_time": "8:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 4438, "loss": 0.1667, "learning_rate": 3.981193755160311e-06, "epoch": 0.3332300673106711, "percentage": 33.33, "elapsed_time": "4:27:25", "remaining_time": "8:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 4438, "loss": 0.1908, "learning_rate": 3.979692616967543e-06, "epoch": 0.3334553749964796, "percentage": 33.35, "elapsed_time": "4:27:36", "remaining_time": "8:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 4438, "loss": 0.1643, "learning_rate": 3.9781906571566195e-06, "epoch": 0.333680682682288, "percentage": 33.37, "elapsed_time": "4:27:48", "remaining_time": "8:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 4438, "loss": 0.1768, "learning_rate": 3.976687876561523e-06, "epoch": 0.33390599036809643, "percentage": 33.39, "elapsed_time": "4:28:00", "remaining_time": "8:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 4438, "loss": 0.1689, "learning_rate": 3.975184276016689e-06, "epoch": 0.33413129805390485, "percentage": 33.42, "elapsed_time": "4:28:10", "remaining_time": "8:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 4438, "loss": 0.1543, "learning_rate": 3.973679856357014e-06, "epoch": 0.3343566057397133, "percentage": 33.44, "elapsed_time": "4:28:20", "remaining_time": "8:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 4438, "loss": 0.1624, "learning_rate": 3.972174618417843e-06, "epoch": 0.33458191342552174, "percentage": 33.46, "elapsed_time": "4:28:33", "remaining_time": "8:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 4438, "loss": 0.1765, "learning_rate": 3.970668563034982e-06, "epoch": 0.33480722111133016, "percentage": 33.48, "elapsed_time": "4:28:44", "remaining_time": "8:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 4438, "loss": 0.1692, "learning_rate": 3.9691616910446845e-06, "epoch": 0.3350325287971386, "percentage": 33.51, "elapsed_time": "4:28:54", "remaining_time": "8:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 4438, "loss": 0.172, "learning_rate": 3.967654003283662e-06, "epoch": 0.33525783648294705, "percentage": 33.53, "elapsed_time": "4:29:04", "remaining_time": "8:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 4438, "loss": 0.1802, "learning_rate": 3.966145500589076e-06, "epoch": 0.33548314416875546, "percentage": 33.55, "elapsed_time": "4:29:16", "remaining_time": "8:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 4438, "loss": 0.1791, "learning_rate": 3.9646361837985435e-06, "epoch": 0.3357084518545639, "percentage": 33.57, "elapsed_time": "4:29:27", "remaining_time": "8:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 4438, "loss": 0.1557, "learning_rate": 3.9631260537501304e-06, "epoch": 0.3359337595403723, "percentage": 33.6, "elapsed_time": "4:29:38", "remaining_time": "8:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 4438, "loss": 0.1743, "learning_rate": 3.961615111282357e-06, "epoch": 0.3361590672261808, "percentage": 33.62, "elapsed_time": "4:29:49", "remaining_time": "8:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 4438, "loss": 0.1674, "learning_rate": 3.960103357234192e-06, "epoch": 0.3363843749119892, "percentage": 33.64, "elapsed_time": "4:29:58", "remaining_time": "8:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 4438, "loss": 0.181, "learning_rate": 3.958590792445057e-06, "epoch": 0.3366096825977976, "percentage": 33.66, "elapsed_time": "4:30:09", "remaining_time": "8:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 4438, "loss": 0.1619, "learning_rate": 3.957077417754822e-06, "epoch": 0.33683499028360603, "percentage": 33.69, "elapsed_time": "4:30:21", "remaining_time": "8:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 4438, "loss": 0.1776, "learning_rate": 3.9555632340038075e-06, "epoch": 0.3370602979694145, "percentage": 33.71, "elapsed_time": "4:30:31", "remaining_time": "8:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 4438, "loss": 0.1695, "learning_rate": 3.9540482420327845e-06, "epoch": 0.3372856056552229, "percentage": 33.73, "elapsed_time": "4:30:42", "remaining_time": "8:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 4438, "loss": 0.1666, "learning_rate": 3.9525324426829716e-06, "epoch": 0.33751091334103134, "percentage": 33.75, "elapsed_time": "4:30:51", "remaining_time": "8:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 4438, "loss": 0.1507, "learning_rate": 3.951015836796034e-06, "epoch": 0.33773622102683976, "percentage": 33.78, "elapsed_time": "4:31:00", "remaining_time": "8:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 4438, "loss": 0.1532, "learning_rate": 3.949498425214088e-06, "epoch": 0.33796152871264823, "percentage": 33.8, "elapsed_time": "4:31:11", "remaining_time": "8:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 4438, "eval_loss": 0.1660395711660385, "epoch": 0.33796152871264823, "percentage": 33.8, "elapsed_time": "4:33:14", "remaining_time": "8:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 4438, "loss": 0.1635, "learning_rate": 3.947980208779693e-06, "epoch": 0.33818683639845665, "percentage": 33.82, "elapsed_time": "4:33:25", "remaining_time": "8:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 4438, "loss": 0.1856, "learning_rate": 3.946461188335863e-06, "epoch": 0.33841214408426507, "percentage": 33.84, "elapsed_time": "4:33:38", "remaining_time": "8:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 4438, "loss": 0.1904, "learning_rate": 3.944941364726049e-06, "epoch": 0.3386374517700735, "percentage": 33.87, "elapsed_time": "4:33:48", "remaining_time": "8:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 4438, "loss": 0.1608, "learning_rate": 3.943420738794153e-06, "epoch": 0.33886275945588196, "percentage": 33.89, "elapsed_time": "4:33:59", "remaining_time": "8:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 4438, "loss": 0.1806, "learning_rate": 3.941899311384525e-06, "epoch": 0.3390880671416904, "percentage": 33.91, "elapsed_time": "4:34:10", "remaining_time": "8:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 4438, "loss": 0.1697, "learning_rate": 3.9403770833419535e-06, "epoch": 0.3393133748274988, "percentage": 33.93, "elapsed_time": "4:34:22", "remaining_time": "8:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 4438, "loss": 0.1528, "learning_rate": 3.938854055511676e-06, "epoch": 0.3395386825133072, "percentage": 33.96, "elapsed_time": "4:34:31", "remaining_time": "8:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 4438, "loss": 0.1641, "learning_rate": 3.937330228739374e-06, "epoch": 0.3397639901991157, "percentage": 33.98, "elapsed_time": "4:34:42", "remaining_time": "8:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 4438, "loss": 0.1736, "learning_rate": 3.9358056038711714e-06, "epoch": 0.3399892978849241, "percentage": 34.0, "elapsed_time": "4:34:53", "remaining_time": "8:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 4438, "loss": 0.1693, "learning_rate": 3.934280181753634e-06, "epoch": 0.3402146055707325, "percentage": 34.02, "elapsed_time": "4:35:03", "remaining_time": "8:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 4438, "loss": 0.1463, "learning_rate": 3.932753963233773e-06, "epoch": 0.34043991325654094, "percentage": 34.05, "elapsed_time": "4:35:12", "remaining_time": "8:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 4438, "loss": 0.1639, "learning_rate": 3.931226949159041e-06, "epoch": 0.3406652209423494, "percentage": 34.07, "elapsed_time": "4:35:24", "remaining_time": "8:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 4438, "loss": 0.1672, "learning_rate": 3.9296991403773325e-06, "epoch": 0.34089052862815783, "percentage": 34.09, "elapsed_time": "4:35:33", "remaining_time": "8:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 4438, "loss": 0.1498, "learning_rate": 3.9281705377369814e-06, "epoch": 0.34111583631396625, "percentage": 34.11, "elapsed_time": "4:35:45", "remaining_time": "8:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 4438, "loss": 0.1538, "learning_rate": 3.9266411420867635e-06, "epoch": 0.34134114399977467, "percentage": 34.14, "elapsed_time": "4:35:56", "remaining_time": "8:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 4438, "loss": 0.1717, "learning_rate": 3.925110954275897e-06, "epoch": 0.34156645168558314, "percentage": 34.16, "elapsed_time": "4:36:06", "remaining_time": "8:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 4438, "loss": 0.1574, "learning_rate": 3.923579975154037e-06, "epoch": 0.34179175937139156, "percentage": 34.18, "elapsed_time": "4:36:16", "remaining_time": "8:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.922048205571279e-06, "epoch": 0.3420170670572, "percentage": 34.2, "elapsed_time": "4:36:27", "remaining_time": "8:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.920515646378159e-06, "epoch": 0.34224237474300845, "percentage": 34.23, "elapsed_time": "4:36:40", "remaining_time": "8:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 4438, "loss": 0.1796, "learning_rate": 3.918982298425647e-06, "epoch": 0.34246768242881687, "percentage": 34.25, "elapsed_time": "4:36:51", "remaining_time": "8:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 4438, "loss": 0.1422, "learning_rate": 3.917448162565157e-06, "epoch": 0.3426929901146253, "percentage": 34.27, "elapsed_time": "4:37:03", "remaining_time": "8:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 4438, "loss": 0.1699, "learning_rate": 3.915913239648535e-06, "epoch": 0.3429182978004337, "percentage": 34.29, "elapsed_time": "4:37:14", "remaining_time": "8:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 4438, "loss": 0.1711, "learning_rate": 3.91437753052807e-06, "epoch": 0.3431436054862422, "percentage": 34.32, "elapsed_time": "4:37:24", "remaining_time": "8:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 4438, "loss": 0.1574, "learning_rate": 3.91284103605648e-06, "epoch": 0.3433689131720506, "percentage": 34.34, "elapsed_time": "4:37:35", "remaining_time": "8:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 4438, "loss": 0.1608, "learning_rate": 3.911303757086925e-06, "epoch": 0.343594220857859, "percentage": 34.36, "elapsed_time": "4:37:46", "remaining_time": "8:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 4438, "loss": 0.16, "learning_rate": 3.909765694473e-06, "epoch": 0.34381952854366743, "percentage": 34.38, "elapsed_time": "4:37:56", "remaining_time": "8:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 4438, "loss": 0.1653, "learning_rate": 3.908226849068731e-06, "epoch": 0.3440448362294759, "percentage": 34.41, "elapsed_time": "4:38:07", "remaining_time": "8:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 4438, "loss": 0.1632, "learning_rate": 3.906687221728583e-06, "epoch": 0.3442701439152843, "percentage": 34.43, "elapsed_time": "4:38:18", "remaining_time": "8:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 4438, "loss": 0.1565, "learning_rate": 3.905146813307455e-06, "epoch": 0.34449545160109274, "percentage": 34.45, "elapsed_time": "4:38:29", "remaining_time": "8:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 4438, "loss": 0.1646, "learning_rate": 3.903605624660676e-06, "epoch": 0.34472075928690116, "percentage": 34.47, "elapsed_time": "4:38:40", "remaining_time": "8:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.902063656644012e-06, "epoch": 0.34494606697270963, "percentage": 34.5, "elapsed_time": "4:38:50", "remaining_time": "8:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 4438, "loss": 0.1889, "learning_rate": 3.900520910113659e-06, "epoch": 0.34517137465851805, "percentage": 34.52, "elapsed_time": "4:38:59", "remaining_time": "8:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 4438, "loss": 0.1706, "learning_rate": 3.898977385926249e-06, "epoch": 0.34539668234432647, "percentage": 34.54, "elapsed_time": "4:39:08", "remaining_time": "8:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 4438, "loss": 0.1496, "learning_rate": 3.897433084938841e-06, "epoch": 0.3456219900301349, "percentage": 34.57, "elapsed_time": "4:39:19", "remaining_time": "8:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 4438, "loss": 0.1654, "learning_rate": 3.895888008008929e-06, "epoch": 0.34584729771594336, "percentage": 34.59, "elapsed_time": "4:39:29", "remaining_time": "8:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 4438, "loss": 0.1818, "learning_rate": 3.894342155994437e-06, "epoch": 0.3460726054017518, "percentage": 34.61, "elapsed_time": "4:39:41", "remaining_time": "8:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 4438, "loss": 0.1647, "learning_rate": 3.892795529753718e-06, "epoch": 0.3462979130875602, "percentage": 34.63, "elapsed_time": "4:39:52", "remaining_time": "8:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 4438, "loss": 0.1643, "learning_rate": 3.891248130145556e-06, "epoch": 0.3465232207733686, "percentage": 34.66, "elapsed_time": "4:40:02", "remaining_time": "8:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 4438, "loss": 0.1605, "learning_rate": 3.889699958029166e-06, "epoch": 0.3467485284591771, "percentage": 34.68, "elapsed_time": "4:40:15", "remaining_time": "8:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 4438, "loss": 0.1656, "learning_rate": 3.888151014264189e-06, "epoch": 0.3469738361449855, "percentage": 34.7, "elapsed_time": "4:40:25", "remaining_time": "8:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 4438, "loss": 0.1494, "learning_rate": 3.886601299710694e-06, "epoch": 0.3471991438307939, "percentage": 34.72, "elapsed_time": "4:40:35", "remaining_time": "8:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 4438, "loss": 0.1506, "learning_rate": 3.885050815229182e-06, "epoch": 0.34742445151660234, "percentage": 34.75, "elapsed_time": "4:40:45", "remaining_time": "8:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 4438, "loss": 0.1699, "learning_rate": 3.88349956168058e-06, "epoch": 0.3476497592024108, "percentage": 34.77, "elapsed_time": "4:40:55", "remaining_time": "8:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 4438, "loss": 0.1689, "learning_rate": 3.881947539926239e-06, "epoch": 0.34787506688821923, "percentage": 34.79, "elapsed_time": "4:41:07", "remaining_time": "8:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.880394750827939e-06, "epoch": 0.34810037457402765, "percentage": 34.81, "elapsed_time": "4:41:17", "remaining_time": "8:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 4438, "loss": 0.1739, "learning_rate": 3.878841195247888e-06, "epoch": 0.34832568225983607, "percentage": 34.84, "elapsed_time": "4:41:26", "remaining_time": "8:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.877286874048716e-06, "epoch": 0.34855098994564454, "percentage": 34.86, "elapsed_time": "4:41:36", "remaining_time": "8:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 4438, "loss": 0.173, "learning_rate": 3.875731788093478e-06, "epoch": 0.34877629763145296, "percentage": 34.88, "elapsed_time": "4:41:46", "remaining_time": "8:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 4438, "loss": 0.1607, "learning_rate": 3.874175938245659e-06, "epoch": 0.3490016053172614, "percentage": 34.9, "elapsed_time": "4:41:56", "remaining_time": "8:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 4438, "loss": 0.1655, "learning_rate": 3.872619325369162e-06, "epoch": 0.3492269130030698, "percentage": 34.93, "elapsed_time": "4:42:08", "remaining_time": "8:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 4438, "loss": 0.1655, "learning_rate": 3.871061950328317e-06, "epoch": 0.34945222068887827, "percentage": 34.95, "elapsed_time": "4:42:19", "remaining_time": "8:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 4438, "loss": 0.1649, "learning_rate": 3.869503813987876e-06, "epoch": 0.3496775283746867, "percentage": 34.97, "elapsed_time": "4:42:29", "remaining_time": "8:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 4438, "loss": 0.1684, "learning_rate": 3.867944917213014e-06, "epoch": 0.3499028360604951, "percentage": 34.99, "elapsed_time": "4:42:39", "remaining_time": "8:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 4438, "loss": 0.1493, "learning_rate": 3.866385260869327e-06, "epoch": 0.3501281437463035, "percentage": 35.02, "elapsed_time": "4:42:48", "remaining_time": "8:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 4438, "loss": 0.1681, "learning_rate": 3.864824845822837e-06, "epoch": 0.350353451432112, "percentage": 35.04, "elapsed_time": "4:42:58", "remaining_time": "8:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 4438, "loss": 0.1751, "learning_rate": 3.8632636729399815e-06, "epoch": 0.3505787591179204, "percentage": 35.06, "elapsed_time": "4:43:08", "remaining_time": "8:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 4438, "loss": 0.1676, "learning_rate": 3.861701743087622e-06, "epoch": 0.35080406680372883, "percentage": 35.08, "elapsed_time": "4:43:18", "remaining_time": "8:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 4438, "loss": 0.1807, "learning_rate": 3.860139057133042e-06, "epoch": 0.35102937448953725, "percentage": 35.11, "elapsed_time": "4:43:29", "remaining_time": "8:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 4438, "loss": 0.1662, "learning_rate": 3.858575615943941e-06, "epoch": 0.3512546821753457, "percentage": 35.13, "elapsed_time": "4:43:41", "remaining_time": "8:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 4438, "loss": 0.1853, "learning_rate": 3.85701142038844e-06, "epoch": 0.35147998986115414, "percentage": 35.15, "elapsed_time": "4:43:52", "remaining_time": "8:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 4438, "loss": 0.1592, "learning_rate": 3.855446471335078e-06, "epoch": 0.35170529754696256, "percentage": 35.17, "elapsed_time": "4:44:03", "remaining_time": "8:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 4438, "loss": 0.164, "learning_rate": 3.853880769652815e-06, "epoch": 0.351930605232771, "percentage": 35.2, "elapsed_time": "4:44:12", "remaining_time": "8:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 4438, "loss": 0.1565, "learning_rate": 3.852314316211023e-06, "epoch": 0.35215591291857945, "percentage": 35.22, "elapsed_time": "4:44:24", "remaining_time": "8:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 4438, "loss": 0.1807, "learning_rate": 3.850747111879499e-06, "epoch": 0.35238122060438787, "percentage": 35.24, "elapsed_time": "4:44:36", "remaining_time": "8:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 4438, "loss": 0.1566, "learning_rate": 3.84917915752845e-06, "epoch": 0.3526065282901963, "percentage": 35.26, "elapsed_time": "4:44:46", "remaining_time": "8:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 4438, "loss": 0.1688, "learning_rate": 3.8476104540285054e-06, "epoch": 0.3528318359760047, "percentage": 35.29, "elapsed_time": "4:44:57", "remaining_time": "8:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 4438, "loss": 0.1722, "learning_rate": 3.846041002250705e-06, "epoch": 0.3530571436618132, "percentage": 35.31, "elapsed_time": "4:45:07", "remaining_time": "8:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 4438, "loss": 0.1667, "learning_rate": 3.84447080306651e-06, "epoch": 0.3532824513476216, "percentage": 35.33, "elapsed_time": "4:45:18", "remaining_time": "8:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 4438, "loss": 0.1733, "learning_rate": 3.842899857347792e-06, "epoch": 0.35350775903343, "percentage": 35.35, "elapsed_time": "4:45:29", "remaining_time": "8:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 4438, "loss": 0.1572, "learning_rate": 3.841328165966837e-06, "epoch": 0.3537330667192385, "percentage": 35.38, "elapsed_time": "4:45:41", "remaining_time": "8:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 4438, "loss": 0.1705, "learning_rate": 3.839755729796349e-06, "epoch": 0.3539583744050469, "percentage": 35.4, "elapsed_time": "4:45:51", "remaining_time": "8:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 4438, "loss": 0.1546, "learning_rate": 3.838182549709442e-06, "epoch": 0.3541836820908553, "percentage": 35.42, "elapsed_time": "4:46:02", "remaining_time": "8:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 4438, "loss": 0.177, "learning_rate": 3.8366086265796445e-06, "epoch": 0.35440898977666374, "percentage": 35.44, "elapsed_time": "4:46:13", "remaining_time": "8:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 4438, "loss": 0.1598, "learning_rate": 3.835033961280898e-06, "epoch": 0.3546342974624722, "percentage": 35.47, "elapsed_time": "4:46:23", "remaining_time": "8:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 4438, "loss": 0.1618, "learning_rate": 3.8334585546875544e-06, "epoch": 0.35485960514828063, "percentage": 35.49, "elapsed_time": "4:46:34", "remaining_time": "8:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 4438, "loss": 0.1501, "learning_rate": 3.831882407674379e-06, "epoch": 0.35508491283408905, "percentage": 35.51, "elapsed_time": "4:46:44", "remaining_time": "8:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 4438, "loss": 0.1454, "learning_rate": 3.830305521116546e-06, "epoch": 0.35531022051989747, "percentage": 35.53, "elapsed_time": "4:46:54", "remaining_time": "8:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 4438, "loss": 0.1829, "learning_rate": 3.828727895889644e-06, "epoch": 0.35553552820570594, "percentage": 35.56, "elapsed_time": "4:47:05", "remaining_time": "8:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 4438, "loss": 0.164, "learning_rate": 3.827149532869668e-06, "epoch": 0.35576083589151436, "percentage": 35.58, "elapsed_time": "4:47:15", "remaining_time": "8:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 4438, "loss": 0.1748, "learning_rate": 3.825570432933026e-06, "epoch": 0.3559861435773228, "percentage": 35.6, "elapsed_time": "4:47:27", "remaining_time": "8:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 4438, "loss": 0.1658, "learning_rate": 3.823990596956531e-06, "epoch": 0.3562114512631312, "percentage": 35.62, "elapsed_time": "4:47:37", "remaining_time": "8:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 4438, "loss": 0.1641, "learning_rate": 3.8224100258174066e-06, "epoch": 0.35643675894893967, "percentage": 35.65, "elapsed_time": "4:47:50", "remaining_time": "8:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 4438, "loss": 0.1674, "learning_rate": 3.820828720393287e-06, "epoch": 0.3566620666347481, "percentage": 35.67, "elapsed_time": "4:48:00", "remaining_time": "8:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 4438, "loss": 0.1548, "learning_rate": 3.819246681562212e-06, "epoch": 0.3568873743205565, "percentage": 35.69, "elapsed_time": "4:48:11", "remaining_time": "8:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 4438, "loss": 0.1527, "learning_rate": 3.817663910202628e-06, "epoch": 0.3571126820063649, "percentage": 35.71, "elapsed_time": "4:48:22", "remaining_time": "8:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 4438, "loss": 0.1565, "learning_rate": 3.81608040719339e-06, "epoch": 0.3573379896921734, "percentage": 35.74, "elapsed_time": "4:48:32", "remaining_time": "8:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.8144961734137566e-06, "epoch": 0.3575632973779818, "percentage": 35.76, "elapsed_time": "4:48:42", "remaining_time": "8:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 4438, "loss": 0.1494, "learning_rate": 3.812911209743395e-06, "epoch": 0.35778860506379023, "percentage": 35.78, "elapsed_time": "4:48:53", "remaining_time": "8:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 4438, "loss": 0.1507, "learning_rate": 3.8113255170623763e-06, "epoch": 0.35801391274959865, "percentage": 35.8, "elapsed_time": "4:49:03", "remaining_time": "8:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 4438, "loss": 0.1725, "learning_rate": 3.809739096251176e-06, "epoch": 0.3582392204354071, "percentage": 35.83, "elapsed_time": "4:49:13", "remaining_time": "8:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 4438, "loss": 0.1693, "learning_rate": 3.8081519481906747e-06, "epoch": 0.35846452812121554, "percentage": 35.85, "elapsed_time": "4:49:24", "remaining_time": "8:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 4438, "loss": 0.1582, "learning_rate": 3.8065640737621566e-06, "epoch": 0.35868983580702396, "percentage": 35.87, "elapsed_time": "4:49:34", "remaining_time": "8:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 4438, "loss": 0.1593, "learning_rate": 3.804975473847309e-06, "epoch": 0.3589151434928324, "percentage": 35.89, "elapsed_time": "4:49:45", "remaining_time": "8:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 4438, "loss": 0.1718, "learning_rate": 3.803386149328223e-06, "epoch": 0.35914045117864085, "percentage": 35.92, "elapsed_time": "4:49:56", "remaining_time": "8:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 4438, "loss": 0.1627, "learning_rate": 3.8017961010873904e-06, "epoch": 0.35936575886444927, "percentage": 35.94, "elapsed_time": "4:50:06", "remaining_time": "8:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 4438, "loss": 0.1836, "learning_rate": 3.8002053300077056e-06, "epoch": 0.3595910665502577, "percentage": 35.96, "elapsed_time": "4:50:16", "remaining_time": "8:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 4438, "loss": 0.1681, "learning_rate": 3.7986138369724664e-06, "epoch": 0.3598163742360661, "percentage": 35.98, "elapsed_time": "4:50:28", "remaining_time": "8:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 4438, "loss": 0.1632, "learning_rate": 3.7970216228653667e-06, "epoch": 0.3600416819218746, "percentage": 36.01, "elapsed_time": "4:50:38", "remaining_time": "8:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 4438, "loss": 0.1565, "learning_rate": 3.795428688570505e-06, "epoch": 0.360266989607683, "percentage": 36.03, "elapsed_time": "4:50:49", "remaining_time": "8:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 4438, "loss": 0.1687, "learning_rate": 3.7938350349723784e-06, "epoch": 0.3604922972934914, "percentage": 36.05, "elapsed_time": "4:51:00", "remaining_time": "8:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 4438, "loss": 0.1654, "learning_rate": 3.792240662955884e-06, "epoch": 0.36071760497929983, "percentage": 36.07, "elapsed_time": "4:51:09", "remaining_time": "8:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 4438, "loss": 0.1594, "learning_rate": 3.7906455734063156e-06, "epoch": 0.3609429126651083, "percentage": 36.1, "elapsed_time": "4:51:21", "remaining_time": "8:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 4438, "loss": 0.1722, "learning_rate": 3.7890497672093686e-06, "epoch": 0.3611682203509167, "percentage": 36.12, "elapsed_time": "4:51:31", "remaining_time": "8:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 4438, "loss": 0.1576, "learning_rate": 3.7874532452511324e-06, "epoch": 0.36139352803672514, "percentage": 36.14, "elapsed_time": "4:51:42", "remaining_time": "8:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 4438, "loss": 0.1653, "learning_rate": 3.785856008418099e-06, "epoch": 0.36161883572253356, "percentage": 36.16, "elapsed_time": "4:51:53", "remaining_time": "8:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 4438, "loss": 0.1686, "learning_rate": 3.7842580575971533e-06, "epoch": 0.36184414340834203, "percentage": 36.19, "elapsed_time": "4:52:04", "remaining_time": "8:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 4438, "loss": 0.1684, "learning_rate": 3.782659393675577e-06, "epoch": 0.36206945109415045, "percentage": 36.21, "elapsed_time": "4:52:14", "remaining_time": "8:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 4438, "loss": 0.1495, "learning_rate": 3.7810600175410493e-06, "epoch": 0.36229475877995887, "percentage": 36.23, "elapsed_time": "4:52:24", "remaining_time": "8:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 4438, "loss": 0.1629, "learning_rate": 3.7794599300816435e-06, "epoch": 0.3625200664657673, "percentage": 36.26, "elapsed_time": "4:52:35", "remaining_time": "8:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 4438, "loss": 0.1715, "learning_rate": 3.77785913218583e-06, "epoch": 0.36274537415157576, "percentage": 36.28, "elapsed_time": "4:52:47", "remaining_time": "8:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.7762576247424707e-06, "epoch": 0.3629706818373842, "percentage": 36.3, "elapsed_time": "4:52:57", "remaining_time": "8:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 4438, "loss": 0.1495, "learning_rate": 3.7746554086408245e-06, "epoch": 0.3631959895231926, "percentage": 36.32, "elapsed_time": "4:53:09", "remaining_time": "8:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 4438, "loss": 0.1624, "learning_rate": 3.7730524847705407e-06, "epoch": 0.363421297209001, "percentage": 36.35, "elapsed_time": "4:53:20", "remaining_time": "8:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 4438, "loss": 0.1646, "learning_rate": 3.7714488540216637e-06, "epoch": 0.3636466048948095, "percentage": 36.37, "elapsed_time": "4:53:32", "remaining_time": "8:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 4438, "loss": 0.1558, "learning_rate": 3.7698445172846305e-06, "epoch": 0.3638719125806179, "percentage": 36.39, "elapsed_time": "4:53:42", "remaining_time": "8:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 4438, "loss": 0.1689, "learning_rate": 3.7682394754502687e-06, "epoch": 0.3640972202664263, "percentage": 36.41, "elapsed_time": "4:53:53", "remaining_time": "8:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 4438, "loss": 0.1709, "learning_rate": 3.7666337294097987e-06, "epoch": 0.3643225279522348, "percentage": 36.44, "elapsed_time": "4:54:04", "remaining_time": "8:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 4438, "loss": 0.1501, "learning_rate": 3.7650272800548316e-06, "epoch": 0.3645478356380432, "percentage": 36.46, "elapsed_time": "4:54:15", "remaining_time": "8:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 4438, "loss": 0.1495, "learning_rate": 3.7634201282773673e-06, "epoch": 0.36477314332385163, "percentage": 36.48, "elapsed_time": "4:54:26", "remaining_time": "8:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 4438, "loss": 0.147, "learning_rate": 3.7618122749697993e-06, "epoch": 0.36499845100966005, "percentage": 36.5, "elapsed_time": "4:54:36", "remaining_time": "8:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 4438, "loss": 0.1614, "learning_rate": 3.7602037210249077e-06, "epoch": 0.3652237586954685, "percentage": 36.53, "elapsed_time": "4:54:47", "remaining_time": "8:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 4438, "loss": 0.1626, "learning_rate": 3.7585944673358632e-06, "epoch": 0.36544906638127694, "percentage": 36.55, "elapsed_time": "4:54:57", "remaining_time": "8:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 4438, "loss": 0.163, "learning_rate": 3.756984514796224e-06, "epoch": 0.36567437406708536, "percentage": 36.57, "elapsed_time": "4:55:07", "remaining_time": "8:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 4438, "loss": 0.162, "learning_rate": 3.7553738642999354e-06, "epoch": 0.3658996817528938, "percentage": 36.59, "elapsed_time": "4:55:18", "remaining_time": "8:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 4438, "loss": 0.1604, "learning_rate": 3.753762516741333e-06, "epoch": 0.36612498943870225, "percentage": 36.62, "elapsed_time": "4:55:28", "remaining_time": "8:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 4438, "loss": 0.1672, "learning_rate": 3.7521504730151382e-06, "epoch": 0.36635029712451067, "percentage": 36.64, "elapsed_time": "4:55:38", "remaining_time": "8:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 4438, "loss": 0.1666, "learning_rate": 3.7505377340164585e-06, "epoch": 0.3665756048103191, "percentage": 36.66, "elapsed_time": "4:55:49", "remaining_time": "8:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 4438, "loss": 0.1692, "learning_rate": 3.748924300640787e-06, "epoch": 0.3668009124961275, "percentage": 36.68, "elapsed_time": "4:55:59", "remaining_time": "8:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 4438, "loss": 0.1596, "learning_rate": 3.747310173784004e-06, "epoch": 0.367026220181936, "percentage": 36.71, "elapsed_time": "4:56:09", "remaining_time": "8:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 4438, "loss": 0.1718, "learning_rate": 3.745695354342374e-06, "epoch": 0.3672515278677444, "percentage": 36.73, "elapsed_time": "4:56:19", "remaining_time": "8:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 4438, "loss": 0.1476, "learning_rate": 3.7440798432125452e-06, "epoch": 0.3674768355535528, "percentage": 36.75, "elapsed_time": "4:56:32", "remaining_time": "8:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 4438, "loss": 0.1528, "learning_rate": 3.742463641291552e-06, "epoch": 0.36770214323936123, "percentage": 36.77, "elapsed_time": "4:56:42", "remaining_time": "8:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 4438, "loss": 0.1424, "learning_rate": 3.7408467494768104e-06, "epoch": 0.3679274509251697, "percentage": 36.8, "elapsed_time": "4:56:53", "remaining_time": "8:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 4438, "loss": 0.1693, "learning_rate": 3.73922916866612e-06, "epoch": 0.3681527586109781, "percentage": 36.82, "elapsed_time": "4:57:03", "remaining_time": "8:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 4438, "loss": 0.1602, "learning_rate": 3.7376108997576628e-06, "epoch": 0.36837806629678654, "percentage": 36.84, "elapsed_time": "4:57:14", "remaining_time": "8:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 4438, "loss": 0.1727, "learning_rate": 3.7359919436500038e-06, "epoch": 0.36860337398259496, "percentage": 36.86, "elapsed_time": "4:57:24", "remaining_time": "8:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 4438, "loss": 0.1704, "learning_rate": 3.7343723012420884e-06, "epoch": 0.36882868166840344, "percentage": 36.89, "elapsed_time": "4:57:34", "remaining_time": "8:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 4438, "loss": 0.1509, "learning_rate": 3.7327519734332453e-06, "epoch": 0.36905398935421185, "percentage": 36.91, "elapsed_time": "4:57:45", "remaining_time": "8:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 4438, "loss": 0.1601, "learning_rate": 3.73113096112318e-06, "epoch": 0.36927929704002027, "percentage": 36.93, "elapsed_time": "4:57:57", "remaining_time": "8:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 4438, "loss": 0.1584, "learning_rate": 3.7295092652119815e-06, "epoch": 0.3695046047258287, "percentage": 36.95, "elapsed_time": "4:58:09", "remaining_time": "8:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 4438, "loss": 0.1596, "learning_rate": 3.7278868866001165e-06, "epoch": 0.36972991241163716, "percentage": 36.98, "elapsed_time": "4:58:20", "remaining_time": "8:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 4438, "loss": 0.1591, "learning_rate": 3.726263826188432e-06, "epoch": 0.3699552200974456, "percentage": 37.0, "elapsed_time": "4:58:31", "remaining_time": "8:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 4438, "loss": 0.1594, "learning_rate": 3.724640084878153e-06, "epoch": 0.370180527783254, "percentage": 37.02, "elapsed_time": "4:58:42", "remaining_time": "8:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 4438, "loss": 0.1695, "learning_rate": 3.7230156635708815e-06, "epoch": 0.3704058354690624, "percentage": 37.04, "elapsed_time": "4:58:54", "remaining_time": "8:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 4438, "loss": 0.1569, "learning_rate": 3.7213905631685988e-06, "epoch": 0.3706311431548709, "percentage": 37.07, "elapsed_time": "4:59:05", "remaining_time": "8:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 4438, "loss": 0.1477, "learning_rate": 3.7197647845736616e-06, "epoch": 0.3708564508406793, "percentage": 37.09, "elapsed_time": "4:59:14", "remaining_time": "8:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 4438, "loss": 0.1516, "learning_rate": 3.7181383286888056e-06, "epoch": 0.3710817585264877, "percentage": 37.11, "elapsed_time": "4:59:24", "remaining_time": "8:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 4438, "loss": 0.1502, "learning_rate": 3.7165111964171407e-06, "epoch": 0.37130706621229614, "percentage": 37.13, "elapsed_time": "4:59:32", "remaining_time": "8:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 4438, "loss": 0.1713, "learning_rate": 3.714883388662153e-06, "epoch": 0.3715323738981046, "percentage": 37.16, "elapsed_time": "4:59:43", "remaining_time": "8:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 4438, "loss": 0.155, "learning_rate": 3.7132549063277033e-06, "epoch": 0.37175768158391304, "percentage": 37.18, "elapsed_time": "4:59:54", "remaining_time": "8:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 4438, "loss": 0.1761, "learning_rate": 3.711625750318026e-06, "epoch": 0.37198298926972145, "percentage": 37.2, "elapsed_time": "5:00:05", "remaining_time": "8:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 4438, "loss": 0.1607, "learning_rate": 3.7099959215377325e-06, "epoch": 0.37220829695552987, "percentage": 37.22, "elapsed_time": "5:00:16", "remaining_time": "8:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 4438, "loss": 0.1547, "learning_rate": 3.7083654208918044e-06, "epoch": 0.37243360464133834, "percentage": 37.25, "elapsed_time": "5:00:27", "remaining_time": "8:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 4438, "loss": 0.1517, "learning_rate": 3.7067342492855997e-06, "epoch": 0.37265891232714676, "percentage": 37.27, "elapsed_time": "5:00:37", "remaining_time": "8:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 4438, "loss": 0.1587, "learning_rate": 3.7051024076248455e-06, "epoch": 0.3728842200129552, "percentage": 37.29, "elapsed_time": "5:00:48", "remaining_time": "8:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 4438, "loss": 0.1482, "learning_rate": 3.7034698968156434e-06, "epoch": 0.3731095276987636, "percentage": 37.31, "elapsed_time": "5:00:58", "remaining_time": "8:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 4438, "loss": 0.2014, "learning_rate": 3.7018367177644654e-06, "epoch": 0.3733348353845721, "percentage": 37.34, "elapsed_time": "5:01:08", "remaining_time": "8:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 4438, "loss": 0.1701, "learning_rate": 3.700202871378156e-06, "epoch": 0.3735601430703805, "percentage": 37.36, "elapsed_time": "5:01:20", "remaining_time": "8:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 4438, "loss": 0.1618, "learning_rate": 3.698568358563928e-06, "epoch": 0.3737854507561889, "percentage": 37.38, "elapsed_time": "5:01:30", "remaining_time": "8:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 4438, "loss": 0.1594, "learning_rate": 3.696933180229366e-06, "epoch": 0.3740107584419973, "percentage": 37.4, "elapsed_time": "5:01:41", "remaining_time": "8:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 4438, "loss": 0.1716, "learning_rate": 3.6952973372824236e-06, "epoch": 0.3742360661278058, "percentage": 37.43, "elapsed_time": "5:01:53", "remaining_time": "8:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 4438, "loss": 0.1473, "learning_rate": 3.6936608306314227e-06, "epoch": 0.3744613738136142, "percentage": 37.45, "elapsed_time": "5:02:03", "remaining_time": "8:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 4438, "loss": 0.1417, "learning_rate": 3.6920236611850557e-06, "epoch": 0.37468668149942264, "percentage": 37.47, "elapsed_time": "5:02:12", "remaining_time": "8:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 4438, "loss": 0.1654, "learning_rate": 3.690385829852381e-06, "epoch": 0.37491198918523105, "percentage": 37.49, "elapsed_time": "5:02:22", "remaining_time": "8:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 4438, "loss": 0.1684, "learning_rate": 3.6887473375428257e-06, "epoch": 0.3751372968710395, "percentage": 37.52, "elapsed_time": "5:02:33", "remaining_time": "8:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 4438, "loss": 0.1673, "learning_rate": 3.6871081851661825e-06, "epoch": 0.37536260455684795, "percentage": 37.54, "elapsed_time": "5:02:44", "remaining_time": "8:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.685468373632613e-06, "epoch": 0.37558791224265636, "percentage": 37.56, "elapsed_time": "5:02:54", "remaining_time": "8:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 4438, "loss": 0.1612, "learning_rate": 3.6838279038526427e-06, "epoch": 0.37581321992846484, "percentage": 37.58, "elapsed_time": "5:03:03", "remaining_time": "8:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 4438, "loss": 0.1634, "learning_rate": 3.6821867767371634e-06, "epoch": 0.37603852761427325, "percentage": 37.61, "elapsed_time": "5:03:14", "remaining_time": "8:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 4438, "loss": 0.1616, "learning_rate": 3.6805449931974313e-06, "epoch": 0.3762638353000817, "percentage": 37.63, "elapsed_time": "5:03:25", "remaining_time": "8:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 4438, "loss": 0.1627, "learning_rate": 3.6789025541450686e-06, "epoch": 0.3764891429858901, "percentage": 37.65, "elapsed_time": "5:03:36", "remaining_time": "8:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 4438, "loss": 0.1602, "learning_rate": 3.67725946049206e-06, "epoch": 0.37671445067169856, "percentage": 37.67, "elapsed_time": "5:03:47", "remaining_time": "8:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 4438, "loss": 0.1728, "learning_rate": 3.675615713150754e-06, "epoch": 0.376939758357507, "percentage": 37.7, "elapsed_time": "5:03:58", "remaining_time": "8:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 4438, "loss": 0.177, "learning_rate": 3.6739713130338617e-06, "epoch": 0.3771650660433154, "percentage": 37.72, "elapsed_time": "5:04:09", "remaining_time": "8:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 4438, "loss": 0.1698, "learning_rate": 3.6723262610544586e-06, "epoch": 0.3773903737291238, "percentage": 37.74, "elapsed_time": "5:04:21", "remaining_time": "8:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 4438, "loss": 0.1592, "learning_rate": 3.6706805581259807e-06, "epoch": 0.3776156814149323, "percentage": 37.76, "elapsed_time": "5:04:31", "remaining_time": "8:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 4438, "loss": 0.1617, "learning_rate": 3.669034205162224e-06, "epoch": 0.3778409891007407, "percentage": 37.79, "elapsed_time": "5:04:41", "remaining_time": "8:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 4438, "loss": 0.156, "learning_rate": 3.6673872030773473e-06, "epoch": 0.3780662967865491, "percentage": 37.81, "elapsed_time": "5:04:51", "remaining_time": "8:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 4438, "loss": 0.1528, "learning_rate": 3.66573955278587e-06, "epoch": 0.37829160447235755, "percentage": 37.83, "elapsed_time": "5:05:01", "remaining_time": "8:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 4438, "loss": 0.1629, "learning_rate": 3.664091255202672e-06, "epoch": 0.378516912158166, "percentage": 37.85, "elapsed_time": "5:05:11", "remaining_time": "8:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 4438, "loss": 0.1679, "learning_rate": 3.662442311242989e-06, "epoch": 0.37874221984397444, "percentage": 37.88, "elapsed_time": "5:05:23", "remaining_time": "8:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 4438, "loss": 0.1704, "learning_rate": 3.66079272182242e-06, "epoch": 0.37896752752978285, "percentage": 37.9, "elapsed_time": "5:05:34", "remaining_time": "8:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 4438, "loss": 0.1606, "learning_rate": 3.6591424878569203e-06, "epoch": 0.3791928352155913, "percentage": 37.92, "elapsed_time": "5:05:46", "remaining_time": "8:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 4438, "loss": 0.1821, "learning_rate": 3.657491610262802e-06, "epoch": 0.37941814290139975, "percentage": 37.95, "elapsed_time": "5:05:57", "remaining_time": "8:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 4438, "loss": 0.1595, "learning_rate": 3.655840089956738e-06, "epoch": 0.37964345058720816, "percentage": 37.97, "elapsed_time": "5:06:08", "remaining_time": "8:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 4438, "loss": 0.1571, "learning_rate": 3.654187927855754e-06, "epoch": 0.3798687582730166, "percentage": 37.99, "elapsed_time": "5:06:18", "remaining_time": "8:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 4438, "loss": 0.14, "learning_rate": 3.6525351248772357e-06, "epoch": 0.380094065958825, "percentage": 38.01, "elapsed_time": "5:06:28", "remaining_time": "8:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 4438, "loss": 0.1635, "learning_rate": 3.6508816819389216e-06, "epoch": 0.3803193736446335, "percentage": 38.04, "elapsed_time": "5:06:39", "remaining_time": "8:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 4438, "loss": 0.1551, "learning_rate": 3.6492275999589065e-06, "epoch": 0.3805446813304419, "percentage": 38.06, "elapsed_time": "5:06:51", "remaining_time": "8:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 4438, "loss": 0.1675, "learning_rate": 3.6475728798556426e-06, "epoch": 0.3807699890162503, "percentage": 38.08, "elapsed_time": "5:07:01", "remaining_time": "8:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 4438, "loss": 0.1692, "learning_rate": 3.645917522547933e-06, "epoch": 0.38099529670205873, "percentage": 38.1, "elapsed_time": "5:07:12", "remaining_time": "8:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 4438, "loss": 0.1635, "learning_rate": 3.6442615289549354e-06, "epoch": 0.3812206043878672, "percentage": 38.13, "elapsed_time": "5:07:23", "remaining_time": "8:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 4438, "loss": 0.1686, "learning_rate": 3.6426048999961626e-06, "epoch": 0.3814459120736756, "percentage": 38.15, "elapsed_time": "5:07:31", "remaining_time": "8:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 4438, "loss": 0.1589, "learning_rate": 3.6409476365914786e-06, "epoch": 0.38167121975948404, "percentage": 38.17, "elapsed_time": "5:07:41", "remaining_time": "8:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.6392897396610992e-06, "epoch": 0.38189652744529246, "percentage": 38.19, "elapsed_time": "5:07:53", "remaining_time": "8:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 4438, "loss": 0.1505, "learning_rate": 3.6376312101255934e-06, "epoch": 0.38212183513110093, "percentage": 38.22, "elapsed_time": "5:08:04", "remaining_time": "8:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 4438, "loss": 0.155, "learning_rate": 3.6359720489058804e-06, "epoch": 0.38234714281690935, "percentage": 38.24, "elapsed_time": "5:08:15", "remaining_time": "8:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 4438, "loss": 0.1703, "learning_rate": 3.6343122569232313e-06, "epoch": 0.38257245050271776, "percentage": 38.26, "elapsed_time": "5:08:25", "remaining_time": "8:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 4438, "loss": 0.1452, "learning_rate": 3.6326518350992657e-06, "epoch": 0.3827977581885262, "percentage": 38.28, "elapsed_time": "5:08:35", "remaining_time": "8:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 4438, "loss": 0.1568, "learning_rate": 3.6309907843559542e-06, "epoch": 0.38302306587433466, "percentage": 38.31, "elapsed_time": "5:08:45", "remaining_time": "8:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 4438, "loss": 0.1535, "learning_rate": 3.6293291056156178e-06, "epoch": 0.3832483735601431, "percentage": 38.33, "elapsed_time": "5:08:56", "remaining_time": "8:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 4438, "loss": 0.1581, "learning_rate": 3.6276667998009242e-06, "epoch": 0.3834736812459515, "percentage": 38.35, "elapsed_time": "5:09:07", "remaining_time": "8:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 4438, "loss": 0.1715, "learning_rate": 3.626003867834888e-06, "epoch": 0.3836989889317599, "percentage": 38.37, "elapsed_time": "5:09:17", "remaining_time": "8:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 4438, "loss": 0.1687, "learning_rate": 3.624340310640875e-06, "epoch": 0.3839242966175684, "percentage": 38.4, "elapsed_time": "5:09:27", "remaining_time": "8:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 4438, "loss": 0.1693, "learning_rate": 3.6226761291425956e-06, "epoch": 0.3841496043033768, "percentage": 38.42, "elapsed_time": "5:09:37", "remaining_time": "8:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 4438, "loss": 0.1642, "learning_rate": 3.621011324264109e-06, "epoch": 0.3843749119891852, "percentage": 38.44, "elapsed_time": "5:09:49", "remaining_time": "8:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 4438, "loss": 0.1747, "learning_rate": 3.6193458969298184e-06, "epoch": 0.38460021967499364, "percentage": 38.46, "elapsed_time": "5:10:00", "remaining_time": "8:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 4438, "loss": 0.1582, "learning_rate": 3.617679848064474e-06, "epoch": 0.3848255273608021, "percentage": 38.49, "elapsed_time": "5:10:09", "remaining_time": "8:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 4438, "loss": 0.1629, "learning_rate": 3.6160131785931695e-06, "epoch": 0.38505083504661053, "percentage": 38.51, "elapsed_time": "5:10:19", "remaining_time": "8:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 4438, "loss": 0.1579, "learning_rate": 3.6143458894413463e-06, "epoch": 0.38527614273241895, "percentage": 38.53, "elapsed_time": "5:10:30", "remaining_time": "8:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 4438, "loss": 0.1544, "learning_rate": 3.6126779815347863e-06, "epoch": 0.38550145041822736, "percentage": 38.55, "elapsed_time": "5:10:42", "remaining_time": "8:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 4438, "loss": 0.1485, "learning_rate": 3.611009455799617e-06, "epoch": 0.38572675810403584, "percentage": 38.58, "elapsed_time": "5:10:51", "remaining_time": "8:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 4438, "loss": 0.1486, "learning_rate": 3.609340313162309e-06, "epoch": 0.38595206578984426, "percentage": 38.6, "elapsed_time": "5:11:01", "remaining_time": "8:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 4438, "loss": 0.1677, "learning_rate": 3.6076705545496743e-06, "epoch": 0.3861773734756527, "percentage": 38.62, "elapsed_time": "5:11:12", "remaining_time": "8:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 4438, "loss": 0.1482, "learning_rate": 3.606000180888868e-06, "epoch": 0.38640268116146115, "percentage": 38.64, "elapsed_time": "5:11:21", "remaining_time": "8:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 4438, "loss": 0.1479, "learning_rate": 3.604329193107386e-06, "epoch": 0.38662798884726957, "percentage": 38.67, "elapsed_time": "5:11:32", "remaining_time": "8:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 4438, "loss": 0.1646, "learning_rate": 3.6026575921330665e-06, "epoch": 0.386853296533078, "percentage": 38.69, "elapsed_time": "5:11:42", "remaining_time": "8:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 4438, "loss": 0.1596, "learning_rate": 3.600985378894086e-06, "epoch": 0.3870786042188864, "percentage": 38.71, "elapsed_time": "5:11:54", "remaining_time": "8:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 4438, "loss": 0.1637, "learning_rate": 3.5993125543189634e-06, "epoch": 0.3873039119046949, "percentage": 38.73, "elapsed_time": "5:12:03", "remaining_time": "8:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 4438, "loss": 0.148, "learning_rate": 3.5976391193365544e-06, "epoch": 0.3875292195905033, "percentage": 38.76, "elapsed_time": "5:12:15", "remaining_time": "8:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 4438, "loss": 0.1736, "learning_rate": 3.5959650748760562e-06, "epoch": 0.3877545272763117, "percentage": 38.78, "elapsed_time": "5:12:25", "remaining_time": "8:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 4438, "loss": 0.1617, "learning_rate": 3.5942904218670025e-06, "epoch": 0.38797983496212013, "percentage": 38.8, "elapsed_time": "5:12:35", "remaining_time": "8:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 4438, "loss": 0.1613, "learning_rate": 3.592615161239267e-06, "epoch": 0.3882051426479286, "percentage": 38.82, "elapsed_time": "5:12:46", "remaining_time": "8:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 4438, "loss": 0.1673, "learning_rate": 3.590939293923058e-06, "epoch": 0.388430450333737, "percentage": 38.85, "elapsed_time": "5:12:58", "remaining_time": "8:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 4438, "loss": 0.1534, "learning_rate": 3.5892628208489226e-06, "epoch": 0.38865575801954544, "percentage": 38.87, "elapsed_time": "5:13:09", "remaining_time": "8:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 4438, "loss": 0.1595, "learning_rate": 3.5875857429477447e-06, "epoch": 0.38888106570535386, "percentage": 38.89, "elapsed_time": "5:13:20", "remaining_time": "8:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 4438, "loss": 0.1515, "learning_rate": 3.585908061150741e-06, "epoch": 0.38910637339116233, "percentage": 38.91, "elapsed_time": "5:13:29", "remaining_time": "8:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 4438, "loss": 0.1693, "learning_rate": 3.584229776389468e-06, "epoch": 0.38933168107697075, "percentage": 38.94, "elapsed_time": "5:13:38", "remaining_time": "8:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 4438, "loss": 0.1737, "learning_rate": 3.5825508895958143e-06, "epoch": 0.38955698876277917, "percentage": 38.96, "elapsed_time": "5:13:48", "remaining_time": "8:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 4438, "loss": 0.171, "learning_rate": 3.580871401702002e-06, "epoch": 0.3897822964485876, "percentage": 38.98, "elapsed_time": "5:13:59", "remaining_time": "8:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 4438, "loss": 0.1504, "learning_rate": 3.5791913136405883e-06, "epoch": 0.39000760413439606, "percentage": 39.0, "elapsed_time": "5:14:10", "remaining_time": "8:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 4438, "loss": 0.1543, "learning_rate": 3.5775106263444644e-06, "epoch": 0.3902329118202045, "percentage": 39.03, "elapsed_time": "5:14:21", "remaining_time": "8:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 4438, "loss": 0.1465, "learning_rate": 3.5758293407468525e-06, "epoch": 0.3904582195060129, "percentage": 39.05, "elapsed_time": "5:14:32", "remaining_time": "8:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 4438, "loss": 0.1717, "learning_rate": 3.5741474577813086e-06, "epoch": 0.3906835271918213, "percentage": 39.07, "elapsed_time": "5:14:43", "remaining_time": "8:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 4438, "loss": 0.1711, "learning_rate": 3.572464978381719e-06, "epoch": 0.3909088348776298, "percentage": 39.09, "elapsed_time": "5:14:54", "remaining_time": "8:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 4438, "loss": 0.1737, "learning_rate": 3.570781903482302e-06, "epoch": 0.3911341425634382, "percentage": 39.12, "elapsed_time": "5:15:05", "remaining_time": "8:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 4438, "loss": 0.1508, "learning_rate": 3.569098234017606e-06, "epoch": 0.3913594502492466, "percentage": 39.14, "elapsed_time": "5:15:15", "remaining_time": "8:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 4438, "loss": 0.1619, "learning_rate": 3.5674139709225104e-06, "epoch": 0.39158475793505504, "percentage": 39.16, "elapsed_time": "5:15:26", "remaining_time": "8:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 4438, "loss": 0.1614, "learning_rate": 3.565729115132224e-06, "epoch": 0.3918100656208635, "percentage": 39.18, "elapsed_time": "5:15:37", "remaining_time": "8:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 4438, "loss": 0.157, "learning_rate": 3.5640436675822833e-06, "epoch": 0.39203537330667193, "percentage": 39.21, "elapsed_time": "5:15:49", "remaining_time": "8:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 4438, "loss": 0.1648, "learning_rate": 3.5623576292085555e-06, "epoch": 0.39226068099248035, "percentage": 39.23, "elapsed_time": "5:16:00", "remaining_time": "8:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 4438, "loss": 0.1539, "learning_rate": 3.5606710009472335e-06, "epoch": 0.39248598867828877, "percentage": 39.25, "elapsed_time": "5:16:11", "remaining_time": "8:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 4438, "loss": 0.1595, "learning_rate": 3.558983783734841e-06, "epoch": 0.39271129636409724, "percentage": 39.27, "elapsed_time": "5:16:23", "remaining_time": "8:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 4438, "loss": 0.149, "learning_rate": 3.5572959785082264e-06, "epoch": 0.39293660404990566, "percentage": 39.3, "elapsed_time": "5:16:32", "remaining_time": "8:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 4438, "loss": 0.1547, "learning_rate": 3.5556075862045636e-06, "epoch": 0.3931619117357141, "percentage": 39.32, "elapsed_time": "5:16:42", "remaining_time": "8:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 4438, "loss": 0.1492, "learning_rate": 3.5539186077613562e-06, "epoch": 0.3933872194215225, "percentage": 39.34, "elapsed_time": "5:16:53", "remaining_time": "8:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 4438, "loss": 0.1649, "learning_rate": 3.552229044116428e-06, "epoch": 0.39361252710733097, "percentage": 39.36, "elapsed_time": "5:17:04", "remaining_time": "8:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 4438, "loss": 0.1552, "learning_rate": 3.5505388962079337e-06, "epoch": 0.3938378347931394, "percentage": 39.39, "elapsed_time": "5:17:16", "remaining_time": "8:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 4438, "loss": 0.15, "learning_rate": 3.548848164974347e-06, "epoch": 0.3940631424789478, "percentage": 39.41, "elapsed_time": "5:17:28", "remaining_time": "8:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 4438, "loss": 0.1814, "learning_rate": 3.54715685135447e-06, "epoch": 0.3942884501647562, "percentage": 39.43, "elapsed_time": "5:17:38", "remaining_time": "8:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 4438, "loss": 0.1579, "learning_rate": 3.545464956287425e-06, "epoch": 0.3945137578505647, "percentage": 39.45, "elapsed_time": "5:17:50", "remaining_time": "8:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 4438, "loss": 0.146, "learning_rate": 3.5437724807126583e-06, "epoch": 0.3947390655363731, "percentage": 39.48, "elapsed_time": "5:18:00", "remaining_time": "8:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 4438, "loss": 0.1571, "learning_rate": 3.542079425569938e-06, "epoch": 0.39496437322218153, "percentage": 39.5, "elapsed_time": "5:18:11", "remaining_time": "8:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 4438, "loss": 0.1623, "learning_rate": 3.5403857917993554e-06, "epoch": 0.39518968090798995, "percentage": 39.52, "elapsed_time": "5:18:25", "remaining_time": "8:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 4438, "loss": 0.1685, "learning_rate": 3.5386915803413234e-06, "epoch": 0.3954149885937984, "percentage": 39.54, "elapsed_time": "5:18:36", "remaining_time": "8:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 4438, "loss": 0.1588, "learning_rate": 3.5369967921365718e-06, "epoch": 0.39564029627960684, "percentage": 39.57, "elapsed_time": "5:18:46", "remaining_time": "8:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 4438, "loss": 0.1561, "learning_rate": 3.5353014281261545e-06, "epoch": 0.39586560396541526, "percentage": 39.59, "elapsed_time": "5:18:58", "remaining_time": "8:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 4438, "loss": 0.165, "learning_rate": 3.5336054892514437e-06, "epoch": 0.3960909116512237, "percentage": 39.61, "elapsed_time": "5:19:09", "remaining_time": "8:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 4438, "loss": 0.1636, "learning_rate": 3.531908976454132e-06, "epoch": 0.39631621933703215, "percentage": 39.63, "elapsed_time": "5:19:20", "remaining_time": "8:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 4438, "loss": 0.1426, "learning_rate": 3.530211890676229e-06, "epoch": 0.39654152702284057, "percentage": 39.66, "elapsed_time": "5:19:30", "remaining_time": "8:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 4438, "loss": 0.1667, "learning_rate": 3.528514232860063e-06, "epoch": 0.396766834708649, "percentage": 39.68, "elapsed_time": "5:19:39", "remaining_time": "8:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.52681600394828e-06, "epoch": 0.3969921423944574, "percentage": 39.7, "elapsed_time": "5:19:50", "remaining_time": "8:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 4438, "loss": 0.1522, "learning_rate": 3.525117204883844e-06, "epoch": 0.3972174500802659, "percentage": 39.73, "elapsed_time": "5:20:01", "remaining_time": "8:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 4438, "loss": 0.1657, "learning_rate": 3.5234178366100343e-06, "epoch": 0.3974427577660743, "percentage": 39.75, "elapsed_time": "5:20:10", "remaining_time": "8:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 4438, "loss": 0.1525, "learning_rate": 3.5217179000704467e-06, "epoch": 0.3976680654518827, "percentage": 39.77, "elapsed_time": "5:20:19", "remaining_time": "8:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 4438, "loss": 0.1613, "learning_rate": 3.520017396208993e-06, "epoch": 0.3978933731376912, "percentage": 39.79, "elapsed_time": "5:20:30", "remaining_time": "8:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 4438, "loss": 0.1632, "learning_rate": 3.518316325969899e-06, "epoch": 0.3981186808234996, "percentage": 39.82, "elapsed_time": "5:20:40", "remaining_time": "8:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 4438, "loss": 0.1715, "learning_rate": 3.5166146902977055e-06, "epoch": 0.398343988509308, "percentage": 39.84, "elapsed_time": "5:20:52", "remaining_time": "8:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 4438, "loss": 0.1534, "learning_rate": 3.514912490137268e-06, "epoch": 0.39856929619511644, "percentage": 39.86, "elapsed_time": "5:21:01", "remaining_time": "8:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 4438, "loss": 0.1646, "learning_rate": 3.5132097264337546e-06, "epoch": 0.3987946038809249, "percentage": 39.88, "elapsed_time": "5:21:13", "remaining_time": "8:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 4438, "loss": 0.1568, "learning_rate": 3.5115064001326467e-06, "epoch": 0.39901991156673333, "percentage": 39.91, "elapsed_time": "5:21:24", "remaining_time": "8:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 4438, "loss": 0.158, "learning_rate": 3.5098025121797375e-06, "epoch": 0.39924521925254175, "percentage": 39.93, "elapsed_time": "5:21:33", "remaining_time": "8:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 4438, "loss": 0.1559, "learning_rate": 3.508098063521134e-06, "epoch": 0.39947052693835017, "percentage": 39.95, "elapsed_time": "5:21:44", "remaining_time": "8:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 4438, "loss": 0.1639, "learning_rate": 3.5063930551032494e-06, "epoch": 0.39969583462415864, "percentage": 39.97, "elapsed_time": "5:21:54", "remaining_time": "8:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 4438, "loss": 0.1533, "learning_rate": 3.504687487872815e-06, "epoch": 0.39992114230996706, "percentage": 40.0, "elapsed_time": "5:22:04", "remaining_time": "8:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 4438, "loss": 0.1779, "learning_rate": 3.5029813627768665e-06, "epoch": 0.4001464499957755, "percentage": 40.02, "elapsed_time": "5:22:15", "remaining_time": "8:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 4438, "loss": 0.1499, "learning_rate": 3.501274680762753e-06, "epoch": 0.4003717576815839, "percentage": 40.04, "elapsed_time": "5:22:24", "remaining_time": "8:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 4438, "loss": 0.1566, "learning_rate": 3.499567442778131e-06, "epoch": 0.40059706536739237, "percentage": 40.06, "elapsed_time": "5:22:35", "remaining_time": "8:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 4438, "loss": 0.1638, "learning_rate": 3.497859649770965e-06, "epoch": 0.4008223730532008, "percentage": 40.09, "elapsed_time": "5:22:47", "remaining_time": "8:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 4438, "loss": 0.1538, "learning_rate": 3.49615130268953e-06, "epoch": 0.4010476807390092, "percentage": 40.11, "elapsed_time": "5:22:58", "remaining_time": "8:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 4438, "loss": 0.1665, "learning_rate": 3.494442402482407e-06, "epoch": 0.4012729884248176, "percentage": 40.13, "elapsed_time": "5:23:09", "remaining_time": "8:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 4438, "loss": 0.1509, "learning_rate": 3.4927329500984857e-06, "epoch": 0.4014982961106261, "percentage": 40.15, "elapsed_time": "5:23:19", "remaining_time": "8:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 4438, "loss": 0.1701, "learning_rate": 3.4910229464869594e-06, "epoch": 0.4017236037964345, "percentage": 40.18, "elapsed_time": "5:23:31", "remaining_time": "8:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 4438, "loss": 0.159, "learning_rate": 3.489312392597331e-06, "epoch": 0.40194891148224293, "percentage": 40.2, "elapsed_time": "5:23:41", "remaining_time": "8:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 4438, "loss": 0.1796, "learning_rate": 3.4876012893794053e-06, "epoch": 0.40217421916805135, "percentage": 40.22, "elapsed_time": "5:23:52", "remaining_time": "8:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 4438, "loss": 0.138, "learning_rate": 3.4858896377832966e-06, "epoch": 0.4023995268538598, "percentage": 40.24, "elapsed_time": "5:24:02", "remaining_time": "8:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 4438, "loss": 0.1731, "learning_rate": 3.4841774387594202e-06, "epoch": 0.40262483453966824, "percentage": 40.27, "elapsed_time": "5:24:14", "remaining_time": "8:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 4438, "loss": 0.1462, "learning_rate": 3.482464693258496e-06, "epoch": 0.40285014222547666, "percentage": 40.29, "elapsed_time": "5:24:25", "remaining_time": "8:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 4438, "loss": 0.1532, "learning_rate": 3.4807514022315473e-06, "epoch": 0.4030754499112851, "percentage": 40.31, "elapsed_time": "5:24:35", "remaining_time": "8:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 4438, "loss": 0.1525, "learning_rate": 3.4790375666299026e-06, "epoch": 0.40330075759709355, "percentage": 40.33, "elapsed_time": "5:24:46", "remaining_time": "8:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 4438, "loss": 0.1657, "learning_rate": 3.4773231874051893e-06, "epoch": 0.40352606528290197, "percentage": 40.36, "elapsed_time": "5:24:56", "remaining_time": "8:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 4438, "loss": 0.1675, "learning_rate": 3.4756082655093387e-06, "epoch": 0.4037513729687104, "percentage": 40.38, "elapsed_time": "5:25:08", "remaining_time": "8:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 4438, "loss": 0.1592, "learning_rate": 3.4738928018945828e-06, "epoch": 0.4039766806545188, "percentage": 40.4, "elapsed_time": "5:25:19", "remaining_time": "7:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 4438, "loss": 0.1474, "learning_rate": 3.4721767975134557e-06, "epoch": 0.4042019883403273, "percentage": 40.42, "elapsed_time": "5:25:30", "remaining_time": "7:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 4438, "loss": 0.1573, "learning_rate": 3.470460253318789e-06, "epoch": 0.4044272960261357, "percentage": 40.45, "elapsed_time": "5:25:40", "remaining_time": "7:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 4438, "loss": 0.163, "learning_rate": 3.4687431702637165e-06, "epoch": 0.4046526037119441, "percentage": 40.47, "elapsed_time": "5:25:50", "remaining_time": "7:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 4438, "loss": 0.1699, "learning_rate": 3.4670255493016715e-06, "epoch": 0.40487791139775253, "percentage": 40.49, "elapsed_time": "5:26:01", "remaining_time": "7:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 4438, "loss": 0.1401, "learning_rate": 3.465307391386383e-06, "epoch": 0.405103219083561, "percentage": 40.51, "elapsed_time": "5:26:11", "remaining_time": "7:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 4438, "loss": 0.1676, "learning_rate": 3.4635886974718814e-06, "epoch": 0.4053285267693694, "percentage": 40.54, "elapsed_time": "5:26:22", "remaining_time": "7:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 4438, "loss": 0.1499, "learning_rate": 3.4618694685124927e-06, "epoch": 0.40555383445517784, "percentage": 40.56, "elapsed_time": "5:26:32", "remaining_time": "7:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 4438, "loss": 0.1677, "learning_rate": 3.4601497054628407e-06, "epoch": 0.40577914214098626, "percentage": 40.58, "elapsed_time": "5:26:43", "remaining_time": "7:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 4438, "loss": 0.157, "learning_rate": 3.458429409277846e-06, "epoch": 0.40600444982679473, "percentage": 40.6, "elapsed_time": "5:26:54", "remaining_time": "7:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 4438, "loss": 0.1531, "learning_rate": 3.4567085809127247e-06, "epoch": 0.40622975751260315, "percentage": 40.63, "elapsed_time": "5:27:05", "remaining_time": "7:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 4438, "loss": 0.1654, "learning_rate": 3.454987221322989e-06, "epoch": 0.40645506519841157, "percentage": 40.65, "elapsed_time": "5:27:14", "remaining_time": "7:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 4438, "loss": 0.1621, "learning_rate": 3.4532653314644453e-06, "epoch": 0.40668037288422, "percentage": 40.67, "elapsed_time": "5:27:25", "remaining_time": "7:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 4438, "loss": 0.15, "learning_rate": 3.4515429122931955e-06, "epoch": 0.40690568057002846, "percentage": 40.69, "elapsed_time": "5:27:36", "remaining_time": "7:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 4438, "loss": 0.148, "learning_rate": 3.4498199647656335e-06, "epoch": 0.4071309882558369, "percentage": 40.72, "elapsed_time": "5:27:48", "remaining_time": "7:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 4438, "loss": 0.1526, "learning_rate": 3.4480964898384495e-06, "epoch": 0.4073562959416453, "percentage": 40.74, "elapsed_time": "5:28:00", "remaining_time": "7:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 4438, "loss": 0.1675, "learning_rate": 3.4463724884686234e-06, "epoch": 0.4075816036274537, "percentage": 40.76, "elapsed_time": "5:28:11", "remaining_time": "7:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 4438, "loss": 0.1548, "learning_rate": 3.44464796161343e-06, "epoch": 0.4078069113132622, "percentage": 40.78, "elapsed_time": "5:28:23", "remaining_time": "7:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 4438, "loss": 0.1679, "learning_rate": 3.4429229102304336e-06, "epoch": 0.4080322189990706, "percentage": 40.81, "elapsed_time": "5:28:32", "remaining_time": "7:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 4438, "loss": 0.1703, "learning_rate": 3.4411973352774917e-06, "epoch": 0.408257526684879, "percentage": 40.83, "elapsed_time": "5:28:44", "remaining_time": "7:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 4438, "loss": 0.1581, "learning_rate": 3.4394712377127524e-06, "epoch": 0.4084828343706875, "percentage": 40.85, "elapsed_time": "5:28:55", "remaining_time": "7:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 4438, "loss": 0.1594, "learning_rate": 3.437744618494653e-06, "epoch": 0.4087081420564959, "percentage": 40.87, "elapsed_time": "5:29:06", "remaining_time": "7:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 4438, "loss": 0.1536, "learning_rate": 3.4360174785819196e-06, "epoch": 0.40893344974230433, "percentage": 40.9, "elapsed_time": "5:29:17", "remaining_time": "7:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 4438, "loss": 0.1582, "learning_rate": 3.4342898189335692e-06, "epoch": 0.40915875742811275, "percentage": 40.92, "elapsed_time": "5:29:28", "remaining_time": "7:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 4438, "loss": 0.1493, "learning_rate": 3.432561640508908e-06, "epoch": 0.4093840651139212, "percentage": 40.94, "elapsed_time": "5:29:39", "remaining_time": "7:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 4438, "loss": 0.1552, "learning_rate": 3.4308329442675276e-06, "epoch": 0.40960937279972964, "percentage": 40.96, "elapsed_time": "5:29:49", "remaining_time": "7:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 4438, "loss": 0.1401, "learning_rate": 3.4291037311693088e-06, "epoch": 0.40983468048553806, "percentage": 40.99, "elapsed_time": "5:29:59", "remaining_time": "7:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 4438, "loss": 0.1623, "learning_rate": 3.42737400217442e-06, "epoch": 0.4100599881713465, "percentage": 41.01, "elapsed_time": "5:30:10", "remaining_time": "7:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 4438, "loss": 0.1557, "learning_rate": 3.4256437582433144e-06, "epoch": 0.41028529585715495, "percentage": 41.03, "elapsed_time": "5:30:20", "remaining_time": "7:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 4438, "loss": 0.1612, "learning_rate": 3.423913000336732e-06, "epoch": 0.41051060354296337, "percentage": 41.05, "elapsed_time": "5:30:31", "remaining_time": "7:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 4438, "loss": 0.1384, "learning_rate": 3.422181729415699e-06, "epoch": 0.4107359112287718, "percentage": 41.08, "elapsed_time": "5:30:41", "remaining_time": "7:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 4438, "loss": 0.1674, "learning_rate": 3.4204499464415253e-06, "epoch": 0.4109612189145802, "percentage": 41.1, "elapsed_time": "5:30:52", "remaining_time": "7:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 4438, "loss": 0.1469, "learning_rate": 3.418717652375805e-06, "epoch": 0.4111865266003887, "percentage": 41.12, "elapsed_time": "5:31:02", "remaining_time": "7:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 4438, "loss": 0.1604, "learning_rate": 3.4169848481804165e-06, "epoch": 0.4114118342861971, "percentage": 41.14, "elapsed_time": "5:31:13", "remaining_time": "7:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 4438, "loss": 0.1626, "learning_rate": 3.415251534817521e-06, "epoch": 0.4116371419720055, "percentage": 41.17, "elapsed_time": "5:31:23", "remaining_time": "7:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 4438, "loss": 0.161, "learning_rate": 3.4135177132495632e-06, "epoch": 0.41186244965781393, "percentage": 41.19, "elapsed_time": "5:31:34", "remaining_time": "7:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 4438, "loss": 0.1698, "learning_rate": 3.4117833844392704e-06, "epoch": 0.4120877573436224, "percentage": 41.21, "elapsed_time": "5:31:45", "remaining_time": "7:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 4438, "loss": 0.1515, "learning_rate": 3.41004854934965e-06, "epoch": 0.4123130650294308, "percentage": 41.23, "elapsed_time": "5:31:55", "remaining_time": "7:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 4438, "loss": 0.1653, "learning_rate": 3.4083132089439912e-06, "epoch": 0.41253837271523924, "percentage": 41.26, "elapsed_time": "5:32:07", "remaining_time": "7:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 4438, "loss": 0.1665, "learning_rate": 3.406577364185864e-06, "epoch": 0.41276368040104766, "percentage": 41.28, "elapsed_time": "5:32:17", "remaining_time": "7:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 4438, "loss": 0.1717, "learning_rate": 3.404841016039118e-06, "epoch": 0.41298898808685613, "percentage": 41.3, "elapsed_time": "5:32:29", "remaining_time": "7:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 4438, "loss": 0.166, "learning_rate": 3.403104165467883e-06, "epoch": 0.41321429577266455, "percentage": 41.32, "elapsed_time": "5:32:40", "remaining_time": "7:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 4438, "loss": 0.151, "learning_rate": 3.4013668134365675e-06, "epoch": 0.41343960345847297, "percentage": 41.35, "elapsed_time": "5:32:50", "remaining_time": "7:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 4438, "loss": 0.1575, "learning_rate": 3.399628960909857e-06, "epoch": 0.4136649111442814, "percentage": 41.37, "elapsed_time": "5:33:00", "remaining_time": "7:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 4438, "loss": 0.1618, "learning_rate": 3.397890608852718e-06, "epoch": 0.41389021883008986, "percentage": 41.39, "elapsed_time": "5:33:11", "remaining_time": "7:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 4438, "loss": 0.1595, "learning_rate": 3.3961517582303916e-06, "epoch": 0.4141155265158983, "percentage": 41.42, "elapsed_time": "5:33:21", "remaining_time": "7:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 4438, "loss": 0.1629, "learning_rate": 3.394412410008397e-06, "epoch": 0.4143408342017067, "percentage": 41.44, "elapsed_time": "5:33:34", "remaining_time": "7:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 4438, "loss": 0.1573, "learning_rate": 3.39267256515253e-06, "epoch": 0.4145661418875151, "percentage": 41.46, "elapsed_time": "5:33:43", "remaining_time": "7:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 4438, "loss": 0.1392, "learning_rate": 3.3909322246288606e-06, "epoch": 0.4147914495733236, "percentage": 41.48, "elapsed_time": "5:33:54", "remaining_time": "7:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 4438, "loss": 0.1612, "learning_rate": 3.3891913894037354e-06, "epoch": 0.415016757259132, "percentage": 41.51, "elapsed_time": "5:34:04", "remaining_time": "7:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 4438, "loss": 0.1542, "learning_rate": 3.3874500604437752e-06, "epoch": 0.4152420649449404, "percentage": 41.53, "elapsed_time": "5:34:16", "remaining_time": "7:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 4438, "loss": 0.1515, "learning_rate": 3.385708238715876e-06, "epoch": 0.41546737263074884, "percentage": 41.55, "elapsed_time": "5:34:25", "remaining_time": "7:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 4438, "loss": 0.1439, "learning_rate": 3.3839659251872054e-06, "epoch": 0.4156926803165573, "percentage": 41.57, "elapsed_time": "5:34:35", "remaining_time": "7:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 4438, "loss": 0.1583, "learning_rate": 3.3822231208252053e-06, "epoch": 0.41591798800236573, "percentage": 41.6, "elapsed_time": "5:34:45", "remaining_time": "7:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 4438, "loss": 0.1758, "learning_rate": 3.38047982659759e-06, "epoch": 0.41614329568817415, "percentage": 41.62, "elapsed_time": "5:34:56", "remaining_time": "7:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 4438, "loss": 0.1559, "learning_rate": 3.3787360434723466e-06, "epoch": 0.41636860337398257, "percentage": 41.64, "elapsed_time": "5:35:08", "remaining_time": "7:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 4438, "loss": 0.1739, "learning_rate": 3.3769917724177315e-06, "epoch": 0.41659391105979104, "percentage": 41.66, "elapsed_time": "5:35:19", "remaining_time": "7:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 4438, "loss": 0.1502, "learning_rate": 3.3752470144022745e-06, "epoch": 0.41681921874559946, "percentage": 41.69, "elapsed_time": "5:35:30", "remaining_time": "7:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 4438, "loss": 0.1673, "learning_rate": 3.3735017703947748e-06, "epoch": 0.4170445264314079, "percentage": 41.71, "elapsed_time": "5:35:41", "remaining_time": "7:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 4438, "loss": 0.151, "learning_rate": 3.371756041364301e-06, "epoch": 0.4172698341172163, "percentage": 41.73, "elapsed_time": "5:35:52", "remaining_time": "7:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 4438, "loss": 0.1503, "learning_rate": 3.370009828280191e-06, "epoch": 0.41749514180302477, "percentage": 41.75, "elapsed_time": "5:36:03", "remaining_time": "7:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 4438, "loss": 0.1687, "learning_rate": 3.3682631321120507e-06, "epoch": 0.4177204494888332, "percentage": 41.78, "elapsed_time": "5:36:15", "remaining_time": "7:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 4438, "loss": 0.1853, "learning_rate": 3.366515953829758e-06, "epoch": 0.4179457571746416, "percentage": 41.8, "elapsed_time": "5:36:25", "remaining_time": "7:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 4438, "loss": 0.1683, "learning_rate": 3.364768294403455e-06, "epoch": 0.41817106486045, "percentage": 41.82, "elapsed_time": "5:36:35", "remaining_time": "7:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 4438, "loss": 0.1658, "learning_rate": 3.3630201548035512e-06, "epoch": 0.4183963725462585, "percentage": 41.84, "elapsed_time": "5:36:46", "remaining_time": "7:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 4438, "loss": 0.1575, "learning_rate": 3.361271536000723e-06, "epoch": 0.4186216802320669, "percentage": 41.87, "elapsed_time": "5:36:57", "remaining_time": "7:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 4438, "loss": 0.1625, "learning_rate": 3.359522438965915e-06, "epoch": 0.41884698791787534, "percentage": 41.89, "elapsed_time": "5:37:07", "remaining_time": "7:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 4438, "loss": 0.1474, "learning_rate": 3.3577728646703335e-06, "epoch": 0.41907229560368375, "percentage": 41.91, "elapsed_time": "5:37:19", "remaining_time": "7:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 4438, "loss": 0.1611, "learning_rate": 3.3560228140854534e-06, "epoch": 0.4192976032894922, "percentage": 41.93, "elapsed_time": "5:37:31", "remaining_time": "7:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 4438, "loss": 0.1669, "learning_rate": 3.354272288183012e-06, "epoch": 0.41952291097530064, "percentage": 41.96, "elapsed_time": "5:37:41", "remaining_time": "7:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 4438, "loss": 0.142, "learning_rate": 3.352521287935011e-06, "epoch": 0.41974821866110906, "percentage": 41.98, "elapsed_time": "5:37:52", "remaining_time": "7:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 4438, "loss": 0.156, "learning_rate": 3.3507698143137157e-06, "epoch": 0.41997352634691754, "percentage": 42.0, "elapsed_time": "5:38:03", "remaining_time": "7:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 4438, "loss": 0.1422, "learning_rate": 3.3490178682916534e-06, "epoch": 0.42019883403272595, "percentage": 42.02, "elapsed_time": "5:38:13", "remaining_time": "7:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 4438, "loss": 0.157, "learning_rate": 3.3472654508416157e-06, "epoch": 0.42042414171853437, "percentage": 42.05, "elapsed_time": "5:38:24", "remaining_time": "7:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 4438, "loss": 0.1588, "learning_rate": 3.3455125629366546e-06, "epoch": 0.4206494494043428, "percentage": 42.07, "elapsed_time": "5:38:36", "remaining_time": "7:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 4438, "loss": 0.1588, "learning_rate": 3.3437592055500825e-06, "epoch": 0.42087475709015126, "percentage": 42.09, "elapsed_time": "5:38:48", "remaining_time": "7:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 4438, "loss": 0.15, "learning_rate": 3.342005379655474e-06, "epoch": 0.4211000647759597, "percentage": 42.11, "elapsed_time": "5:38:59", "remaining_time": "7:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 4438, "loss": 0.157, "learning_rate": 3.340251086226663e-06, "epoch": 0.4213253724617681, "percentage": 42.14, "elapsed_time": "5:39:09", "remaining_time": "7:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 4438, "loss": 0.1662, "learning_rate": 3.3384963262377434e-06, "epoch": 0.4215506801475765, "percentage": 42.16, "elapsed_time": "5:39:19", "remaining_time": "7:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 4438, "loss": 0.1662, "learning_rate": 3.3367411006630677e-06, "epoch": 0.421775987833385, "percentage": 42.18, "elapsed_time": "5:39:29", "remaining_time": "7:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 4438, "loss": 0.1708, "learning_rate": 3.3349854104772476e-06, "epoch": 0.4220012955191934, "percentage": 42.2, "elapsed_time": "5:39:41", "remaining_time": "7:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 4438, "loss": 0.1485, "learning_rate": 3.333229256655153e-06, "epoch": 0.4222266032050018, "percentage": 42.23, "elapsed_time": "5:39:53", "remaining_time": "7:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 4438, "loss": 0.147, "learning_rate": 3.3314726401719088e-06, "epoch": 0.42245191089081024, "percentage": 42.25, "elapsed_time": "5:40:04", "remaining_time": "7:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 4438, "loss": 0.1473, "learning_rate": 3.3297155620029e-06, "epoch": 0.4226772185766187, "percentage": 42.27, "elapsed_time": "5:40:15", "remaining_time": "7:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 4438, "loss": 0.1525, "learning_rate": 3.3279580231237664e-06, "epoch": 0.42290252626242714, "percentage": 42.29, "elapsed_time": "5:40:26", "remaining_time": "7:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 4438, "loss": 0.1549, "learning_rate": 3.326200024510405e-06, "epoch": 0.42312783394823555, "percentage": 42.32, "elapsed_time": "5:40:36", "remaining_time": "7:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 4438, "loss": 0.1587, "learning_rate": 3.324441567138965e-06, "epoch": 0.423353141634044, "percentage": 42.34, "elapsed_time": "5:40:45", "remaining_time": "7:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 4438, "loss": 0.1436, "learning_rate": 3.3226826519858526e-06, "epoch": 0.42357844931985245, "percentage": 42.36, "elapsed_time": "5:40:55", "remaining_time": "7:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 4438, "loss": 0.1551, "learning_rate": 3.320923280027728e-06, "epoch": 0.42380375700566086, "percentage": 42.38, "elapsed_time": "5:41:05", "remaining_time": "7:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 4438, "loss": 0.1445, "learning_rate": 3.3191634522415064e-06, "epoch": 0.4240290646914693, "percentage": 42.41, "elapsed_time": "5:41:17", "remaining_time": "7:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 4438, "loss": 0.1536, "learning_rate": 3.317403169604352e-06, "epoch": 0.4242543723772777, "percentage": 42.43, "elapsed_time": "5:41:27", "remaining_time": "7:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 4438, "loss": 0.1438, "learning_rate": 3.315642433093686e-06, "epoch": 0.4244796800630862, "percentage": 42.45, "elapsed_time": "5:41:37", "remaining_time": "7:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 4438, "loss": 0.154, "learning_rate": 3.313881243687179e-06, "epoch": 0.4247049877488946, "percentage": 42.47, "elapsed_time": "5:41:48", "remaining_time": "7:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 4438, "loss": 0.1705, "learning_rate": 3.3121196023627543e-06, "epoch": 0.424930295434703, "percentage": 42.5, "elapsed_time": "5:41:59", "remaining_time": "7:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 4438, "loss": 0.154, "learning_rate": 3.3103575100985852e-06, "epoch": 0.4251556031205114, "percentage": 42.52, "elapsed_time": "5:42:10", "remaining_time": "7:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 4438, "loss": 0.1383, "learning_rate": 3.3085949678730953e-06, "epoch": 0.4253809108063199, "percentage": 42.54, "elapsed_time": "5:42:20", "remaining_time": "7:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 4438, "loss": 0.137, "learning_rate": 3.3068319766649605e-06, "epoch": 0.4256062184921283, "percentage": 42.56, "elapsed_time": "5:42:31", "remaining_time": "7:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 4438, "loss": 0.165, "learning_rate": 3.305068537453102e-06, "epoch": 0.42583152617793674, "percentage": 42.59, "elapsed_time": "5:42:41", "remaining_time": "7:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 4438, "loss": 0.1554, "learning_rate": 3.303304651216693e-06, "epoch": 0.42605683386374515, "percentage": 42.61, "elapsed_time": "5:42:52", "remaining_time": "7:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 4438, "loss": 0.1691, "learning_rate": 3.3015403189351536e-06, "epoch": 0.42628214154955363, "percentage": 42.63, "elapsed_time": "5:43:05", "remaining_time": "7:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 4438, "loss": 0.1452, "learning_rate": 3.2997755415881516e-06, "epoch": 0.42650744923536205, "percentage": 42.65, "elapsed_time": "5:43:16", "remaining_time": "7:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 4438, "loss": 0.1636, "learning_rate": 3.2980103201556023e-06, "epoch": 0.42673275692117046, "percentage": 42.68, "elapsed_time": "5:43:27", "remaining_time": "7:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 4438, "loss": 0.1691, "learning_rate": 3.2962446556176676e-06, "epoch": 0.4269580646069789, "percentage": 42.7, "elapsed_time": "5:43:38", "remaining_time": "7:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 4438, "loss": 0.154, "learning_rate": 3.2944785489547544e-06, "epoch": 0.42718337229278736, "percentage": 42.72, "elapsed_time": "5:43:49", "remaining_time": "7:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 4438, "loss": 0.1511, "learning_rate": 3.2927120011475168e-06, "epoch": 0.4274086799785958, "percentage": 42.74, "elapsed_time": "5:44:00", "remaining_time": "7:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 4438, "loss": 0.157, "learning_rate": 3.290945013176852e-06, "epoch": 0.4276339876644042, "percentage": 42.77, "elapsed_time": "5:44:12", "remaining_time": "7:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 4438, "loss": 0.1429, "learning_rate": 3.2891775860239033e-06, "epoch": 0.4278592953502126, "percentage": 42.79, "elapsed_time": "5:44:22", "remaining_time": "7:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 4438, "loss": 0.1699, "learning_rate": 3.2874097206700566e-06, "epoch": 0.4280846030360211, "percentage": 42.81, "elapsed_time": "5:44:33", "remaining_time": "7:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 4438, "loss": 0.1698, "learning_rate": 3.285641418096942e-06, "epoch": 0.4283099107218295, "percentage": 42.83, "elapsed_time": "5:44:43", "remaining_time": "7:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 4438, "loss": 0.1499, "learning_rate": 3.2838726792864315e-06, "epoch": 0.4285352184076379, "percentage": 42.86, "elapsed_time": "5:44:53", "remaining_time": "7:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 4438, "loss": 0.1545, "learning_rate": 3.2821035052206413e-06, "epoch": 0.42876052609344634, "percentage": 42.88, "elapsed_time": "5:45:04", "remaining_time": "7:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 4438, "loss": 0.1487, "learning_rate": 3.2803338968819264e-06, "epoch": 0.4289858337792548, "percentage": 42.9, "elapsed_time": "5:45:14", "remaining_time": "7:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 4438, "loss": 0.162, "learning_rate": 3.278563855252885e-06, "epoch": 0.42921114146506323, "percentage": 42.92, "elapsed_time": "5:45:25", "remaining_time": "7:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 4438, "loss": 0.1441, "learning_rate": 3.2767933813163542e-06, "epoch": 0.42943644915087165, "percentage": 42.95, "elapsed_time": "5:45:35", "remaining_time": "7:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 4438, "loss": 0.1523, "learning_rate": 3.2750224760554135e-06, "epoch": 0.42966175683668006, "percentage": 42.97, "elapsed_time": "5:45:44", "remaining_time": "7:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 4438, "loss": 0.1611, "learning_rate": 3.2732511404533797e-06, "epoch": 0.42988706452248854, "percentage": 42.99, "elapsed_time": "5:45:55", "remaining_time": "7:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 4438, "loss": 0.173, "learning_rate": 3.2714793754938102e-06, "epoch": 0.43011237220829696, "percentage": 43.01, "elapsed_time": "5:46:08", "remaining_time": "7:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 4438, "loss": 0.1572, "learning_rate": 3.2697071821604986e-06, "epoch": 0.4303376798941054, "percentage": 43.04, "elapsed_time": "5:46:19", "remaining_time": "7:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 4438, "loss": 0.1691, "learning_rate": 3.2679345614374802e-06, "epoch": 0.43056298757991385, "percentage": 43.06, "elapsed_time": "5:46:32", "remaining_time": "7:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 4438, "loss": 0.1624, "learning_rate": 3.266161514309023e-06, "epoch": 0.43078829526572227, "percentage": 43.08, "elapsed_time": "5:46:44", "remaining_time": "7:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 4438, "loss": 0.167, "learning_rate": 3.264388041759635e-06, "epoch": 0.4310136029515307, "percentage": 43.11, "elapsed_time": "5:46:53", "remaining_time": "7:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 4438, "loss": 0.17, "learning_rate": 3.262614144774059e-06, "epoch": 0.4312389106373391, "percentage": 43.13, "elapsed_time": "5:47:05", "remaining_time": "7:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 4438, "loss": 0.1437, "learning_rate": 3.260839824337274e-06, "epoch": 0.4314642183231476, "percentage": 43.15, "elapsed_time": "5:47:16", "remaining_time": "7:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 4438, "loss": 0.1522, "learning_rate": 3.259065081434495e-06, "epoch": 0.431689526008956, "percentage": 43.17, "elapsed_time": "5:47:25", "remaining_time": "7:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 4438, "loss": 0.1664, "learning_rate": 3.2572899170511683e-06, "epoch": 0.4319148336947644, "percentage": 43.2, "elapsed_time": "5:47:34", "remaining_time": "7:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 4438, "loss": 0.1615, "learning_rate": 3.255514332172979e-06, "epoch": 0.43214014138057283, "percentage": 43.22, "elapsed_time": "5:47:47", "remaining_time": "7:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1919, "total_steps": 4438, "loss": 0.1518, "learning_rate": 3.2537383277858413e-06, "epoch": 0.4323654490663813, "percentage": 43.24, "elapsed_time": "5:47:58", "remaining_time": "7:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 4438, "loss": 0.1508, "learning_rate": 3.2519619048759056e-06, "epoch": 0.4325907567521897, "percentage": 43.26, "elapsed_time": "5:48:08", "remaining_time": "7:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1921, "total_steps": 4438, "loss": 0.1668, "learning_rate": 3.250185064429552e-06, "epoch": 0.43281606443799814, "percentage": 43.29, "elapsed_time": "5:48:19", "remaining_time": "7:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1922, "total_steps": 4438, "loss": 0.1635, "learning_rate": 3.248407807433396e-06, "epoch": 0.43304137212380656, "percentage": 43.31, "elapsed_time": "5:48:30", "remaining_time": "7:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1923, "total_steps": 4438, "loss": 0.1566, "learning_rate": 3.246630134874279e-06, "epoch": 0.43326667980961503, "percentage": 43.33, "elapsed_time": "5:48:41", "remaining_time": "7:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1924, "total_steps": 4438, "loss": 0.1751, "learning_rate": 3.2448520477392788e-06, "epoch": 0.43349198749542345, "percentage": 43.35, "elapsed_time": "5:48:53", "remaining_time": "7:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1925, "total_steps": 4438, "loss": 0.1559, "learning_rate": 3.2430735470157e-06, "epoch": 0.43371729518123187, "percentage": 43.38, "elapsed_time": "5:49:04", "remaining_time": "7:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1926, "total_steps": 4438, "loss": 0.1716, "learning_rate": 3.2412946336910778e-06, "epoch": 0.4339426028670403, "percentage": 43.4, "elapsed_time": "5:49:15", "remaining_time": "7:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1927, "total_steps": 4438, "loss": 0.1722, "learning_rate": 3.2395153087531767e-06, "epoch": 0.43416791055284876, "percentage": 43.42, "elapsed_time": "5:49:27", "remaining_time": "7:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1928, "total_steps": 4438, "loss": 0.1645, "learning_rate": 3.237735573189989e-06, "epoch": 0.4343932182386572, "percentage": 43.44, "elapsed_time": "5:49:37", "remaining_time": "7:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1929, "total_steps": 4438, "loss": 0.1372, "learning_rate": 3.2359554279897353e-06, "epoch": 0.4346185259244656, "percentage": 43.47, "elapsed_time": "5:49:47", "remaining_time": "7:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 4438, "loss": 0.1459, "learning_rate": 3.234174874140866e-06, "epoch": 0.434843833610274, "percentage": 43.49, "elapsed_time": "5:49:57", "remaining_time": "7:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1931, "total_steps": 4438, "loss": 0.1491, "learning_rate": 3.232393912632054e-06, "epoch": 0.4350691412960825, "percentage": 43.51, "elapsed_time": "5:50:09", "remaining_time": "7:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1932, "total_steps": 4438, "loss": 0.1583, "learning_rate": 3.230612544452202e-06, "epoch": 0.4352944489818909, "percentage": 43.53, "elapsed_time": "5:50:20", "remaining_time": "7:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1933, "total_steps": 4438, "loss": 0.1488, "learning_rate": 3.228830770590436e-06, "epoch": 0.4355197566676993, "percentage": 43.56, "elapsed_time": "5:50:30", "remaining_time": "7:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1934, "total_steps": 4438, "loss": 0.1551, "learning_rate": 3.2270485920361093e-06, "epoch": 0.43574506435350774, "percentage": 43.58, "elapsed_time": "5:50:40", "remaining_time": "7:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1935, "total_steps": 4438, "loss": 0.1638, "learning_rate": 3.2252660097788003e-06, "epoch": 0.4359703720393162, "percentage": 43.6, "elapsed_time": "5:50:51", "remaining_time": "7:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1936, "total_steps": 4438, "loss": 0.1581, "learning_rate": 3.2234830248083095e-06, "epoch": 0.43619567972512463, "percentage": 43.62, "elapsed_time": "5:51:01", "remaining_time": "7:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1937, "total_steps": 4438, "loss": 0.15, "learning_rate": 3.2216996381146613e-06, "epoch": 0.43642098741093305, "percentage": 43.65, "elapsed_time": "5:51:10", "remaining_time": "7:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1938, "total_steps": 4438, "loss": 0.1386, "learning_rate": 3.219915850688106e-06, "epoch": 0.43664629509674147, "percentage": 43.67, "elapsed_time": "5:51:20", "remaining_time": "7:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1939, "total_steps": 4438, "loss": 0.1528, "learning_rate": 3.2181316635191125e-06, "epoch": 0.43687160278254994, "percentage": 43.69, "elapsed_time": "5:51:30", "remaining_time": "7:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 4438, "loss": 0.147, "learning_rate": 3.2163470775983733e-06, "epoch": 0.43709691046835836, "percentage": 43.71, "elapsed_time": "5:51:41", "remaining_time": "7:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1941, "total_steps": 4438, "loss": 0.1599, "learning_rate": 3.2145620939168036e-06, "epoch": 0.4373222181541668, "percentage": 43.74, "elapsed_time": "5:51:50", "remaining_time": "7:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1942, "total_steps": 4438, "loss": 0.1613, "learning_rate": 3.2127767134655374e-06, "epoch": 0.4375475258399752, "percentage": 43.76, "elapsed_time": "5:52:02", "remaining_time": "7:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1943, "total_steps": 4438, "loss": 0.1481, "learning_rate": 3.210990937235931e-06, "epoch": 0.43777283352578367, "percentage": 43.78, "elapsed_time": "5:52:13", "remaining_time": "7:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1944, "total_steps": 4438, "loss": 0.1644, "learning_rate": 3.209204766219558e-06, "epoch": 0.4379981412115921, "percentage": 43.8, "elapsed_time": "5:52:26", "remaining_time": "7:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1945, "total_steps": 4438, "loss": 0.1401, "learning_rate": 3.207418201408213e-06, "epoch": 0.4382234488974005, "percentage": 43.83, "elapsed_time": "5:52:36", "remaining_time": "7:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1946, "total_steps": 4438, "loss": 0.1542, "learning_rate": 3.205631243793909e-06, "epoch": 0.4384487565832089, "percentage": 43.85, "elapsed_time": "5:52:47", "remaining_time": "7:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1947, "total_steps": 4438, "loss": 0.161, "learning_rate": 3.2038438943688777e-06, "epoch": 0.4386740642690174, "percentage": 43.87, "elapsed_time": "5:52:57", "remaining_time": "7:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1948, "total_steps": 4438, "loss": 0.1628, "learning_rate": 3.202056154125567e-06, "epoch": 0.4388993719548258, "percentage": 43.89, "elapsed_time": "5:53:07", "remaining_time": "7:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1949, "total_steps": 4438, "loss": 0.1494, "learning_rate": 3.2002680240566412e-06, "epoch": 0.43912467964063423, "percentage": 43.92, "elapsed_time": "5:53:18", "remaining_time": "7:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 4438, "loss": 0.1561, "learning_rate": 3.198479505154984e-06, "epoch": 0.43934998732644265, "percentage": 43.94, "elapsed_time": "5:53:29", "remaining_time": "7:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1951, "total_steps": 4438, "loss": 0.1564, "learning_rate": 3.1966905984136932e-06, "epoch": 0.4395752950122511, "percentage": 43.96, "elapsed_time": "5:53:40", "remaining_time": "7:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1952, "total_steps": 4438, "loss": 0.1723, "learning_rate": 3.1949013048260813e-06, "epoch": 0.43980060269805954, "percentage": 43.98, "elapsed_time": "5:53:51", "remaining_time": "7:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1953, "total_steps": 4438, "loss": 0.1554, "learning_rate": 3.1931116253856762e-06, "epoch": 0.44002591038386796, "percentage": 44.01, "elapsed_time": "5:54:01", "remaining_time": "7:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1954, "total_steps": 4438, "loss": 0.1603, "learning_rate": 3.1913215610862208e-06, "epoch": 0.4402512180696764, "percentage": 44.03, "elapsed_time": "5:54:11", "remaining_time": "7:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1955, "total_steps": 4438, "loss": 0.1503, "learning_rate": 3.189531112921671e-06, "epoch": 0.44047652575548485, "percentage": 44.05, "elapsed_time": "5:54:22", "remaining_time": "7:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1956, "total_steps": 4438, "loss": 0.1347, "learning_rate": 3.1877402818861954e-06, "epoch": 0.44070183344129327, "percentage": 44.07, "elapsed_time": "5:54:33", "remaining_time": "7:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1957, "total_steps": 4438, "loss": 0.1578, "learning_rate": 3.185949068974177e-06, "epoch": 0.4409271411271017, "percentage": 44.1, "elapsed_time": "5:54:43", "remaining_time": "7:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1958, "total_steps": 4438, "loss": 0.1503, "learning_rate": 3.184157475180208e-06, "epoch": 0.4411524488129101, "percentage": 44.12, "elapsed_time": "5:54:53", "remaining_time": "7:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1959, "total_steps": 4438, "loss": 0.1559, "learning_rate": 3.1823655014990937e-06, "epoch": 0.4413777564987186, "percentage": 44.14, "elapsed_time": "5:55:04", "remaining_time": "7:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 4438, "loss": 0.1477, "learning_rate": 3.1805731489258516e-06, "epoch": 0.441603064184527, "percentage": 44.16, "elapsed_time": "5:55:14", "remaining_time": "7:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1961, "total_steps": 4438, "loss": 0.1478, "learning_rate": 3.1787804184557074e-06, "epoch": 0.4418283718703354, "percentage": 44.19, "elapsed_time": "5:55:24", "remaining_time": "7:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1962, "total_steps": 4438, "loss": 0.1525, "learning_rate": 3.1769873110840977e-06, "epoch": 0.4420536795561439, "percentage": 44.21, "elapsed_time": "5:55:34", "remaining_time": "7:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1963, "total_steps": 4438, "loss": 0.1518, "learning_rate": 3.1751938278066687e-06, "epoch": 0.4422789872419523, "percentage": 44.23, "elapsed_time": "5:55:45", "remaining_time": "7:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1964, "total_steps": 4438, "loss": 0.1597, "learning_rate": 3.1733999696192736e-06, "epoch": 0.4425042949277607, "percentage": 44.25, "elapsed_time": "5:55:56", "remaining_time": "7:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1965, "total_steps": 4438, "loss": 0.1564, "learning_rate": 3.171605737517976e-06, "epoch": 0.44272960261356914, "percentage": 44.28, "elapsed_time": "5:56:07", "remaining_time": "7:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1966, "total_steps": 4438, "loss": 0.1435, "learning_rate": 3.1698111324990454e-06, "epoch": 0.4429549102993776, "percentage": 44.3, "elapsed_time": "5:56:18", "remaining_time": "7:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1967, "total_steps": 4438, "loss": 0.1623, "learning_rate": 3.16801615555896e-06, "epoch": 0.44318021798518603, "percentage": 44.32, "elapsed_time": "5:56:28", "remaining_time": "7:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1968, "total_steps": 4438, "loss": 0.1487, "learning_rate": 3.1662208076944027e-06, "epoch": 0.44340552567099445, "percentage": 44.34, "elapsed_time": "5:56:38", "remaining_time": "7:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1969, "total_steps": 4438, "loss": 0.1426, "learning_rate": 3.1644250899022637e-06, "epoch": 0.44363083335680287, "percentage": 44.37, "elapsed_time": "5:56:50", "remaining_time": "7:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 4438, "loss": 0.1498, "learning_rate": 3.162629003179638e-06, "epoch": 0.44385614104261134, "percentage": 44.39, "elapsed_time": "5:57:01", "remaining_time": "7:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1971, "total_steps": 4438, "loss": 0.1491, "learning_rate": 3.1608325485238257e-06, "epoch": 0.44408144872841976, "percentage": 44.41, "elapsed_time": "5:57:12", "remaining_time": "7:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1972, "total_steps": 4438, "loss": 0.1639, "learning_rate": 3.1590357269323312e-06, "epoch": 0.4443067564142282, "percentage": 44.43, "elapsed_time": "5:57:23", "remaining_time": "7:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1973, "total_steps": 4438, "loss": 0.1664, "learning_rate": 3.157238539402862e-06, "epoch": 0.4445320641000366, "percentage": 44.46, "elapsed_time": "5:57:32", "remaining_time": "7:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1974, "total_steps": 4438, "loss": 0.1717, "learning_rate": 3.15544098693333e-06, "epoch": 0.44475737178584507, "percentage": 44.48, "elapsed_time": "5:57:43", "remaining_time": "7:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1975, "total_steps": 4438, "loss": 0.1483, "learning_rate": 3.15364307052185e-06, "epoch": 0.4449826794716535, "percentage": 44.5, "elapsed_time": "5:57:54", "remaining_time": "7:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1976, "total_steps": 4438, "loss": 0.1577, "learning_rate": 3.151844791166735e-06, "epoch": 0.4452079871574619, "percentage": 44.52, "elapsed_time": "5:58:04", "remaining_time": "7:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1977, "total_steps": 4438, "loss": 0.1712, "learning_rate": 3.1500461498665053e-06, "epoch": 0.4454332948432703, "percentage": 44.55, "elapsed_time": "5:58:16", "remaining_time": "7:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1978, "total_steps": 4438, "loss": 0.1579, "learning_rate": 3.1482471476198784e-06, "epoch": 0.4456586025290788, "percentage": 44.57, "elapsed_time": "5:58:27", "remaining_time": "7:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1979, "total_steps": 4438, "loss": 0.1481, "learning_rate": 3.1464477854257726e-06, "epoch": 0.4458839102148872, "percentage": 44.59, "elapsed_time": "5:58:35", "remaining_time": "7:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 4438, "loss": 0.1521, "learning_rate": 3.1446480642833077e-06, "epoch": 0.44610921790069563, "percentage": 44.61, "elapsed_time": "5:58:46", "remaining_time": "7:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1981, "total_steps": 4438, "loss": 0.1591, "learning_rate": 3.1428479851918014e-06, "epoch": 0.44633452558650405, "percentage": 44.64, "elapsed_time": "5:58:58", "remaining_time": "7:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1982, "total_steps": 4438, "loss": 0.16, "learning_rate": 3.14104754915077e-06, "epoch": 0.4465598332723125, "percentage": 44.66, "elapsed_time": "5:59:09", "remaining_time": "7:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1983, "total_steps": 4438, "loss": 0.161, "learning_rate": 3.1392467571599288e-06, "epoch": 0.44678514095812094, "percentage": 44.68, "elapsed_time": "5:59:21", "remaining_time": "7:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1984, "total_steps": 4438, "loss": 0.1504, "learning_rate": 3.137445610219192e-06, "epoch": 0.44701044864392936, "percentage": 44.7, "elapsed_time": "5:59:33", "remaining_time": "7:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1985, "total_steps": 4438, "loss": 0.1591, "learning_rate": 3.1356441093286673e-06, "epoch": 0.4472357563297378, "percentage": 44.73, "elapsed_time": "5:59:43", "remaining_time": "7:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1986, "total_steps": 4438, "loss": 0.1712, "learning_rate": 3.133842255488661e-06, "epoch": 0.44746106401554625, "percentage": 44.75, "elapsed_time": "5:59:54", "remaining_time": "7:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1987, "total_steps": 4438, "loss": 0.1724, "learning_rate": 3.132040049699676e-06, "epoch": 0.44768637170135467, "percentage": 44.77, "elapsed_time": "6:00:05", "remaining_time": "7:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1988, "total_steps": 4438, "loss": 0.1599, "learning_rate": 3.130237492962411e-06, "epoch": 0.4479116793871631, "percentage": 44.79, "elapsed_time": "6:00:17", "remaining_time": "7:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1989, "total_steps": 4438, "loss": 0.1522, "learning_rate": 3.1284345862777572e-06, "epoch": 0.4481369870729715, "percentage": 44.82, "elapsed_time": "6:00:28", "remaining_time": "7:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 4438, "loss": 0.1491, "learning_rate": 3.1266313306468018e-06, "epoch": 0.44836229475878, "percentage": 44.84, "elapsed_time": "6:00:37", "remaining_time": "7:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1991, "total_steps": 4438, "loss": 0.1534, "learning_rate": 3.1248277270708255e-06, "epoch": 0.4485876024445884, "percentage": 44.86, "elapsed_time": "6:00:47", "remaining_time": "7:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1992, "total_steps": 4438, "loss": 0.1679, "learning_rate": 3.1230237765513023e-06, "epoch": 0.4488129101303968, "percentage": 44.89, "elapsed_time": "6:00:59", "remaining_time": "7:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1993, "total_steps": 4438, "loss": 0.1402, "learning_rate": 3.121219480089899e-06, "epoch": 0.44903821781620523, "percentage": 44.91, "elapsed_time": "6:01:10", "remaining_time": "7:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1994, "total_steps": 4438, "loss": 0.1521, "learning_rate": 3.119414838688473e-06, "epoch": 0.4492635255020137, "percentage": 44.93, "elapsed_time": "6:01:21", "remaining_time": "7:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1995, "total_steps": 4438, "loss": 0.1351, "learning_rate": 3.1176098533490755e-06, "epoch": 0.4494888331878221, "percentage": 44.95, "elapsed_time": "6:01:31", "remaining_time": "7:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1996, "total_steps": 4438, "loss": 0.1669, "learning_rate": 3.1158045250739473e-06, "epoch": 0.44971414087363054, "percentage": 44.98, "elapsed_time": "6:01:42", "remaining_time": "7:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1997, "total_steps": 4438, "loss": 0.1475, "learning_rate": 3.11399885486552e-06, "epoch": 0.44993944855943896, "percentage": 45.0, "elapsed_time": "6:01:53", "remaining_time": "7:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1998, "total_steps": 4438, "loss": 0.153, "learning_rate": 3.1121928437264138e-06, "epoch": 0.45016475624524743, "percentage": 45.02, "elapsed_time": "6:02:04", "remaining_time": "7:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1999, "total_steps": 4438, "loss": 0.1474, "learning_rate": 3.1103864926594406e-06, "epoch": 0.45039006393105585, "percentage": 45.04, "elapsed_time": "6:02:14", "remaining_time": "7:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 4438, "loss": 0.1492, "learning_rate": 3.1085798026676e-06, "epoch": 0.45061537161686427, "percentage": 45.07, "elapsed_time": "6:02:25", "remaining_time": "7:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 4438, "eval_loss": 0.15435218811035156, "epoch": 0.45061537161686427, "percentage": 45.07, "elapsed_time": "6:04:28", "remaining_time": "7:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2001, "total_steps": 4438, "loss": 0.1387, "learning_rate": 3.1067727747540797e-06, "epoch": 0.4508406793026727, "percentage": 45.09, "elapsed_time": "6:04:39", "remaining_time": "7:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2002, "total_steps": 4438, "loss": 0.155, "learning_rate": 3.1049654099222542e-06, "epoch": 0.45106598698848116, "percentage": 45.11, "elapsed_time": "6:04:49", "remaining_time": "7:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2003, "total_steps": 4438, "loss": 0.1476, "learning_rate": 3.1031577091756852e-06, "epoch": 0.4512912946742896, "percentage": 45.13, "elapsed_time": "6:05:00", "remaining_time": "7:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2004, "total_steps": 4438, "loss": 0.1454, "learning_rate": 3.1013496735181232e-06, "epoch": 0.451516602360098, "percentage": 45.16, "elapsed_time": "6:05:10", "remaining_time": "7:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2005, "total_steps": 4438, "loss": 0.1503, "learning_rate": 3.0995413039535017e-06, "epoch": 0.4517419100459064, "percentage": 45.18, "elapsed_time": "6:05:19", "remaining_time": "7:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2006, "total_steps": 4438, "loss": 0.1707, "learning_rate": 3.0977326014859415e-06, "epoch": 0.4519672177317149, "percentage": 45.2, "elapsed_time": "6:05:31", "remaining_time": "7:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2007, "total_steps": 4438, "loss": 0.1494, "learning_rate": 3.095923567119748e-06, "epoch": 0.4521925254175233, "percentage": 45.22, "elapsed_time": "6:05:42", "remaining_time": "7:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2008, "total_steps": 4438, "loss": 0.1585, "learning_rate": 3.09411420185941e-06, "epoch": 0.4524178331033317, "percentage": 45.25, "elapsed_time": "6:05:53", "remaining_time": "7:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2009, "total_steps": 4438, "loss": 0.1468, "learning_rate": 3.0923045067096e-06, "epoch": 0.4526431407891402, "percentage": 45.27, "elapsed_time": "6:06:03", "remaining_time": "7:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 4438, "loss": 0.1687, "learning_rate": 3.090494482675176e-06, "epoch": 0.4528684484749486, "percentage": 45.29, "elapsed_time": "6:06:14", "remaining_time": "7:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2011, "total_steps": 4438, "loss": 0.1585, "learning_rate": 3.088684130761175e-06, "epoch": 0.45309375616075703, "percentage": 45.31, "elapsed_time": "6:06:26", "remaining_time": "7:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2012, "total_steps": 4438, "loss": 0.1368, "learning_rate": 3.0868734519728194e-06, "epoch": 0.45331906384656545, "percentage": 45.34, "elapsed_time": "6:06:36", "remaining_time": "7:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2013, "total_steps": 4438, "loss": 0.168, "learning_rate": 3.085062447315511e-06, "epoch": 0.4535443715323739, "percentage": 45.36, "elapsed_time": "6:06:47", "remaining_time": "7:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2014, "total_steps": 4438, "loss": 0.1426, "learning_rate": 3.0832511177948326e-06, "epoch": 0.45376967921818234, "percentage": 45.38, "elapsed_time": "6:06:58", "remaining_time": "7:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2015, "total_steps": 4438, "loss": 0.1678, "learning_rate": 3.081439464416549e-06, "epoch": 0.45399498690399076, "percentage": 45.4, "elapsed_time": "6:07:08", "remaining_time": "7:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2016, "total_steps": 4438, "loss": 0.1617, "learning_rate": 3.0796274881866034e-06, "epoch": 0.4542202945897992, "percentage": 45.43, "elapsed_time": "6:07:18", "remaining_time": "7:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2017, "total_steps": 4438, "loss": 0.1584, "learning_rate": 3.0778151901111187e-06, "epoch": 0.45444560227560765, "percentage": 45.45, "elapsed_time": "6:07:30", "remaining_time": "7:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2018, "total_steps": 4438, "loss": 0.1382, "learning_rate": 3.0760025711963964e-06, "epoch": 0.45467090996141607, "percentage": 45.47, "elapsed_time": "6:07:39", "remaining_time": "7:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2019, "total_steps": 4438, "loss": 0.168, "learning_rate": 3.0741896324489163e-06, "epoch": 0.4548962176472245, "percentage": 45.49, "elapsed_time": "6:07:50", "remaining_time": "7:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 4438, "loss": 0.1495, "learning_rate": 3.0723763748753354e-06, "epoch": 0.4551215253330329, "percentage": 45.52, "elapsed_time": "6:08:01", "remaining_time": "7:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2021, "total_steps": 4438, "loss": 0.1561, "learning_rate": 3.0705627994824887e-06, "epoch": 0.4553468330188414, "percentage": 45.54, "elapsed_time": "6:08:11", "remaining_time": "7:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2022, "total_steps": 4438, "loss": 0.1472, "learning_rate": 3.0687489072773864e-06, "epoch": 0.4555721407046498, "percentage": 45.56, "elapsed_time": "6:08:22", "remaining_time": "7:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2023, "total_steps": 4438, "loss": 0.1451, "learning_rate": 3.0669346992672156e-06, "epoch": 0.4557974483904582, "percentage": 45.58, "elapsed_time": "6:08:32", "remaining_time": "7:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2024, "total_steps": 4438, "loss": 0.1602, "learning_rate": 3.0651201764593375e-06, "epoch": 0.45602275607626663, "percentage": 45.61, "elapsed_time": "6:08:43", "remaining_time": "7:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2025, "total_steps": 4438, "loss": 0.1525, "learning_rate": 3.06330533986129e-06, "epoch": 0.4562480637620751, "percentage": 45.63, "elapsed_time": "6:08:53", "remaining_time": "7:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2026, "total_steps": 4438, "loss": 0.1497, "learning_rate": 3.0614901904807836e-06, "epoch": 0.4564733714478835, "percentage": 45.65, "elapsed_time": "6:09:04", "remaining_time": "7:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2027, "total_steps": 4438, "loss": 0.1463, "learning_rate": 3.0596747293257047e-06, "epoch": 0.45669867913369194, "percentage": 45.67, "elapsed_time": "6:09:15", "remaining_time": "7:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2028, "total_steps": 4438, "loss": 0.1422, "learning_rate": 3.0578589574041097e-06, "epoch": 0.45692398681950036, "percentage": 45.7, "elapsed_time": "6:09:25", "remaining_time": "7:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2029, "total_steps": 4438, "loss": 0.1661, "learning_rate": 3.056042875724228e-06, "epoch": 0.45714929450530883, "percentage": 45.72, "elapsed_time": "6:09:36", "remaining_time": "7:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 4438, "loss": 0.1418, "learning_rate": 3.0542264852944635e-06, "epoch": 0.45737460219111725, "percentage": 45.74, "elapsed_time": "6:09:47", "remaining_time": "7:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2031, "total_steps": 4438, "loss": 0.1548, "learning_rate": 3.052409787123391e-06, "epoch": 0.45759990987692567, "percentage": 45.76, "elapsed_time": "6:09:56", "remaining_time": "7:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2032, "total_steps": 4438, "loss": 0.1459, "learning_rate": 3.0505927822197533e-06, "epoch": 0.4578252175627341, "percentage": 45.79, "elapsed_time": "6:10:06", "remaining_time": "7:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2033, "total_steps": 4438, "loss": 0.1376, "learning_rate": 3.0487754715924674e-06, "epoch": 0.45805052524854256, "percentage": 45.81, "elapsed_time": "6:10:17", "remaining_time": "7:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2034, "total_steps": 4438, "loss": 0.1524, "learning_rate": 3.0469578562506165e-06, "epoch": 0.458275832934351, "percentage": 45.83, "elapsed_time": "6:10:28", "remaining_time": "7:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2035, "total_steps": 4438, "loss": 0.1518, "learning_rate": 3.045139937203455e-06, "epoch": 0.4585011406201594, "percentage": 45.85, "elapsed_time": "6:10:38", "remaining_time": "7:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2036, "total_steps": 4438, "loss": 0.1668, "learning_rate": 3.0433217154604067e-06, "epoch": 0.4587264483059678, "percentage": 45.88, "elapsed_time": "6:10:49", "remaining_time": "7:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2037, "total_steps": 4438, "loss": 0.1534, "learning_rate": 3.0415031920310613e-06, "epoch": 0.4589517559917763, "percentage": 45.9, "elapsed_time": "6:10:59", "remaining_time": "7:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2038, "total_steps": 4438, "loss": 0.1497, "learning_rate": 3.0396843679251777e-06, "epoch": 0.4591770636775847, "percentage": 45.92, "elapsed_time": "6:11:10", "remaining_time": "7:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2039, "total_steps": 4438, "loss": 0.1457, "learning_rate": 3.03786524415268e-06, "epoch": 0.4594023713633931, "percentage": 45.94, "elapsed_time": "6:11:20", "remaining_time": "7:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 4438, "loss": 0.1513, "learning_rate": 3.0360458217236604e-06, "epoch": 0.45962767904920154, "percentage": 45.97, "elapsed_time": "6:11:31", "remaining_time": "7:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2041, "total_steps": 4438, "loss": 0.1505, "learning_rate": 3.034226101648377e-06, "epoch": 0.45985298673501, "percentage": 45.99, "elapsed_time": "6:11:41", "remaining_time": "7:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2042, "total_steps": 4438, "loss": 0.1444, "learning_rate": 3.0324060849372526e-06, "epoch": 0.46007829442081843, "percentage": 46.01, "elapsed_time": "6:11:52", "remaining_time": "7:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2043, "total_steps": 4438, "loss": 0.1449, "learning_rate": 3.0305857726008736e-06, "epoch": 0.46030360210662685, "percentage": 46.03, "elapsed_time": "6:12:03", "remaining_time": "7:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2044, "total_steps": 4438, "loss": 0.1479, "learning_rate": 3.028765165649992e-06, "epoch": 0.46052890979243527, "percentage": 46.06, "elapsed_time": "6:12:13", "remaining_time": "7:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2045, "total_steps": 4438, "loss": 0.1411, "learning_rate": 3.026944265095524e-06, "epoch": 0.46075421747824374, "percentage": 46.08, "elapsed_time": "6:12:24", "remaining_time": "7:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2046, "total_steps": 4438, "loss": 0.151, "learning_rate": 3.0251230719485465e-06, "epoch": 0.46097952516405216, "percentage": 46.1, "elapsed_time": "6:12:35", "remaining_time": "7:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2047, "total_steps": 4438, "loss": 0.1543, "learning_rate": 3.0233015872203004e-06, "epoch": 0.4612048328498606, "percentage": 46.12, "elapsed_time": "6:12:46", "remaining_time": "7:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2048, "total_steps": 4438, "loss": 0.151, "learning_rate": 3.0214798119221884e-06, "epoch": 0.461430140535669, "percentage": 46.15, "elapsed_time": "6:12:56", "remaining_time": "7:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2049, "total_steps": 4438, "loss": 0.145, "learning_rate": 3.0196577470657744e-06, "epoch": 0.46165544822147747, "percentage": 46.17, "elapsed_time": "6:13:07", "remaining_time": "7:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 4438, "loss": 0.1546, "learning_rate": 3.0178353936627835e-06, "epoch": 0.4618807559072859, "percentage": 46.19, "elapsed_time": "6:13:18", "remaining_time": "7:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2051, "total_steps": 4438, "loss": 0.1515, "learning_rate": 3.0160127527250993e-06, "epoch": 0.4621060635930943, "percentage": 46.21, "elapsed_time": "6:13:28", "remaining_time": "7:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2052, "total_steps": 4438, "loss": 0.1474, "learning_rate": 3.0141898252647682e-06, "epoch": 0.4623313712789027, "percentage": 46.24, "elapsed_time": "6:13:37", "remaining_time": "7:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2053, "total_steps": 4438, "loss": 0.1565, "learning_rate": 3.012366612293993e-06, "epoch": 0.4625566789647112, "percentage": 46.26, "elapsed_time": "6:13:49", "remaining_time": "7:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2054, "total_steps": 4438, "loss": 0.1632, "learning_rate": 3.0105431148251364e-06, "epoch": 0.4627819866505196, "percentage": 46.28, "elapsed_time": "6:14:00", "remaining_time": "7:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2055, "total_steps": 4438, "loss": 0.1409, "learning_rate": 3.0087193338707175e-06, "epoch": 0.46300729433632803, "percentage": 46.3, "elapsed_time": "6:14:10", "remaining_time": "7:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2056, "total_steps": 4438, "loss": 0.1613, "learning_rate": 3.0068952704434145e-06, "epoch": 0.46323260202213645, "percentage": 46.33, "elapsed_time": "6:14:22", "remaining_time": "7:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2057, "total_steps": 4438, "loss": 0.1504, "learning_rate": 3.0050709255560616e-06, "epoch": 0.4634579097079449, "percentage": 46.35, "elapsed_time": "6:14:32", "remaining_time": "7:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2058, "total_steps": 4438, "loss": 0.1541, "learning_rate": 3.0032463002216504e-06, "epoch": 0.46368321739375334, "percentage": 46.37, "elapsed_time": "6:14:43", "remaining_time": "7:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2059, "total_steps": 4438, "loss": 0.1507, "learning_rate": 3.0014213954533265e-06, "epoch": 0.46390852507956176, "percentage": 46.39, "elapsed_time": "6:14:54", "remaining_time": "7:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 4438, "loss": 0.1499, "learning_rate": 2.999596212264392e-06, "epoch": 0.46413383276537024, "percentage": 46.42, "elapsed_time": "6:15:05", "remaining_time": "7:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2061, "total_steps": 4438, "loss": 0.142, "learning_rate": 2.997770751668302e-06, "epoch": 0.46435914045117865, "percentage": 46.44, "elapsed_time": "6:15:16", "remaining_time": "7:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2062, "total_steps": 4438, "loss": 0.1604, "learning_rate": 2.9959450146786674e-06, "epoch": 0.46458444813698707, "percentage": 46.46, "elapsed_time": "6:15:27", "remaining_time": "7:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2063, "total_steps": 4438, "loss": 0.1662, "learning_rate": 2.994119002309253e-06, "epoch": 0.4648097558227955, "percentage": 46.48, "elapsed_time": "6:15:38", "remaining_time": "7:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2064, "total_steps": 4438, "loss": 0.1575, "learning_rate": 2.9922927155739737e-06, "epoch": 0.46503506350860396, "percentage": 46.51, "elapsed_time": "6:15:47", "remaining_time": "7:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2065, "total_steps": 4438, "loss": 0.1355, "learning_rate": 2.9904661554868997e-06, "epoch": 0.4652603711944124, "percentage": 46.53, "elapsed_time": "6:15:57", "remaining_time": "7:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2066, "total_steps": 4438, "loss": 0.1423, "learning_rate": 2.9886393230622507e-06, "epoch": 0.4654856788802208, "percentage": 46.55, "elapsed_time": "6:16:08", "remaining_time": "7:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2067, "total_steps": 4438, "loss": 0.1575, "learning_rate": 2.986812219314399e-06, "epoch": 0.4657109865660292, "percentage": 46.58, "elapsed_time": "6:16:19", "remaining_time": "7:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2068, "total_steps": 4438, "loss": 0.1625, "learning_rate": 2.984984845257868e-06, "epoch": 0.4659362942518377, "percentage": 46.6, "elapsed_time": "6:16:31", "remaining_time": "7:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2069, "total_steps": 4438, "loss": 0.1654, "learning_rate": 2.983157201907329e-06, "epoch": 0.4661616019376461, "percentage": 46.62, "elapsed_time": "6:16:41", "remaining_time": "7:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 4438, "loss": 0.1434, "learning_rate": 2.981329290277605e-06, "epoch": 0.4663869096234545, "percentage": 46.64, "elapsed_time": "6:16:51", "remaining_time": "7:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2071, "total_steps": 4438, "loss": 0.1516, "learning_rate": 2.9795011113836686e-06, "epoch": 0.46661221730926294, "percentage": 46.67, "elapsed_time": "6:17:01", "remaining_time": "7:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2072, "total_steps": 4438, "loss": 0.1627, "learning_rate": 2.977672666240636e-06, "epoch": 0.4668375249950714, "percentage": 46.69, "elapsed_time": "6:17:12", "remaining_time": "7:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2073, "total_steps": 4438, "loss": 0.1534, "learning_rate": 2.9758439558637774e-06, "epoch": 0.46706283268087984, "percentage": 46.71, "elapsed_time": "6:17:22", "remaining_time": "7:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2074, "total_steps": 4438, "loss": 0.1558, "learning_rate": 2.974014981268507e-06, "epoch": 0.46728814036668825, "percentage": 46.73, "elapsed_time": "6:17:32", "remaining_time": "7:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2075, "total_steps": 4438, "loss": 0.1572, "learning_rate": 2.972185743470386e-06, "epoch": 0.46751344805249667, "percentage": 46.76, "elapsed_time": "6:17:43", "remaining_time": "7:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2076, "total_steps": 4438, "loss": 0.1454, "learning_rate": 2.9703562434851218e-06, "epoch": 0.46773875573830515, "percentage": 46.78, "elapsed_time": "6:17:54", "remaining_time": "7:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2077, "total_steps": 4438, "loss": 0.1385, "learning_rate": 2.9685264823285676e-06, "epoch": 0.46796406342411356, "percentage": 46.8, "elapsed_time": "6:18:04", "remaining_time": "7:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2078, "total_steps": 4438, "loss": 0.1519, "learning_rate": 2.966696461016721e-06, "epoch": 0.468189371109922, "percentage": 46.82, "elapsed_time": "6:18:14", "remaining_time": "7:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2079, "total_steps": 4438, "loss": 0.1391, "learning_rate": 2.964866180565725e-06, "epoch": 0.4684146787957304, "percentage": 46.85, "elapsed_time": "6:18:24", "remaining_time": "7:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 4438, "loss": 0.1572, "learning_rate": 2.9630356419918682e-06, "epoch": 0.4686399864815389, "percentage": 46.87, "elapsed_time": "6:18:34", "remaining_time": "7:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2081, "total_steps": 4438, "loss": 0.1439, "learning_rate": 2.9612048463115774e-06, "epoch": 0.4688652941673473, "percentage": 46.89, "elapsed_time": "6:18:45", "remaining_time": "7:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2082, "total_steps": 4438, "loss": 0.1588, "learning_rate": 2.9593737945414264e-06, "epoch": 0.4690906018531557, "percentage": 46.91, "elapsed_time": "6:18:57", "remaining_time": "7:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2083, "total_steps": 4438, "loss": 0.1505, "learning_rate": 2.9575424876981298e-06, "epoch": 0.4693159095389641, "percentage": 46.94, "elapsed_time": "6:19:08", "remaining_time": "7:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2084, "total_steps": 4438, "loss": 0.1369, "learning_rate": 2.9557109267985445e-06, "epoch": 0.4695412172247726, "percentage": 46.96, "elapsed_time": "6:19:18", "remaining_time": "7:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2085, "total_steps": 4438, "loss": 0.1444, "learning_rate": 2.953879112859668e-06, "epoch": 0.469766524910581, "percentage": 46.98, "elapsed_time": "6:19:27", "remaining_time": "7:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2086, "total_steps": 4438, "loss": 0.1682, "learning_rate": 2.952047046898637e-06, "epoch": 0.46999183259638944, "percentage": 47.0, "elapsed_time": "6:19:38", "remaining_time": "7:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2087, "total_steps": 4438, "loss": 0.167, "learning_rate": 2.9502147299327316e-06, "epoch": 0.47021714028219785, "percentage": 47.03, "elapsed_time": "6:19:48", "remaining_time": "7:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2088, "total_steps": 4438, "loss": 0.1597, "learning_rate": 2.9483821629793673e-06, "epoch": 0.4704424479680063, "percentage": 47.05, "elapsed_time": "6:19:59", "remaining_time": "7:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2089, "total_steps": 4438, "loss": 0.1571, "learning_rate": 2.946549347056101e-06, "epoch": 0.47066775565381475, "percentage": 47.07, "elapsed_time": "6:20:09", "remaining_time": "7:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 4438, "loss": 0.1491, "learning_rate": 2.9447162831806275e-06, "epoch": 0.47089306333962316, "percentage": 47.09, "elapsed_time": "6:20:20", "remaining_time": "7:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2091, "total_steps": 4438, "loss": 0.1315, "learning_rate": 2.942882972370778e-06, "epoch": 0.4711183710254316, "percentage": 47.12, "elapsed_time": "6:20:29", "remaining_time": "7:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2092, "total_steps": 4438, "loss": 0.1516, "learning_rate": 2.941049415644522e-06, "epoch": 0.47134367871124006, "percentage": 47.14, "elapsed_time": "6:20:40", "remaining_time": "7:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2093, "total_steps": 4438, "loss": 0.155, "learning_rate": 2.9392156140199644e-06, "epoch": 0.4715689863970485, "percentage": 47.16, "elapsed_time": "6:20:50", "remaining_time": "7:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2094, "total_steps": 4438, "loss": 0.1569, "learning_rate": 2.9373815685153485e-06, "epoch": 0.4717942940828569, "percentage": 47.18, "elapsed_time": "6:21:01", "remaining_time": "7:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2095, "total_steps": 4438, "loss": 0.1591, "learning_rate": 2.93554728014905e-06, "epoch": 0.4720196017686653, "percentage": 47.21, "elapsed_time": "6:21:12", "remaining_time": "7:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2096, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.933712749939582e-06, "epoch": 0.4722449094544738, "percentage": 47.23, "elapsed_time": "6:21:22", "remaining_time": "7:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2097, "total_steps": 4438, "loss": 0.1389, "learning_rate": 2.9318779789055894e-06, "epoch": 0.4724702171402822, "percentage": 47.25, "elapsed_time": "6:21:32", "remaining_time": "7:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2098, "total_steps": 4438, "loss": 0.1421, "learning_rate": 2.9300429680658538e-06, "epoch": 0.4726955248260906, "percentage": 47.27, "elapsed_time": "6:21:41", "remaining_time": "7:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2099, "total_steps": 4438, "loss": 0.1445, "learning_rate": 2.928207718439287e-06, "epoch": 0.47292083251189904, "percentage": 47.3, "elapsed_time": "6:21:53", "remaining_time": "7:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 4438, "loss": 0.1498, "learning_rate": 2.9263722310449353e-06, "epoch": 0.4731461401977075, "percentage": 47.32, "elapsed_time": "6:22:03", "remaining_time": "7:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2101, "total_steps": 4438, "loss": 0.1473, "learning_rate": 2.924536506901976e-06, "epoch": 0.47337144788351593, "percentage": 47.34, "elapsed_time": "6:22:13", "remaining_time": "7:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2102, "total_steps": 4438, "loss": 0.1598, "learning_rate": 2.9227005470297194e-06, "epoch": 0.47359675556932435, "percentage": 47.36, "elapsed_time": "6:22:25", "remaining_time": "7:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2103, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.9208643524476037e-06, "epoch": 0.47382206325513276, "percentage": 47.39, "elapsed_time": "6:22:36", "remaining_time": "7:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2104, "total_steps": 4438, "loss": 0.1439, "learning_rate": 2.919027924175201e-06, "epoch": 0.47404737094094124, "percentage": 47.41, "elapsed_time": "6:22:47", "remaining_time": "7:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2105, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.9171912632322102e-06, "epoch": 0.47427267862674966, "percentage": 47.43, "elapsed_time": "6:22:59", "remaining_time": "7:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2106, "total_steps": 4438, "loss": 0.1559, "learning_rate": 2.915354370638462e-06, "epoch": 0.4744979863125581, "percentage": 47.45, "elapsed_time": "6:23:08", "remaining_time": "7:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2107, "total_steps": 4438, "loss": 0.1451, "learning_rate": 2.913517247413914e-06, "epoch": 0.47472329399836655, "percentage": 47.48, "elapsed_time": "6:23:20", "remaining_time": "7:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2108, "total_steps": 4438, "loss": 0.1512, "learning_rate": 2.9116798945786515e-06, "epoch": 0.47494860168417496, "percentage": 47.5, "elapsed_time": "6:23:31", "remaining_time": "7:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2109, "total_steps": 4438, "loss": 0.1489, "learning_rate": 2.909842313152888e-06, "epoch": 0.4751739093699834, "percentage": 47.52, "elapsed_time": "6:23:41", "remaining_time": "7:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 4438, "loss": 0.1715, "learning_rate": 2.9080045041569647e-06, "epoch": 0.4753992170557918, "percentage": 47.54, "elapsed_time": "6:23:52", "remaining_time": "7:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2111, "total_steps": 4438, "loss": 0.152, "learning_rate": 2.9061664686113487e-06, "epoch": 0.4756245247416003, "percentage": 47.57, "elapsed_time": "6:24:04", "remaining_time": "7:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2112, "total_steps": 4438, "loss": 0.1546, "learning_rate": 2.904328207536632e-06, "epoch": 0.4758498324274087, "percentage": 47.59, "elapsed_time": "6:24:16", "remaining_time": "7:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2113, "total_steps": 4438, "loss": 0.1599, "learning_rate": 2.9024897219535326e-06, "epoch": 0.4760751401132171, "percentage": 47.61, "elapsed_time": "6:24:28", "remaining_time": "7:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2114, "total_steps": 4438, "loss": 0.1471, "learning_rate": 2.900651012882893e-06, "epoch": 0.47630044779902553, "percentage": 47.63, "elapsed_time": "6:24:38", "remaining_time": "7:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2115, "total_steps": 4438, "loss": 0.1581, "learning_rate": 2.8988120813456794e-06, "epoch": 0.476525755484834, "percentage": 47.66, "elapsed_time": "6:24:48", "remaining_time": "7:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2116, "total_steps": 4438, "loss": 0.1513, "learning_rate": 2.896972928362983e-06, "epoch": 0.4767510631706424, "percentage": 47.68, "elapsed_time": "6:25:00", "remaining_time": "7:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2117, "total_steps": 4438, "loss": 0.1667, "learning_rate": 2.8951335549560156e-06, "epoch": 0.47697637085645084, "percentage": 47.7, "elapsed_time": "6:25:10", "remaining_time": "7:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2118, "total_steps": 4438, "loss": 0.1478, "learning_rate": 2.893293962146114e-06, "epoch": 0.47720167854225926, "percentage": 47.72, "elapsed_time": "6:25:19", "remaining_time": "7:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2119, "total_steps": 4438, "loss": 0.1457, "learning_rate": 2.8914541509547345e-06, "epoch": 0.47742698622806773, "percentage": 47.75, "elapsed_time": "6:25:30", "remaining_time": "7:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 4438, "loss": 0.1439, "learning_rate": 2.8896141224034554e-06, "epoch": 0.47765229391387615, "percentage": 47.77, "elapsed_time": "6:25:40", "remaining_time": "7:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2121, "total_steps": 4438, "loss": 0.1422, "learning_rate": 2.8877738775139767e-06, "epoch": 0.47787760159968456, "percentage": 47.79, "elapsed_time": "6:25:53", "remaining_time": "7:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2122, "total_steps": 4438, "loss": 0.1361, "learning_rate": 2.885933417308118e-06, "epoch": 0.478102909285493, "percentage": 47.81, "elapsed_time": "6:26:04", "remaining_time": "7:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2123, "total_steps": 4438, "loss": 0.1494, "learning_rate": 2.8840927428078185e-06, "epoch": 0.47832821697130146, "percentage": 47.84, "elapsed_time": "6:26:14", "remaining_time": "7:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2124, "total_steps": 4438, "loss": 0.1722, "learning_rate": 2.8822518550351356e-06, "epoch": 0.4785535246571099, "percentage": 47.86, "elapsed_time": "6:26:23", "remaining_time": "7:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2125, "total_steps": 4438, "loss": 0.1594, "learning_rate": 2.8804107550122453e-06, "epoch": 0.4787788323429183, "percentage": 47.88, "elapsed_time": "6:26:35", "remaining_time": "7:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2126, "total_steps": 4438, "loss": 0.1515, "learning_rate": 2.878569443761442e-06, "epoch": 0.4790041400287267, "percentage": 47.9, "elapsed_time": "6:26:45", "remaining_time": "7:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2127, "total_steps": 4438, "loss": 0.1478, "learning_rate": 2.8767279223051375e-06, "epoch": 0.4792294477145352, "percentage": 47.93, "elapsed_time": "6:26:55", "remaining_time": "7:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2128, "total_steps": 4438, "loss": 0.149, "learning_rate": 2.87488619166586e-06, "epoch": 0.4794547554003436, "percentage": 47.95, "elapsed_time": "6:27:05", "remaining_time": "7:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2129, "total_steps": 4438, "loss": 0.1533, "learning_rate": 2.8730442528662537e-06, "epoch": 0.479680063086152, "percentage": 47.97, "elapsed_time": "6:27:14", "remaining_time": "6:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.8712021069290786e-06, "epoch": 0.47990537077196044, "percentage": 47.99, "elapsed_time": "6:27:24", "remaining_time": "6:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2131, "total_steps": 4438, "loss": 0.1528, "learning_rate": 2.869359754877209e-06, "epoch": 0.4801306784577689, "percentage": 48.02, "elapsed_time": "6:27:35", "remaining_time": "6:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2132, "total_steps": 4438, "loss": 0.1401, "learning_rate": 2.8675171977336357e-06, "epoch": 0.48035598614357733, "percentage": 48.04, "elapsed_time": "6:27:46", "remaining_time": "6:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2133, "total_steps": 4438, "loss": 0.1502, "learning_rate": 2.8656744365214622e-06, "epoch": 0.48058129382938575, "percentage": 48.06, "elapsed_time": "6:27:56", "remaining_time": "6:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2134, "total_steps": 4438, "loss": 0.1534, "learning_rate": 2.863831472263904e-06, "epoch": 0.48080660151519417, "percentage": 48.08, "elapsed_time": "6:28:08", "remaining_time": "6:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2135, "total_steps": 4438, "loss": 0.143, "learning_rate": 2.8619883059842897e-06, "epoch": 0.48103190920100264, "percentage": 48.11, "elapsed_time": "6:28:18", "remaining_time": "6:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2136, "total_steps": 4438, "loss": 0.1552, "learning_rate": 2.8601449387060622e-06, "epoch": 0.48125721688681106, "percentage": 48.13, "elapsed_time": "6:28:29", "remaining_time": "6:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2137, "total_steps": 4438, "loss": 0.1377, "learning_rate": 2.858301371452774e-06, "epoch": 0.4814825245726195, "percentage": 48.15, "elapsed_time": "6:28:39", "remaining_time": "6:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2138, "total_steps": 4438, "loss": 0.1622, "learning_rate": 2.8564576052480895e-06, "epoch": 0.4817078322584279, "percentage": 48.17, "elapsed_time": "6:28:50", "remaining_time": "6:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2139, "total_steps": 4438, "loss": 0.1557, "learning_rate": 2.8546136411157843e-06, "epoch": 0.48193313994423637, "percentage": 48.2, "elapsed_time": "6:29:01", "remaining_time": "6:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 4438, "loss": 0.1588, "learning_rate": 2.8527694800797417e-06, "epoch": 0.4821584476300448, "percentage": 48.22, "elapsed_time": "6:29:12", "remaining_time": "6:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2141, "total_steps": 4438, "loss": 0.158, "learning_rate": 2.850925123163956e-06, "epoch": 0.4823837553158532, "percentage": 48.24, "elapsed_time": "6:29:22", "remaining_time": "6:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2142, "total_steps": 4438, "loss": 0.1375, "learning_rate": 2.8490805713925298e-06, "epoch": 0.4826090630016616, "percentage": 48.26, "elapsed_time": "6:29:33", "remaining_time": "6:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2143, "total_steps": 4438, "loss": 0.1544, "learning_rate": 2.847235825789673e-06, "epoch": 0.4828343706874701, "percentage": 48.29, "elapsed_time": "6:29:44", "remaining_time": "6:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2144, "total_steps": 4438, "loss": 0.1599, "learning_rate": 2.845390887379706e-06, "epoch": 0.4830596783732785, "percentage": 48.31, "elapsed_time": "6:29:53", "remaining_time": "6:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2145, "total_steps": 4438, "loss": 0.1678, "learning_rate": 2.8435457571870527e-06, "epoch": 0.48328498605908693, "percentage": 48.33, "elapsed_time": "6:30:04", "remaining_time": "6:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2146, "total_steps": 4438, "loss": 0.1302, "learning_rate": 2.8417004362362465e-06, "epoch": 0.48351029374489535, "percentage": 48.36, "elapsed_time": "6:30:13", "remaining_time": "6:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2147, "total_steps": 4438, "loss": 0.1554, "learning_rate": 2.8398549255519237e-06, "epoch": 0.4837356014307038, "percentage": 48.38, "elapsed_time": "6:30:23", "remaining_time": "6:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2148, "total_steps": 4438, "loss": 0.1612, "learning_rate": 2.838009226158829e-06, "epoch": 0.48396090911651224, "percentage": 48.4, "elapsed_time": "6:30:34", "remaining_time": "6:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2149, "total_steps": 4438, "loss": 0.1695, "learning_rate": 2.83616333908181e-06, "epoch": 0.48418621680232066, "percentage": 48.42, "elapsed_time": "6:30:45", "remaining_time": "6:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 4438, "loss": 0.1571, "learning_rate": 2.8343172653458194e-06, "epoch": 0.4844115244881291, "percentage": 48.45, "elapsed_time": "6:30:56", "remaining_time": "6:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2151, "total_steps": 4438, "loss": 0.1577, "learning_rate": 2.8324710059759126e-06, "epoch": 0.48463683217393755, "percentage": 48.47, "elapsed_time": "6:31:07", "remaining_time": "6:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2152, "total_steps": 4438, "loss": 0.1405, "learning_rate": 2.8306245619972476e-06, "epoch": 0.48486213985974597, "percentage": 48.49, "elapsed_time": "6:31:18", "remaining_time": "6:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2153, "total_steps": 4438, "loss": 0.1622, "learning_rate": 2.828777934435088e-06, "epoch": 0.4850874475455544, "percentage": 48.51, "elapsed_time": "6:31:29", "remaining_time": "6:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2154, "total_steps": 4438, "loss": 0.1644, "learning_rate": 2.826931124314796e-06, "epoch": 0.4853127552313628, "percentage": 48.54, "elapsed_time": "6:31:40", "remaining_time": "6:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2155, "total_steps": 4438, "loss": 0.1514, "learning_rate": 2.8250841326618367e-06, "epoch": 0.4855380629171713, "percentage": 48.56, "elapsed_time": "6:31:51", "remaining_time": "6:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2156, "total_steps": 4438, "loss": 0.1539, "learning_rate": 2.8232369605017757e-06, "epoch": 0.4857633706029797, "percentage": 48.58, "elapsed_time": "6:32:03", "remaining_time": "6:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2157, "total_steps": 4438, "loss": 0.1462, "learning_rate": 2.8213896088602786e-06, "epoch": 0.4859886782887881, "percentage": 48.6, "elapsed_time": "6:32:13", "remaining_time": "6:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2158, "total_steps": 4438, "loss": 0.1708, "learning_rate": 2.8195420787631113e-06, "epoch": 0.4862139859745966, "percentage": 48.63, "elapsed_time": "6:32:23", "remaining_time": "6:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2159, "total_steps": 4438, "loss": 0.1563, "learning_rate": 2.8176943712361394e-06, "epoch": 0.486439293660405, "percentage": 48.65, "elapsed_time": "6:32:33", "remaining_time": "6:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 4438, "loss": 0.1471, "learning_rate": 2.8158464873053236e-06, "epoch": 0.4866646013462134, "percentage": 48.67, "elapsed_time": "6:32:45", "remaining_time": "6:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2161, "total_steps": 4438, "loss": 0.1575, "learning_rate": 2.8139984279967265e-06, "epoch": 0.48688990903202184, "percentage": 48.69, "elapsed_time": "6:32:57", "remaining_time": "6:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2162, "total_steps": 4438, "loss": 0.1368, "learning_rate": 2.8121501943365066e-06, "epoch": 0.4871152167178303, "percentage": 48.72, "elapsed_time": "6:33:06", "remaining_time": "6:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2163, "total_steps": 4438, "loss": 0.1471, "learning_rate": 2.810301787350918e-06, "epoch": 0.48734052440363873, "percentage": 48.74, "elapsed_time": "6:33:17", "remaining_time": "6:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2164, "total_steps": 4438, "loss": 0.1432, "learning_rate": 2.808453208066314e-06, "epoch": 0.48756583208944715, "percentage": 48.76, "elapsed_time": "6:33:28", "remaining_time": "6:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2165, "total_steps": 4438, "loss": 0.1465, "learning_rate": 2.8066044575091404e-06, "epoch": 0.48779113977525557, "percentage": 48.78, "elapsed_time": "6:33:38", "remaining_time": "6:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2166, "total_steps": 4438, "loss": 0.1678, "learning_rate": 2.8047555367059404e-06, "epoch": 0.48801644746106404, "percentage": 48.81, "elapsed_time": "6:33:48", "remaining_time": "6:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2167, "total_steps": 4438, "loss": 0.1403, "learning_rate": 2.80290644668335e-06, "epoch": 0.48824175514687246, "percentage": 48.83, "elapsed_time": "6:33:58", "remaining_time": "6:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2168, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.8010571884681004e-06, "epoch": 0.4884670628326809, "percentage": 48.85, "elapsed_time": "6:34:08", "remaining_time": "6:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2169, "total_steps": 4438, "loss": 0.1439, "learning_rate": 2.799207763087015e-06, "epoch": 0.4886923705184893, "percentage": 48.87, "elapsed_time": "6:34:19", "remaining_time": "6:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 4438, "loss": 0.147, "learning_rate": 2.7973581715670124e-06, "epoch": 0.48891767820429777, "percentage": 48.9, "elapsed_time": "6:34:31", "remaining_time": "6:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2171, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.7955084149351002e-06, "epoch": 0.4891429858901062, "percentage": 48.92, "elapsed_time": "6:34:43", "remaining_time": "6:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2172, "total_steps": 4438, "loss": 0.1519, "learning_rate": 2.7936584942183804e-06, "epoch": 0.4893682935759146, "percentage": 48.94, "elapsed_time": "6:34:54", "remaining_time": "6:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2173, "total_steps": 4438, "loss": 0.1496, "learning_rate": 2.7918084104440446e-06, "epoch": 0.489593601261723, "percentage": 48.96, "elapsed_time": "6:35:05", "remaining_time": "6:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2174, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.7899581646393746e-06, "epoch": 0.4898189089475315, "percentage": 48.99, "elapsed_time": "6:35:15", "remaining_time": "6:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2175, "total_steps": 4438, "loss": 0.1502, "learning_rate": 2.7881077578317445e-06, "epoch": 0.4900442166333399, "percentage": 49.01, "elapsed_time": "6:35:26", "remaining_time": "6:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2176, "total_steps": 4438, "loss": 0.1501, "learning_rate": 2.7862571910486148e-06, "epoch": 0.49026952431914833, "percentage": 49.03, "elapsed_time": "6:35:36", "remaining_time": "6:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2177, "total_steps": 4438, "loss": 0.1565, "learning_rate": 2.784406465317538e-06, "epoch": 0.49049483200495675, "percentage": 49.05, "elapsed_time": "6:35:48", "remaining_time": "6:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2178, "total_steps": 4438, "loss": 0.165, "learning_rate": 2.7825555816661503e-06, "epoch": 0.4907201396907652, "percentage": 49.08, "elapsed_time": "6:35:58", "remaining_time": "6:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2179, "total_steps": 4438, "loss": 0.1509, "learning_rate": 2.7807045411221813e-06, "epoch": 0.49094544737657364, "percentage": 49.1, "elapsed_time": "6:36:09", "remaining_time": "6:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 4438, "loss": 0.1444, "learning_rate": 2.778853344713443e-06, "epoch": 0.49117075506238206, "percentage": 49.12, "elapsed_time": "6:36:19", "remaining_time": "6:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2181, "total_steps": 4438, "loss": 0.1457, "learning_rate": 2.777001993467837e-06, "epoch": 0.4913960627481905, "percentage": 49.14, "elapsed_time": "6:36:30", "remaining_time": "6:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2182, "total_steps": 4438, "loss": 0.1429, "learning_rate": 2.7751504884133484e-06, "epoch": 0.49162137043399895, "percentage": 49.17, "elapsed_time": "6:36:43", "remaining_time": "6:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2183, "total_steps": 4438, "loss": 0.155, "learning_rate": 2.7732988305780496e-06, "epoch": 0.49184667811980737, "percentage": 49.19, "elapsed_time": "6:36:54", "remaining_time": "6:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2184, "total_steps": 4438, "loss": 0.1472, "learning_rate": 2.7714470209900974e-06, "epoch": 0.4920719858056158, "percentage": 49.21, "elapsed_time": "6:37:03", "remaining_time": "6:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2185, "total_steps": 4438, "loss": 0.1431, "learning_rate": 2.769595060677732e-06, "epoch": 0.4922972934914242, "percentage": 49.23, "elapsed_time": "6:37:15", "remaining_time": "6:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2186, "total_steps": 4438, "loss": 0.1443, "learning_rate": 2.7677429506692788e-06, "epoch": 0.4925226011772327, "percentage": 49.26, "elapsed_time": "6:37:26", "remaining_time": "6:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2187, "total_steps": 4438, "loss": 0.1476, "learning_rate": 2.7658906919931443e-06, "epoch": 0.4927479088630411, "percentage": 49.28, "elapsed_time": "6:37:36", "remaining_time": "6:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2188, "total_steps": 4438, "loss": 0.1494, "learning_rate": 2.76403828567782e-06, "epoch": 0.4929732165488495, "percentage": 49.3, "elapsed_time": "6:37:47", "remaining_time": "6:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2189, "total_steps": 4438, "loss": 0.1571, "learning_rate": 2.7621857327518763e-06, "epoch": 0.49319852423465793, "percentage": 49.32, "elapsed_time": "6:37:58", "remaining_time": "6:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 4438, "loss": 0.1583, "learning_rate": 2.7603330342439686e-06, "epoch": 0.4934238319204664, "percentage": 49.35, "elapsed_time": "6:38:09", "remaining_time": "6:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2191, "total_steps": 4438, "loss": 0.1527, "learning_rate": 2.7584801911828314e-06, "epoch": 0.4936491396062748, "percentage": 49.37, "elapsed_time": "6:38:20", "remaining_time": "6:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2192, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.7566272045972777e-06, "epoch": 0.49387444729208324, "percentage": 49.39, "elapsed_time": "6:38:30", "remaining_time": "6:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2193, "total_steps": 4438, "loss": 0.137, "learning_rate": 2.7547740755162034e-06, "epoch": 0.49409975497789166, "percentage": 49.41, "elapsed_time": "6:38:41", "remaining_time": "6:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2194, "total_steps": 4438, "loss": 0.1455, "learning_rate": 2.752920804968581e-06, "epoch": 0.49432506266370013, "percentage": 49.44, "elapsed_time": "6:38:51", "remaining_time": "6:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2195, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.7510673939834633e-06, "epoch": 0.49455037034950855, "percentage": 49.46, "elapsed_time": "6:39:03", "remaining_time": "6:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2196, "total_steps": 4438, "loss": 0.1428, "learning_rate": 2.7492138435899794e-06, "epoch": 0.49477567803531697, "percentage": 49.48, "elapsed_time": "6:39:13", "remaining_time": "6:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2197, "total_steps": 4438, "loss": 0.1484, "learning_rate": 2.747360154817338e-06, "epoch": 0.4950009857211254, "percentage": 49.5, "elapsed_time": "6:39:24", "remaining_time": "6:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2198, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.745506328694822e-06, "epoch": 0.49522629340693386, "percentage": 49.53, "elapsed_time": "6:39:33", "remaining_time": "6:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2199, "total_steps": 4438, "loss": 0.1469, "learning_rate": 2.743652366251793e-06, "epoch": 0.4954516010927423, "percentage": 49.55, "elapsed_time": "6:39:43", "remaining_time": "6:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 4438, "loss": 0.1415, "learning_rate": 2.741798268517687e-06, "epoch": 0.4956769087785507, "percentage": 49.57, "elapsed_time": "6:39:54", "remaining_time": "6:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2201, "total_steps": 4438, "loss": 0.1558, "learning_rate": 2.7399440365220153e-06, "epoch": 0.4959022164643591, "percentage": 49.59, "elapsed_time": "6:40:05", "remaining_time": "6:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2202, "total_steps": 4438, "loss": 0.1576, "learning_rate": 2.738089671294364e-06, "epoch": 0.4961275241501676, "percentage": 49.62, "elapsed_time": "6:40:15", "remaining_time": "6:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2203, "total_steps": 4438, "loss": 0.1685, "learning_rate": 2.7362351738643926e-06, "epoch": 0.496352831835976, "percentage": 49.64, "elapsed_time": "6:40:27", "remaining_time": "6:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2204, "total_steps": 4438, "loss": 0.1396, "learning_rate": 2.734380545261835e-06, "epoch": 0.4965781395217844, "percentage": 49.66, "elapsed_time": "6:40:37", "remaining_time": "6:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2205, "total_steps": 4438, "loss": 0.1433, "learning_rate": 2.7325257865164955e-06, "epoch": 0.4968034472075929, "percentage": 49.68, "elapsed_time": "6:40:48", "remaining_time": "6:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2206, "total_steps": 4438, "loss": 0.1659, "learning_rate": 2.730670898658255e-06, "epoch": 0.4970287548934013, "percentage": 49.71, "elapsed_time": "6:40:59", "remaining_time": "6:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2207, "total_steps": 4438, "loss": 0.1345, "learning_rate": 2.7288158827170623e-06, "epoch": 0.49725406257920973, "percentage": 49.73, "elapsed_time": "6:41:09", "remaining_time": "6:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2208, "total_steps": 4438, "loss": 0.1539, "learning_rate": 2.726960739722939e-06, "epoch": 0.49747937026501815, "percentage": 49.75, "elapsed_time": "6:41:21", "remaining_time": "6:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2209, "total_steps": 4438, "loss": 0.1525, "learning_rate": 2.725105470705977e-06, "epoch": 0.4977046779508266, "percentage": 49.77, "elapsed_time": "6:41:32", "remaining_time": "6:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 4438, "loss": 0.16, "learning_rate": 2.7232500766963373e-06, "epoch": 0.49792998563663504, "percentage": 49.8, "elapsed_time": "6:41:44", "remaining_time": "6:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2211, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.7213945587242507e-06, "epoch": 0.49815529332244346, "percentage": 49.82, "elapsed_time": "6:41:55", "remaining_time": "6:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2212, "total_steps": 4438, "loss": 0.1535, "learning_rate": 2.7195389178200194e-06, "epoch": 0.4983806010082519, "percentage": 49.84, "elapsed_time": "6:42:07", "remaining_time": "6:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2213, "total_steps": 4438, "loss": 0.1622, "learning_rate": 2.7176831550140093e-06, "epoch": 0.49860590869406035, "percentage": 49.86, "elapsed_time": "6:42:17", "remaining_time": "6:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2214, "total_steps": 4438, "loss": 0.1319, "learning_rate": 2.7158272713366573e-06, "epoch": 0.49883121637986877, "percentage": 49.89, "elapsed_time": "6:42:28", "remaining_time": "6:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2215, "total_steps": 4438, "loss": 0.1562, "learning_rate": 2.713971267818466e-06, "epoch": 0.4990565240656772, "percentage": 49.91, "elapsed_time": "6:42:38", "remaining_time": "6:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2216, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.7121151454900048e-06, "epoch": 0.4992818317514856, "percentage": 49.93, "elapsed_time": "6:42:49", "remaining_time": "6:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2217, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.7102589053819107e-06, "epoch": 0.4995071394372941, "percentage": 49.95, "elapsed_time": "6:42:59", "remaining_time": "6:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2218, "total_steps": 4438, "loss": 0.1528, "learning_rate": 2.7084025485248827e-06, "epoch": 0.4997324471231025, "percentage": 49.98, "elapsed_time": "6:43:09", "remaining_time": "6:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2219, "total_steps": 4438, "loss": 0.1473, "learning_rate": 2.706546075949688e-06, "epoch": 0.4999577548089109, "percentage": 50.0, "elapsed_time": "6:43:19", "remaining_time": "6:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 4438, "loss": 0.1507, "learning_rate": 2.7046894886871564e-06, "epoch": 0.5001830624947193, "percentage": 50.02, "elapsed_time": "6:43:30", "remaining_time": "6:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2221, "total_steps": 4438, "loss": 0.1541, "learning_rate": 2.7028327877681808e-06, "epoch": 0.5004083701805278, "percentage": 50.05, "elapsed_time": "6:43:41", "remaining_time": "6:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2222, "total_steps": 4438, "loss": 0.1509, "learning_rate": 2.700975974223719e-06, "epoch": 0.5006336778663362, "percentage": 50.07, "elapsed_time": "6:43:52", "remaining_time": "6:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2223, "total_steps": 4438, "loss": 0.1396, "learning_rate": 2.6991190490847898e-06, "epoch": 0.5008589855521447, "percentage": 50.09, "elapsed_time": "6:44:02", "remaining_time": "6:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2224, "total_steps": 4438, "loss": 0.1515, "learning_rate": 2.6972620133824745e-06, "epoch": 0.5010842932379531, "percentage": 50.11, "elapsed_time": "6:44:12", "remaining_time": "6:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2225, "total_steps": 4438, "loss": 0.1481, "learning_rate": 2.695404868147916e-06, "epoch": 0.5013096009237615, "percentage": 50.14, "elapsed_time": "6:44:23", "remaining_time": "6:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2226, "total_steps": 4438, "loss": 0.1427, "learning_rate": 2.6935476144123173e-06, "epoch": 0.50153490860957, "percentage": 50.16, "elapsed_time": "6:44:34", "remaining_time": "6:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2227, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.691690253206943e-06, "epoch": 0.5017602162953784, "percentage": 50.18, "elapsed_time": "6:44:44", "remaining_time": "6:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2228, "total_steps": 4438, "loss": 0.1419, "learning_rate": 2.689832785563116e-06, "epoch": 0.5019855239811868, "percentage": 50.2, "elapsed_time": "6:44:54", "remaining_time": "6:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2229, "total_steps": 4438, "loss": 0.1415, "learning_rate": 2.6879752125122193e-06, "epoch": 0.5022108316669952, "percentage": 50.23, "elapsed_time": "6:45:05", "remaining_time": "6:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 4438, "loss": 0.1596, "learning_rate": 2.6861175350856937e-06, "epoch": 0.5024361393528036, "percentage": 50.25, "elapsed_time": "6:45:14", "remaining_time": "6:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2231, "total_steps": 4438, "loss": 0.1625, "learning_rate": 2.684259754315038e-06, "epoch": 0.5026614470386122, "percentage": 50.27, "elapsed_time": "6:45:26", "remaining_time": "6:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2232, "total_steps": 4438, "loss": 0.1477, "learning_rate": 2.6824018712318084e-06, "epoch": 0.5028867547244206, "percentage": 50.29, "elapsed_time": "6:45:38", "remaining_time": "6:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2233, "total_steps": 4438, "loss": 0.1531, "learning_rate": 2.6805438868676186e-06, "epoch": 0.503112062410229, "percentage": 50.32, "elapsed_time": "6:45:48", "remaining_time": "6:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2234, "total_steps": 4438, "loss": 0.1425, "learning_rate": 2.6786858022541385e-06, "epoch": 0.5033373700960374, "percentage": 50.34, "elapsed_time": "6:45:59", "remaining_time": "6:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2235, "total_steps": 4438, "loss": 0.165, "learning_rate": 2.676827618423093e-06, "epoch": 0.5035626777818458, "percentage": 50.36, "elapsed_time": "6:46:10", "remaining_time": "6:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2236, "total_steps": 4438, "loss": 0.1487, "learning_rate": 2.674969336406262e-06, "epoch": 0.5037879854676542, "percentage": 50.38, "elapsed_time": "6:46:21", "remaining_time": "6:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2237, "total_steps": 4438, "loss": 0.1583, "learning_rate": 2.6731109572354795e-06, "epoch": 0.5040132931534627, "percentage": 50.41, "elapsed_time": "6:46:30", "remaining_time": "6:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2238, "total_steps": 4438, "loss": 0.1677, "learning_rate": 2.6712524819426355e-06, "epoch": 0.5042386008392711, "percentage": 50.43, "elapsed_time": "6:46:41", "remaining_time": "6:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2239, "total_steps": 4438, "loss": 0.1454, "learning_rate": 2.6693939115596718e-06, "epoch": 0.5044639085250796, "percentage": 50.45, "elapsed_time": "6:46:51", "remaining_time": "6:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 4438, "loss": 0.1373, "learning_rate": 2.6675352471185824e-06, "epoch": 0.504689216210888, "percentage": 50.47, "elapsed_time": "6:47:01", "remaining_time": "6:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2241, "total_steps": 4438, "loss": 0.1471, "learning_rate": 2.6656764896514152e-06, "epoch": 0.5049145238966964, "percentage": 50.5, "elapsed_time": "6:47:12", "remaining_time": "6:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2242, "total_steps": 4438, "loss": 0.1626, "learning_rate": 2.6638176401902693e-06, "epoch": 0.5051398315825049, "percentage": 50.52, "elapsed_time": "6:47:22", "remaining_time": "6:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2243, "total_steps": 4438, "loss": 0.1414, "learning_rate": 2.6619586997672923e-06, "epoch": 0.5053651392683133, "percentage": 50.54, "elapsed_time": "6:47:32", "remaining_time": "6:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2244, "total_steps": 4438, "loss": 0.1559, "learning_rate": 2.6600996694146876e-06, "epoch": 0.5055904469541217, "percentage": 50.56, "elapsed_time": "6:47:42", "remaining_time": "6:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2245, "total_steps": 4438, "loss": 0.1427, "learning_rate": 2.658240550164704e-06, "epoch": 0.5058157546399301, "percentage": 50.59, "elapsed_time": "6:47:54", "remaining_time": "6:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2246, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.656381343049641e-06, "epoch": 0.5060410623257385, "percentage": 50.61, "elapsed_time": "6:48:04", "remaining_time": "6:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2247, "total_steps": 4438, "loss": 0.1412, "learning_rate": 2.654522049101847e-06, "epoch": 0.5062663700115471, "percentage": 50.63, "elapsed_time": "6:48:15", "remaining_time": "6:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2248, "total_steps": 4438, "loss": 0.1597, "learning_rate": 2.652662669353719e-06, "epoch": 0.5064916776973555, "percentage": 50.65, "elapsed_time": "6:48:25", "remaining_time": "6:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2249, "total_steps": 4438, "loss": 0.1314, "learning_rate": 2.6508032048377006e-06, "epoch": 0.5067169853831639, "percentage": 50.68, "elapsed_time": "6:48:35", "remaining_time": "6:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 4438, "loss": 0.1457, "learning_rate": 2.648943656586284e-06, "epoch": 0.5069422930689723, "percentage": 50.7, "elapsed_time": "6:48:45", "remaining_time": "6:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2251, "total_steps": 4438, "loss": 0.1444, "learning_rate": 2.6470840256320064e-06, "epoch": 0.5071676007547807, "percentage": 50.72, "elapsed_time": "6:48:54", "remaining_time": "6:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2252, "total_steps": 4438, "loss": 0.1286, "learning_rate": 2.6452243130074523e-06, "epoch": 0.5073929084405892, "percentage": 50.74, "elapsed_time": "6:49:05", "remaining_time": "6:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2253, "total_steps": 4438, "loss": 0.1469, "learning_rate": 2.6433645197452493e-06, "epoch": 0.5076182161263976, "percentage": 50.77, "elapsed_time": "6:49:15", "remaining_time": "6:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2254, "total_steps": 4438, "loss": 0.1415, "learning_rate": 2.6415046468780726e-06, "epoch": 0.5078435238122061, "percentage": 50.79, "elapsed_time": "6:49:26", "remaining_time": "6:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2255, "total_steps": 4438, "loss": 0.1332, "learning_rate": 2.63964469543864e-06, "epoch": 0.5080688314980145, "percentage": 50.81, "elapsed_time": "6:49:36", "remaining_time": "6:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2256, "total_steps": 4438, "loss": 0.1462, "learning_rate": 2.637784666459714e-06, "epoch": 0.5082941391838229, "percentage": 50.83, "elapsed_time": "6:49:47", "remaining_time": "6:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2257, "total_steps": 4438, "loss": 0.1602, "learning_rate": 2.635924560974098e-06, "epoch": 0.5085194468696314, "percentage": 50.86, "elapsed_time": "6:49:58", "remaining_time": "6:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2258, "total_steps": 4438, "loss": 0.1486, "learning_rate": 2.6340643800146387e-06, "epoch": 0.5087447545554398, "percentage": 50.88, "elapsed_time": "6:50:07", "remaining_time": "6:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2259, "total_steps": 4438, "loss": 0.1527, "learning_rate": 2.6322041246142273e-06, "epoch": 0.5089700622412482, "percentage": 50.9, "elapsed_time": "6:50:19", "remaining_time": "6:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 4438, "loss": 0.1511, "learning_rate": 2.6303437958057932e-06, "epoch": 0.5091953699270566, "percentage": 50.92, "elapsed_time": "6:50:29", "remaining_time": "6:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2261, "total_steps": 4438, "loss": 0.1461, "learning_rate": 2.6284833946223075e-06, "epoch": 0.509420677612865, "percentage": 50.95, "elapsed_time": "6:50:40", "remaining_time": "6:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2262, "total_steps": 4438, "loss": 0.1543, "learning_rate": 2.626622922096782e-06, "epoch": 0.5096459852986736, "percentage": 50.97, "elapsed_time": "6:50:50", "remaining_time": "6:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2263, "total_steps": 4438, "loss": 0.1391, "learning_rate": 2.624762379262268e-06, "epoch": 0.509871292984482, "percentage": 50.99, "elapsed_time": "6:51:01", "remaining_time": "6:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2264, "total_steps": 4438, "loss": 0.1461, "learning_rate": 2.622901767151855e-06, "epoch": 0.5100966006702904, "percentage": 51.01, "elapsed_time": "6:51:12", "remaining_time": "6:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2265, "total_steps": 4438, "loss": 0.1411, "learning_rate": 2.6210410867986713e-06, "epoch": 0.5103219083560988, "percentage": 51.04, "elapsed_time": "6:51:22", "remaining_time": "6:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2266, "total_steps": 4438, "loss": 0.1428, "learning_rate": 2.619180339235884e-06, "epoch": 0.5105472160419072, "percentage": 51.06, "elapsed_time": "6:51:33", "remaining_time": "6:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2267, "total_steps": 4438, "loss": 0.1602, "learning_rate": 2.6173195254966966e-06, "epoch": 0.5107725237277156, "percentage": 51.08, "elapsed_time": "6:51:45", "remaining_time": "6:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2268, "total_steps": 4438, "loss": 0.1397, "learning_rate": 2.6154586466143495e-06, "epoch": 0.5109978314135241, "percentage": 51.1, "elapsed_time": "6:51:56", "remaining_time": "6:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2269, "total_steps": 4438, "loss": 0.1344, "learning_rate": 2.6135977036221195e-06, "epoch": 0.5112231390993325, "percentage": 51.13, "elapsed_time": "6:52:06", "remaining_time": "6:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 4438, "loss": 0.146, "learning_rate": 2.6117366975533187e-06, "epoch": 0.511448446785141, "percentage": 51.15, "elapsed_time": "6:52:18", "remaining_time": "6:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2271, "total_steps": 4438, "loss": 0.1636, "learning_rate": 2.609875629441295e-06, "epoch": 0.5116737544709494, "percentage": 51.17, "elapsed_time": "6:52:29", "remaining_time": "6:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2272, "total_steps": 4438, "loss": 0.1388, "learning_rate": 2.60801450031943e-06, "epoch": 0.5118990621567578, "percentage": 51.19, "elapsed_time": "6:52:40", "remaining_time": "6:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2273, "total_steps": 4438, "loss": 0.1459, "learning_rate": 2.6061533112211394e-06, "epoch": 0.5121243698425663, "percentage": 51.22, "elapsed_time": "6:52:49", "remaining_time": "6:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2274, "total_steps": 4438, "loss": 0.1562, "learning_rate": 2.604292063179871e-06, "epoch": 0.5123496775283747, "percentage": 51.24, "elapsed_time": "6:53:01", "remaining_time": "6:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2275, "total_steps": 4438, "loss": 0.1507, "learning_rate": 2.602430757229108e-06, "epoch": 0.5125749852141831, "percentage": 51.26, "elapsed_time": "6:53:13", "remaining_time": "6:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2276, "total_steps": 4438, "loss": 0.1475, "learning_rate": 2.600569394402363e-06, "epoch": 0.5128002928999915, "percentage": 51.28, "elapsed_time": "6:53:22", "remaining_time": "6:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2277, "total_steps": 4438, "loss": 0.1571, "learning_rate": 2.5987079757331824e-06, "epoch": 0.5130256005857999, "percentage": 51.31, "elapsed_time": "6:53:34", "remaining_time": "6:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2278, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.596846502255142e-06, "epoch": 0.5132509082716085, "percentage": 51.33, "elapsed_time": "6:53:44", "remaining_time": "6:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2279, "total_steps": 4438, "loss": 0.1488, "learning_rate": 2.5949849750018486e-06, "epoch": 0.5134762159574169, "percentage": 51.35, "elapsed_time": "6:53:56", "remaining_time": "6:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 4438, "loss": 0.1464, "learning_rate": 2.5931233950069385e-06, "epoch": 0.5137015236432253, "percentage": 51.37, "elapsed_time": "6:54:07", "remaining_time": "6:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2281, "total_steps": 4438, "loss": 0.1474, "learning_rate": 2.591261763304079e-06, "epoch": 0.5139268313290337, "percentage": 51.4, "elapsed_time": "6:54:18", "remaining_time": "6:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2282, "total_steps": 4438, "loss": 0.1394, "learning_rate": 2.589400080926964e-06, "epoch": 0.5141521390148421, "percentage": 51.42, "elapsed_time": "6:54:29", "remaining_time": "6:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2283, "total_steps": 4438, "loss": 0.1536, "learning_rate": 2.5875383489093165e-06, "epoch": 0.5143774467006506, "percentage": 51.44, "elapsed_time": "6:54:41", "remaining_time": "6:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2284, "total_steps": 4438, "loss": 0.149, "learning_rate": 2.585676568284886e-06, "epoch": 0.514602754386459, "percentage": 51.46, "elapsed_time": "6:54:52", "remaining_time": "6:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2285, "total_steps": 4438, "loss": 0.1417, "learning_rate": 2.583814740087451e-06, "epoch": 0.5148280620722674, "percentage": 51.49, "elapsed_time": "6:55:03", "remaining_time": "6:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2286, "total_steps": 4438, "loss": 0.1549, "learning_rate": 2.581952865350815e-06, "epoch": 0.5150533697580759, "percentage": 51.51, "elapsed_time": "6:55:13", "remaining_time": "6:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2287, "total_steps": 4438, "loss": 0.1462, "learning_rate": 2.5800909451088075e-06, "epoch": 0.5152786774438843, "percentage": 51.53, "elapsed_time": "6:55:23", "remaining_time": "6:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2288, "total_steps": 4438, "loss": 0.1448, "learning_rate": 2.578228980395283e-06, "epoch": 0.5155039851296928, "percentage": 51.55, "elapsed_time": "6:55:33", "remaining_time": "6:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2289, "total_steps": 4438, "loss": 0.1527, "learning_rate": 2.5763669722441226e-06, "epoch": 0.5157292928155012, "percentage": 51.58, "elapsed_time": "6:55:44", "remaining_time": "6:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 4438, "loss": 0.1316, "learning_rate": 2.5745049216892286e-06, "epoch": 0.5159546005013096, "percentage": 51.6, "elapsed_time": "6:55:55", "remaining_time": "6:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2291, "total_steps": 4438, "loss": 0.1464, "learning_rate": 2.5726428297645285e-06, "epoch": 0.516179908187118, "percentage": 51.62, "elapsed_time": "6:56:05", "remaining_time": "6:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2292, "total_steps": 4438, "loss": 0.1464, "learning_rate": 2.570780697503973e-06, "epoch": 0.5164052158729264, "percentage": 51.64, "elapsed_time": "6:56:16", "remaining_time": "6:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2293, "total_steps": 4438, "loss": 0.1619, "learning_rate": 2.5689185259415346e-06, "epoch": 0.5166305235587348, "percentage": 51.67, "elapsed_time": "6:56:27", "remaining_time": "6:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2294, "total_steps": 4438, "loss": 0.1341, "learning_rate": 2.5670563161112073e-06, "epoch": 0.5168558312445434, "percentage": 51.69, "elapsed_time": "6:56:38", "remaining_time": "6:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2295, "total_steps": 4438, "loss": 0.1524, "learning_rate": 2.5651940690470074e-06, "epoch": 0.5170811389303518, "percentage": 51.71, "elapsed_time": "6:56:49", "remaining_time": "6:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2296, "total_steps": 4438, "loss": 0.1584, "learning_rate": 2.56333178578297e-06, "epoch": 0.5173064466161602, "percentage": 51.74, "elapsed_time": "6:56:59", "remaining_time": "6:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2297, "total_steps": 4438, "loss": 0.1484, "learning_rate": 2.5614694673531533e-06, "epoch": 0.5175317543019686, "percentage": 51.76, "elapsed_time": "6:57:09", "remaining_time": "6:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2298, "total_steps": 4438, "loss": 0.1373, "learning_rate": 2.5596071147916325e-06, "epoch": 0.517757061987777, "percentage": 51.78, "elapsed_time": "6:57:19", "remaining_time": "6:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2299, "total_steps": 4438, "loss": 0.1626, "learning_rate": 2.557744729132503e-06, "epoch": 0.5179823696735855, "percentage": 51.8, "elapsed_time": "6:57:30", "remaining_time": "6:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 4438, "loss": 0.1529, "learning_rate": 2.555882311409878e-06, "epoch": 0.5182076773593939, "percentage": 51.83, "elapsed_time": "6:57:41", "remaining_time": "6:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2301, "total_steps": 4438, "loss": 0.1492, "learning_rate": 2.554019862657888e-06, "epoch": 0.5184329850452023, "percentage": 51.85, "elapsed_time": "6:57:53", "remaining_time": "6:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2302, "total_steps": 4438, "loss": 0.1476, "learning_rate": 2.5521573839106815e-06, "epoch": 0.5186582927310108, "percentage": 51.87, "elapsed_time": "6:58:04", "remaining_time": "6:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2303, "total_steps": 4438, "loss": 0.1414, "learning_rate": 2.5502948762024244e-06, "epoch": 0.5188836004168192, "percentage": 51.89, "elapsed_time": "6:58:14", "remaining_time": "6:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2304, "total_steps": 4438, "loss": 0.156, "learning_rate": 2.5484323405672965e-06, "epoch": 0.5191089081026277, "percentage": 51.92, "elapsed_time": "6:58:25", "remaining_time": "6:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2305, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.546569778039496e-06, "epoch": 0.5193342157884361, "percentage": 51.94, "elapsed_time": "6:58:36", "remaining_time": "6:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2306, "total_steps": 4438, "loss": 0.1479, "learning_rate": 2.544707189653233e-06, "epoch": 0.5195595234742445, "percentage": 51.96, "elapsed_time": "6:58:46", "remaining_time": "6:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2307, "total_steps": 4438, "loss": 0.1509, "learning_rate": 2.542844576442734e-06, "epoch": 0.5197848311600529, "percentage": 51.98, "elapsed_time": "6:58:57", "remaining_time": "6:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2308, "total_steps": 4438, "loss": 0.1404, "learning_rate": 2.5409819394422386e-06, "epoch": 0.5200101388458613, "percentage": 52.01, "elapsed_time": "6:59:08", "remaining_time": "6:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2309, "total_steps": 4438, "loss": 0.1311, "learning_rate": 2.539119279686001e-06, "epoch": 0.5202354465316699, "percentage": 52.03, "elapsed_time": "6:59:17", "remaining_time": "6:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 4438, "loss": 0.155, "learning_rate": 2.5372565982082843e-06, "epoch": 0.5204607542174783, "percentage": 52.05, "elapsed_time": "6:59:27", "remaining_time": "6:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2311, "total_steps": 4438, "loss": 0.1623, "learning_rate": 2.535393896043368e-06, "epoch": 0.5206860619032867, "percentage": 52.07, "elapsed_time": "6:59:38", "remaining_time": "6:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2312, "total_steps": 4438, "loss": 0.1548, "learning_rate": 2.5335311742255392e-06, "epoch": 0.5209113695890951, "percentage": 52.1, "elapsed_time": "6:59:50", "remaining_time": "6:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2313, "total_steps": 4438, "loss": 0.1454, "learning_rate": 2.5316684337891005e-06, "epoch": 0.5211366772749035, "percentage": 52.12, "elapsed_time": "7:00:01", "remaining_time": "6:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2314, "total_steps": 4438, "loss": 0.1689, "learning_rate": 2.5298056757683604e-06, "epoch": 0.521361984960712, "percentage": 52.14, "elapsed_time": "7:00:10", "remaining_time": "6:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2315, "total_steps": 4438, "loss": 0.1492, "learning_rate": 2.52794290119764e-06, "epoch": 0.5215872926465204, "percentage": 52.16, "elapsed_time": "7:00:22", "remaining_time": "6:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2316, "total_steps": 4438, "loss": 0.1683, "learning_rate": 2.5260801111112677e-06, "epoch": 0.5218126003323288, "percentage": 52.19, "elapsed_time": "7:00:32", "remaining_time": "6:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2317, "total_steps": 4438, "loss": 0.1417, "learning_rate": 2.5242173065435815e-06, "epoch": 0.5220379080181373, "percentage": 52.21, "elapsed_time": "7:00:42", "remaining_time": "6:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2318, "total_steps": 4438, "loss": 0.1316, "learning_rate": 2.5223544885289287e-06, "epoch": 0.5222632157039457, "percentage": 52.23, "elapsed_time": "7:00:53", "remaining_time": "6:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2319, "total_steps": 4438, "loss": 0.1469, "learning_rate": 2.5204916581016608e-06, "epoch": 0.5224885233897542, "percentage": 52.25, "elapsed_time": "7:01:02", "remaining_time": "6:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 4438, "loss": 0.1468, "learning_rate": 2.518628816296139e-06, "epoch": 0.5227138310755626, "percentage": 52.28, "elapsed_time": "7:01:14", "remaining_time": "6:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2321, "total_steps": 4438, "loss": 0.1422, "learning_rate": 2.5167659641467302e-06, "epoch": 0.522939138761371, "percentage": 52.3, "elapsed_time": "7:01:24", "remaining_time": "6:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2322, "total_steps": 4438, "loss": 0.1507, "learning_rate": 2.5149031026878063e-06, "epoch": 0.5231644464471794, "percentage": 52.32, "elapsed_time": "7:01:34", "remaining_time": "6:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2323, "total_steps": 4438, "loss": 0.1217, "learning_rate": 2.5130402329537444e-06, "epoch": 0.5233897541329878, "percentage": 52.34, "elapsed_time": "7:01:45", "remaining_time": "6:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2324, "total_steps": 4438, "loss": 0.1565, "learning_rate": 2.5111773559789277e-06, "epoch": 0.5236150618187962, "percentage": 52.37, "elapsed_time": "7:01:55", "remaining_time": "6:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2325, "total_steps": 4438, "loss": 0.1369, "learning_rate": 2.509314472797742e-06, "epoch": 0.5238403695046048, "percentage": 52.39, "elapsed_time": "7:02:06", "remaining_time": "6:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2326, "total_steps": 4438, "loss": 0.1406, "learning_rate": 2.5074515844445774e-06, "epoch": 0.5240656771904132, "percentage": 52.41, "elapsed_time": "7:02:16", "remaining_time": "6:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2327, "total_steps": 4438, "loss": 0.1714, "learning_rate": 2.5055886919538247e-06, "epoch": 0.5242909848762216, "percentage": 52.43, "elapsed_time": "7:02:28", "remaining_time": "6:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2328, "total_steps": 4438, "loss": 0.1475, "learning_rate": 2.50372579635988e-06, "epoch": 0.52451629256203, "percentage": 52.46, "elapsed_time": "7:02:38", "remaining_time": "6:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2329, "total_steps": 4438, "loss": 0.1298, "learning_rate": 2.5018628986971395e-06, "epoch": 0.5247416002478384, "percentage": 52.48, "elapsed_time": "7:02:48", "remaining_time": "6:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 4438, "loss": 0.1381, "learning_rate": 2.5e-06, "epoch": 0.5249669079336469, "percentage": 52.5, "elapsed_time": "7:02:59", "remaining_time": "6:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2331, "total_steps": 4438, "loss": 0.1644, "learning_rate": 2.4981371013028618e-06, "epoch": 0.5251922156194553, "percentage": 52.52, "elapsed_time": "7:03:10", "remaining_time": "6:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2332, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.4962742036401213e-06, "epoch": 0.5254175233052637, "percentage": 52.55, "elapsed_time": "7:03:20", "remaining_time": "6:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2333, "total_steps": 4438, "loss": 0.1407, "learning_rate": 2.494411308046176e-06, "epoch": 0.5256428309910722, "percentage": 52.57, "elapsed_time": "7:03:31", "remaining_time": "6:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2334, "total_steps": 4438, "loss": 0.1543, "learning_rate": 2.4925484155554235e-06, "epoch": 0.5258681386768806, "percentage": 52.59, "elapsed_time": "7:03:42", "remaining_time": "6:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2335, "total_steps": 4438, "loss": 0.1684, "learning_rate": 2.490685527202258e-06, "epoch": 0.5260934463626891, "percentage": 52.61, "elapsed_time": "7:03:53", "remaining_time": "6:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2336, "total_steps": 4438, "loss": 0.1441, "learning_rate": 2.4888226440210723e-06, "epoch": 0.5263187540484975, "percentage": 52.64, "elapsed_time": "7:04:05", "remaining_time": "6:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2337, "total_steps": 4438, "loss": 0.1458, "learning_rate": 2.4869597670462555e-06, "epoch": 0.5265440617343059, "percentage": 52.66, "elapsed_time": "7:04:15", "remaining_time": "6:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2338, "total_steps": 4438, "loss": 0.1564, "learning_rate": 2.4850968973121945e-06, "epoch": 0.5267693694201143, "percentage": 52.68, "elapsed_time": "7:04:25", "remaining_time": "6:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2339, "total_steps": 4438, "loss": 0.1512, "learning_rate": 2.483234035853271e-06, "epoch": 0.5269946771059227, "percentage": 52.7, "elapsed_time": "7:04:36", "remaining_time": "6:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 4438, "loss": 0.1346, "learning_rate": 2.481371183703862e-06, "epoch": 0.5272199847917312, "percentage": 52.73, "elapsed_time": "7:04:47", "remaining_time": "6:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2341, "total_steps": 4438, "loss": 0.1514, "learning_rate": 2.4795083418983405e-06, "epoch": 0.5274452924775397, "percentage": 52.75, "elapsed_time": "7:04:58", "remaining_time": "6:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2342, "total_steps": 4438, "loss": 0.1523, "learning_rate": 2.477645511471073e-06, "epoch": 0.5276706001633481, "percentage": 52.77, "elapsed_time": "7:05:09", "remaining_time": "6:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2343, "total_steps": 4438, "loss": 0.1327, "learning_rate": 2.475782693456419e-06, "epoch": 0.5278959078491565, "percentage": 52.79, "elapsed_time": "7:05:18", "remaining_time": "6:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2344, "total_steps": 4438, "loss": 0.1336, "learning_rate": 2.473919888888733e-06, "epoch": 0.5281212155349649, "percentage": 52.82, "elapsed_time": "7:05:28", "remaining_time": "6:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2345, "total_steps": 4438, "loss": 0.1465, "learning_rate": 2.472057098802361e-06, "epoch": 0.5283465232207734, "percentage": 52.84, "elapsed_time": "7:05:39", "remaining_time": "6:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2346, "total_steps": 4438, "loss": 0.1343, "learning_rate": 2.4701943242316405e-06, "epoch": 0.5285718309065818, "percentage": 52.86, "elapsed_time": "7:05:51", "remaining_time": "6:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2347, "total_steps": 4438, "loss": 0.1563, "learning_rate": 2.4683315662109003e-06, "epoch": 0.5287971385923902, "percentage": 52.88, "elapsed_time": "7:06:01", "remaining_time": "6:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2348, "total_steps": 4438, "loss": 0.1315, "learning_rate": 2.466468825774461e-06, "epoch": 0.5290224462781986, "percentage": 52.91, "elapsed_time": "7:06:10", "remaining_time": "6:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2349, "total_steps": 4438, "loss": 0.1419, "learning_rate": 2.464606103956633e-06, "epoch": 0.5292477539640071, "percentage": 52.93, "elapsed_time": "7:06:21", "remaining_time": "6:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 4438, "loss": 0.1577, "learning_rate": 2.462743401791716e-06, "epoch": 0.5294730616498156, "percentage": 52.95, "elapsed_time": "7:06:34", "remaining_time": "6:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2351, "total_steps": 4438, "loss": 0.1463, "learning_rate": 2.460880720314e-06, "epoch": 0.529698369335624, "percentage": 52.97, "elapsed_time": "7:06:45", "remaining_time": "6:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2352, "total_steps": 4438, "loss": 0.1485, "learning_rate": 2.4590180605577614e-06, "epoch": 0.5299236770214324, "percentage": 53.0, "elapsed_time": "7:06:56", "remaining_time": "6:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2353, "total_steps": 4438, "loss": 0.1436, "learning_rate": 2.4571554235572665e-06, "epoch": 0.5301489847072408, "percentage": 53.02, "elapsed_time": "7:07:06", "remaining_time": "6:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2354, "total_steps": 4438, "loss": 0.1503, "learning_rate": 2.4552928103467677e-06, "epoch": 0.5303742923930492, "percentage": 53.04, "elapsed_time": "7:07:15", "remaining_time": "6:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2355, "total_steps": 4438, "loss": 0.1509, "learning_rate": 2.4534302219605044e-06, "epoch": 0.5305996000788576, "percentage": 53.06, "elapsed_time": "7:07:26", "remaining_time": "6:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2356, "total_steps": 4438, "loss": 0.1414, "learning_rate": 2.4515676594327035e-06, "epoch": 0.5308249077646662, "percentage": 53.09, "elapsed_time": "7:07:38", "remaining_time": "6:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2357, "total_steps": 4438, "loss": 0.1514, "learning_rate": 2.4497051237975773e-06, "epoch": 0.5310502154504746, "percentage": 53.11, "elapsed_time": "7:07:49", "remaining_time": "6:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2358, "total_steps": 4438, "loss": 0.1579, "learning_rate": 2.4478426160893197e-06, "epoch": 0.531275523136283, "percentage": 53.13, "elapsed_time": "7:08:00", "remaining_time": "6:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2359, "total_steps": 4438, "loss": 0.1462, "learning_rate": 2.4459801373421134e-06, "epoch": 0.5315008308220914, "percentage": 53.15, "elapsed_time": "7:08:10", "remaining_time": "6:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 4438, "loss": 0.1458, "learning_rate": 2.4441176885901234e-06, "epoch": 0.5317261385078998, "percentage": 53.18, "elapsed_time": "7:08:20", "remaining_time": "6:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2361, "total_steps": 4438, "loss": 0.1429, "learning_rate": 2.4422552708674977e-06, "epoch": 0.5319514461937083, "percentage": 53.2, "elapsed_time": "7:08:31", "remaining_time": "6:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2362, "total_steps": 4438, "loss": 0.1384, "learning_rate": 2.440392885208368e-06, "epoch": 0.5321767538795167, "percentage": 53.22, "elapsed_time": "7:08:43", "remaining_time": "6:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2363, "total_steps": 4438, "loss": 0.1432, "learning_rate": 2.4385305326468475e-06, "epoch": 0.5324020615653251, "percentage": 53.24, "elapsed_time": "7:08:52", "remaining_time": "6:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2364, "total_steps": 4438, "loss": 0.1384, "learning_rate": 2.436668214217031e-06, "epoch": 0.5326273692511336, "percentage": 53.27, "elapsed_time": "7:09:02", "remaining_time": "6:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2365, "total_steps": 4438, "loss": 0.1455, "learning_rate": 2.4348059309529935e-06, "epoch": 0.532852676936942, "percentage": 53.29, "elapsed_time": "7:09:12", "remaining_time": "6:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2366, "total_steps": 4438, "loss": 0.139, "learning_rate": 2.4329436838887936e-06, "epoch": 0.5330779846227505, "percentage": 53.31, "elapsed_time": "7:09:22", "remaining_time": "6:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2367, "total_steps": 4438, "loss": 0.1502, "learning_rate": 2.4310814740584663e-06, "epoch": 0.5333032923085589, "percentage": 53.33, "elapsed_time": "7:09:34", "remaining_time": "6:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2368, "total_steps": 4438, "loss": 0.1466, "learning_rate": 2.4292193024960275e-06, "epoch": 0.5335285999943673, "percentage": 53.36, "elapsed_time": "7:09:44", "remaining_time": "6:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2369, "total_steps": 4438, "loss": 0.125, "learning_rate": 2.427357170235472e-06, "epoch": 0.5337539076801757, "percentage": 53.38, "elapsed_time": "7:09:54", "remaining_time": "6:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 4438, "loss": 0.1406, "learning_rate": 2.425495078310772e-06, "epoch": 0.5339792153659841, "percentage": 53.4, "elapsed_time": "7:10:05", "remaining_time": "6:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2371, "total_steps": 4438, "loss": 0.1566, "learning_rate": 2.4236330277558774e-06, "epoch": 0.5342045230517926, "percentage": 53.42, "elapsed_time": "7:10:14", "remaining_time": "6:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2372, "total_steps": 4438, "loss": 0.1592, "learning_rate": 2.4217710196047166e-06, "epoch": 0.5344298307376011, "percentage": 53.45, "elapsed_time": "7:10:23", "remaining_time": "6:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2373, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.419909054891193e-06, "epoch": 0.5346551384234095, "percentage": 53.47, "elapsed_time": "7:10:34", "remaining_time": "6:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2374, "total_steps": 4438, "loss": 0.1461, "learning_rate": 2.4180471346491864e-06, "epoch": 0.5348804461092179, "percentage": 53.49, "elapsed_time": "7:10:44", "remaining_time": "6:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2375, "total_steps": 4438, "loss": 0.1502, "learning_rate": 2.4161852599125504e-06, "epoch": 0.5351057537950263, "percentage": 53.52, "elapsed_time": "7:10:56", "remaining_time": "6:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2376, "total_steps": 4438, "loss": 0.1311, "learning_rate": 2.414323431715115e-06, "epoch": 0.5353310614808348, "percentage": 53.54, "elapsed_time": "7:11:06", "remaining_time": "6:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2377, "total_steps": 4438, "loss": 0.1399, "learning_rate": 2.412461651090685e-06, "epoch": 0.5355563691666432, "percentage": 53.56, "elapsed_time": "7:11:15", "remaining_time": "6:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2378, "total_steps": 4438, "loss": 0.139, "learning_rate": 2.410599919073037e-06, "epoch": 0.5357816768524516, "percentage": 53.58, "elapsed_time": "7:11:25", "remaining_time": "6:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2379, "total_steps": 4438, "loss": 0.1443, "learning_rate": 2.408738236695922e-06, "epoch": 0.53600698453826, "percentage": 53.61, "elapsed_time": "7:11:36", "remaining_time": "6:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 4438, "loss": 0.1516, "learning_rate": 2.4068766049930623e-06, "epoch": 0.5362322922240685, "percentage": 53.63, "elapsed_time": "7:11:47", "remaining_time": "6:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2381, "total_steps": 4438, "loss": 0.1487, "learning_rate": 2.4050150249981522e-06, "epoch": 0.536457599909877, "percentage": 53.65, "elapsed_time": "7:11:58", "remaining_time": "6:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2382, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.403153497744859e-06, "epoch": 0.5366829075956854, "percentage": 53.67, "elapsed_time": "7:12:09", "remaining_time": "6:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2383, "total_steps": 4438, "loss": 0.1414, "learning_rate": 2.4012920242668184e-06, "epoch": 0.5369082152814938, "percentage": 53.7, "elapsed_time": "7:12:20", "remaining_time": "6:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2384, "total_steps": 4438, "loss": 0.1481, "learning_rate": 2.3994306055976374e-06, "epoch": 0.5371335229673022, "percentage": 53.72, "elapsed_time": "7:12:30", "remaining_time": "6:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2385, "total_steps": 4438, "loss": 0.1589, "learning_rate": 2.397569242770893e-06, "epoch": 0.5373588306531106, "percentage": 53.74, "elapsed_time": "7:12:40", "remaining_time": "6:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2386, "total_steps": 4438, "loss": 0.1402, "learning_rate": 2.3957079368201293e-06, "epoch": 0.537584138338919, "percentage": 53.76, "elapsed_time": "7:12:51", "remaining_time": "6:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2387, "total_steps": 4438, "loss": 0.1334, "learning_rate": 2.393846688778861e-06, "epoch": 0.5378094460247275, "percentage": 53.79, "elapsed_time": "7:13:02", "remaining_time": "6:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2388, "total_steps": 4438, "loss": 0.1606, "learning_rate": 2.39198549968057e-06, "epoch": 0.538034753710536, "percentage": 53.81, "elapsed_time": "7:13:13", "remaining_time": "6:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2389, "total_steps": 4438, "loss": 0.1479, "learning_rate": 2.390124370558705e-06, "epoch": 0.5382600613963444, "percentage": 53.83, "elapsed_time": "7:13:23", "remaining_time": "6:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 4438, "loss": 0.1564, "learning_rate": 2.3882633024466813e-06, "epoch": 0.5384853690821528, "percentage": 53.85, "elapsed_time": "7:13:33", "remaining_time": "6:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2391, "total_steps": 4438, "loss": 0.1431, "learning_rate": 2.386402296377881e-06, "epoch": 0.5387106767679612, "percentage": 53.88, "elapsed_time": "7:13:44", "remaining_time": "6:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2392, "total_steps": 4438, "loss": 0.1346, "learning_rate": 2.3845413533856517e-06, "epoch": 0.5389359844537697, "percentage": 53.9, "elapsed_time": "7:13:53", "remaining_time": "6:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2393, "total_steps": 4438, "loss": 0.1578, "learning_rate": 2.3826804745033046e-06, "epoch": 0.5391612921395781, "percentage": 53.92, "elapsed_time": "7:14:04", "remaining_time": "6:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2394, "total_steps": 4438, "loss": 0.1457, "learning_rate": 2.3808196607641176e-06, "epoch": 0.5393865998253865, "percentage": 53.94, "elapsed_time": "7:14:16", "remaining_time": "6:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2395, "total_steps": 4438, "loss": 0.1528, "learning_rate": 2.3789589132013304e-06, "epoch": 0.5396119075111949, "percentage": 53.97, "elapsed_time": "7:14:28", "remaining_time": "6:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2396, "total_steps": 4438, "loss": 0.1524, "learning_rate": 2.3770982328481464e-06, "epoch": 0.5398372151970035, "percentage": 53.99, "elapsed_time": "7:14:38", "remaining_time": "6:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2397, "total_steps": 4438, "loss": 0.1553, "learning_rate": 2.3752376207377333e-06, "epoch": 0.5400625228828119, "percentage": 54.01, "elapsed_time": "7:14:50", "remaining_time": "6:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2398, "total_steps": 4438, "loss": 0.1525, "learning_rate": 2.3733770779032185e-06, "epoch": 0.5402878305686203, "percentage": 54.03, "elapsed_time": "7:15:00", "remaining_time": "6:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2399, "total_steps": 4438, "loss": 0.1555, "learning_rate": 2.371516605377693e-06, "epoch": 0.5405131382544287, "percentage": 54.06, "elapsed_time": "7:15:10", "remaining_time": "6:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.3696562041942076e-06, "epoch": 0.5407384459402371, "percentage": 54.08, "elapsed_time": "7:15:21", "remaining_time": "6:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2401, "total_steps": 4438, "loss": 0.1442, "learning_rate": 2.367795875385773e-06, "epoch": 0.5409637536260455, "percentage": 54.1, "elapsed_time": "7:15:33", "remaining_time": "6:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2402, "total_steps": 4438, "loss": 0.13, "learning_rate": 2.3659356199853617e-06, "epoch": 0.541189061311854, "percentage": 54.12, "elapsed_time": "7:15:44", "remaining_time": "6:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2403, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.3640754390259026e-06, "epoch": 0.5414143689976625, "percentage": 54.15, "elapsed_time": "7:15:56", "remaining_time": "6:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2404, "total_steps": 4438, "loss": 0.1483, "learning_rate": 2.362215333540287e-06, "epoch": 0.5416396766834709, "percentage": 54.17, "elapsed_time": "7:16:08", "remaining_time": "6:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2405, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.36035530456136e-06, "epoch": 0.5418649843692793, "percentage": 54.19, "elapsed_time": "7:16:19", "remaining_time": "6:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2406, "total_steps": 4438, "loss": 0.1415, "learning_rate": 2.3584953531219278e-06, "epoch": 0.5420902920550877, "percentage": 54.21, "elapsed_time": "7:16:28", "remaining_time": "6:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2407, "total_steps": 4438, "loss": 0.16, "learning_rate": 2.356635480254751e-06, "epoch": 0.5423155997408962, "percentage": 54.24, "elapsed_time": "7:16:39", "remaining_time": "6:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2408, "total_steps": 4438, "loss": 0.1455, "learning_rate": 2.3547756869925485e-06, "epoch": 0.5425409074267046, "percentage": 54.26, "elapsed_time": "7:16:52", "remaining_time": "6:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2409, "total_steps": 4438, "loss": 0.1518, "learning_rate": 2.3529159743679936e-06, "epoch": 0.542766215112513, "percentage": 54.28, "elapsed_time": "7:17:02", "remaining_time": "6:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 4438, "loss": 0.1407, "learning_rate": 2.3510563434137175e-06, "epoch": 0.5429915227983214, "percentage": 54.3, "elapsed_time": "7:17:12", "remaining_time": "6:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2411, "total_steps": 4438, "loss": 0.1331, "learning_rate": 2.3491967951623006e-06, "epoch": 0.5432168304841299, "percentage": 54.33, "elapsed_time": "7:17:23", "remaining_time": "6:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2412, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.347337330646282e-06, "epoch": 0.5434421381699384, "percentage": 54.35, "elapsed_time": "7:17:35", "remaining_time": "6:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2413, "total_steps": 4438, "loss": 0.138, "learning_rate": 2.3454779508981536e-06, "epoch": 0.5436674458557468, "percentage": 54.37, "elapsed_time": "7:17:46", "remaining_time": "6:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2414, "total_steps": 4438, "loss": 0.1491, "learning_rate": 2.3436186569503598e-06, "epoch": 0.5438927535415552, "percentage": 54.39, "elapsed_time": "7:17:56", "remaining_time": "6:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2415, "total_steps": 4438, "loss": 0.1453, "learning_rate": 2.341759449835297e-06, "epoch": 0.5441180612273636, "percentage": 54.42, "elapsed_time": "7:18:06", "remaining_time": "6:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2416, "total_steps": 4438, "loss": 0.1449, "learning_rate": 2.339900330585313e-06, "epoch": 0.544343368913172, "percentage": 54.44, "elapsed_time": "7:18:17", "remaining_time": "6:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2417, "total_steps": 4438, "loss": 0.1324, "learning_rate": 2.338041300232708e-06, "epoch": 0.5445686765989805, "percentage": 54.46, "elapsed_time": "7:18:26", "remaining_time": "6:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2418, "total_steps": 4438, "loss": 0.1413, "learning_rate": 2.3361823598097316e-06, "epoch": 0.5447939842847889, "percentage": 54.48, "elapsed_time": "7:18:36", "remaining_time": "6:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2419, "total_steps": 4438, "loss": 0.1516, "learning_rate": 2.334323510348585e-06, "epoch": 0.5450192919705974, "percentage": 54.51, "elapsed_time": "7:18:45", "remaining_time": "6:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 4438, "loss": 0.1519, "learning_rate": 2.332464752881418e-06, "epoch": 0.5452445996564058, "percentage": 54.53, "elapsed_time": "7:18:56", "remaining_time": "6:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2421, "total_steps": 4438, "loss": 0.1379, "learning_rate": 2.330606088440329e-06, "epoch": 0.5454699073422142, "percentage": 54.55, "elapsed_time": "7:19:06", "remaining_time": "6:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2422, "total_steps": 4438, "loss": 0.1473, "learning_rate": 2.3287475180573653e-06, "epoch": 0.5456952150280227, "percentage": 54.57, "elapsed_time": "7:19:15", "remaining_time": "6:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2423, "total_steps": 4438, "loss": 0.1279, "learning_rate": 2.3268890427645213e-06, "epoch": 0.5459205227138311, "percentage": 54.6, "elapsed_time": "7:19:26", "remaining_time": "6:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2424, "total_steps": 4438, "loss": 0.1362, "learning_rate": 2.3250306635937385e-06, "epoch": 0.5461458303996395, "percentage": 54.62, "elapsed_time": "7:19:37", "remaining_time": "6:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2425, "total_steps": 4438, "loss": 0.1443, "learning_rate": 2.323172381576907e-06, "epoch": 0.5463711380854479, "percentage": 54.64, "elapsed_time": "7:19:48", "remaining_time": "6:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2426, "total_steps": 4438, "loss": 0.1358, "learning_rate": 2.3213141977458615e-06, "epoch": 0.5465964457712563, "percentage": 54.66, "elapsed_time": "7:19:57", "remaining_time": "6:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2427, "total_steps": 4438, "loss": 0.1494, "learning_rate": 2.3194561131323823e-06, "epoch": 0.5468217534570649, "percentage": 54.69, "elapsed_time": "7:20:08", "remaining_time": "6:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2428, "total_steps": 4438, "loss": 0.1551, "learning_rate": 2.3175981287681924e-06, "epoch": 0.5470470611428733, "percentage": 54.71, "elapsed_time": "7:20:20", "remaining_time": "6:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2429, "total_steps": 4438, "loss": 0.1498, "learning_rate": 2.3157402456849632e-06, "epoch": 0.5472723688286817, "percentage": 54.73, "elapsed_time": "7:20:30", "remaining_time": "6:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 4438, "loss": 0.1497, "learning_rate": 2.3138824649143076e-06, "epoch": 0.5474976765144901, "percentage": 54.75, "elapsed_time": "7:20:41", "remaining_time": "6:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2431, "total_steps": 4438, "loss": 0.1449, "learning_rate": 2.312024787487782e-06, "epoch": 0.5477229842002985, "percentage": 54.78, "elapsed_time": "7:20:50", "remaining_time": "6:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2432, "total_steps": 4438, "loss": 0.145, "learning_rate": 2.310167214436885e-06, "epoch": 0.5479482918861069, "percentage": 54.8, "elapsed_time": "7:21:02", "remaining_time": "6:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2433, "total_steps": 4438, "loss": 0.1484, "learning_rate": 2.3083097467930583e-06, "epoch": 0.5481735995719154, "percentage": 54.82, "elapsed_time": "7:21:12", "remaining_time": "6:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2434, "total_steps": 4438, "loss": 0.1395, "learning_rate": 2.306452385587683e-06, "epoch": 0.5483989072577238, "percentage": 54.84, "elapsed_time": "7:21:23", "remaining_time": "6:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2435, "total_steps": 4438, "loss": 0.1436, "learning_rate": 2.304595131852085e-06, "epoch": 0.5486242149435323, "percentage": 54.87, "elapsed_time": "7:21:33", "remaining_time": "6:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2436, "total_steps": 4438, "loss": 0.1492, "learning_rate": 2.3027379866175263e-06, "epoch": 0.5488495226293407, "percentage": 54.89, "elapsed_time": "7:21:44", "remaining_time": "6:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2437, "total_steps": 4438, "loss": 0.142, "learning_rate": 2.300880950915211e-06, "epoch": 0.5490748303151491, "percentage": 54.91, "elapsed_time": "7:21:54", "remaining_time": "6:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2438, "total_steps": 4438, "loss": 0.1469, "learning_rate": 2.2990240257762817e-06, "epoch": 0.5493001380009576, "percentage": 54.93, "elapsed_time": "7:22:05", "remaining_time": "6:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2439, "total_steps": 4438, "loss": 0.1207, "learning_rate": 2.2971672122318196e-06, "epoch": 0.549525445686766, "percentage": 54.96, "elapsed_time": "7:22:14", "remaining_time": "6:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 4438, "loss": 0.1402, "learning_rate": 2.295310511312844e-06, "epoch": 0.5497507533725744, "percentage": 54.98, "elapsed_time": "7:22:25", "remaining_time": "6:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2441, "total_steps": 4438, "loss": 0.1427, "learning_rate": 2.293453924050312e-06, "epoch": 0.5499760610583828, "percentage": 55.0, "elapsed_time": "7:22:36", "remaining_time": "6:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2442, "total_steps": 4438, "loss": 0.1525, "learning_rate": 2.2915974514751173e-06, "epoch": 0.5502013687441912, "percentage": 55.02, "elapsed_time": "7:22:46", "remaining_time": "6:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2443, "total_steps": 4438, "loss": 0.1499, "learning_rate": 2.2897410946180897e-06, "epoch": 0.5504266764299998, "percentage": 55.05, "elapsed_time": "7:22:57", "remaining_time": "6:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2444, "total_steps": 4438, "loss": 0.1393, "learning_rate": 2.287884854509995e-06, "epoch": 0.5506519841158082, "percentage": 55.07, "elapsed_time": "7:23:07", "remaining_time": "6:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2445, "total_steps": 4438, "loss": 0.1509, "learning_rate": 2.286028732181535e-06, "epoch": 0.5508772918016166, "percentage": 55.09, "elapsed_time": "7:23:18", "remaining_time": "6:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2446, "total_steps": 4438, "loss": 0.1435, "learning_rate": 2.2841727286633444e-06, "epoch": 0.551102599487425, "percentage": 55.11, "elapsed_time": "7:23:30", "remaining_time": "6:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2447, "total_steps": 4438, "loss": 0.139, "learning_rate": 2.282316844985992e-06, "epoch": 0.5513279071732334, "percentage": 55.14, "elapsed_time": "7:23:41", "remaining_time": "6:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2448, "total_steps": 4438, "loss": 0.1464, "learning_rate": 2.280461082179982e-06, "epoch": 0.5515532148590419, "percentage": 55.16, "elapsed_time": "7:23:52", "remaining_time": "6:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2449, "total_steps": 4438, "loss": 0.1553, "learning_rate": 2.27860544127575e-06, "epoch": 0.5517785225448503, "percentage": 55.18, "elapsed_time": "7:24:02", "remaining_time": "6:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 4438, "loss": 0.1447, "learning_rate": 2.2767499233036635e-06, "epoch": 0.5520038302306588, "percentage": 55.21, "elapsed_time": "7:24:13", "remaining_time": "6:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2451, "total_steps": 4438, "loss": 0.1398, "learning_rate": 2.2748945292940237e-06, "epoch": 0.5522291379164672, "percentage": 55.23, "elapsed_time": "7:24:23", "remaining_time": "6:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2452, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.2730392602770617e-06, "epoch": 0.5524544456022756, "percentage": 55.25, "elapsed_time": "7:24:33", "remaining_time": "6:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2453, "total_steps": 4438, "loss": 0.1368, "learning_rate": 2.271184117282938e-06, "epoch": 0.552679753288084, "percentage": 55.27, "elapsed_time": "7:24:43", "remaining_time": "5:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2454, "total_steps": 4438, "loss": 0.1505, "learning_rate": 2.269329101341745e-06, "epoch": 0.5529050609738925, "percentage": 55.3, "elapsed_time": "7:24:54", "remaining_time": "5:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2455, "total_steps": 4438, "loss": 0.1307, "learning_rate": 2.267474213483505e-06, "epoch": 0.5531303686597009, "percentage": 55.32, "elapsed_time": "7:25:05", "remaining_time": "5:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2456, "total_steps": 4438, "loss": 0.1472, "learning_rate": 2.265619454738166e-06, "epoch": 0.5533556763455093, "percentage": 55.34, "elapsed_time": "7:25:16", "remaining_time": "5:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2457, "total_steps": 4438, "loss": 0.15, "learning_rate": 2.2637648261356078e-06, "epoch": 0.5535809840313177, "percentage": 55.36, "elapsed_time": "7:25:27", "remaining_time": "5:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2458, "total_steps": 4438, "loss": 0.1429, "learning_rate": 2.2619103287056366e-06, "epoch": 0.5538062917171263, "percentage": 55.39, "elapsed_time": "7:25:40", "remaining_time": "5:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2459, "total_steps": 4438, "loss": 0.1504, "learning_rate": 2.260055963477985e-06, "epoch": 0.5540315994029347, "percentage": 55.41, "elapsed_time": "7:25:50", "remaining_time": "5:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 4438, "loss": 0.1503, "learning_rate": 2.2582017314823135e-06, "epoch": 0.5542569070887431, "percentage": 55.43, "elapsed_time": "7:26:00", "remaining_time": "5:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2461, "total_steps": 4438, "loss": 0.1479, "learning_rate": 2.2563476337482073e-06, "epoch": 0.5544822147745515, "percentage": 55.45, "elapsed_time": "7:26:10", "remaining_time": "5:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2462, "total_steps": 4438, "loss": 0.1456, "learning_rate": 2.254493671305179e-06, "epoch": 0.5547075224603599, "percentage": 55.48, "elapsed_time": "7:26:20", "remaining_time": "5:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2463, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.2526398451826638e-06, "epoch": 0.5549328301461683, "percentage": 55.5, "elapsed_time": "7:26:32", "remaining_time": "5:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2464, "total_steps": 4438, "loss": 0.1466, "learning_rate": 2.250786156410022e-06, "epoch": 0.5551581378319768, "percentage": 55.52, "elapsed_time": "7:26:42", "remaining_time": "5:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2465, "total_steps": 4438, "loss": 0.1549, "learning_rate": 2.2489326060165384e-06, "epoch": 0.5553834455177852, "percentage": 55.54, "elapsed_time": "7:26:53", "remaining_time": "5:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2466, "total_steps": 4438, "loss": 0.1488, "learning_rate": 2.24707919503142e-06, "epoch": 0.5556087532035937, "percentage": 55.57, "elapsed_time": "7:27:04", "remaining_time": "5:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2467, "total_steps": 4438, "loss": 0.1326, "learning_rate": 2.2452259244837974e-06, "epoch": 0.5558340608894021, "percentage": 55.59, "elapsed_time": "7:27:14", "remaining_time": "5:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2468, "total_steps": 4438, "loss": 0.1345, "learning_rate": 2.2433727954027227e-06, "epoch": 0.5560593685752105, "percentage": 55.61, "elapsed_time": "7:27:24", "remaining_time": "5:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2469, "total_steps": 4438, "loss": 0.1466, "learning_rate": 2.24151980881717e-06, "epoch": 0.556284676261019, "percentage": 55.63, "elapsed_time": "7:27:36", "remaining_time": "5:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 4438, "loss": 0.1342, "learning_rate": 2.239666965756032e-06, "epoch": 0.5565099839468274, "percentage": 55.66, "elapsed_time": "7:27:47", "remaining_time": "5:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2471, "total_steps": 4438, "loss": 0.1376, "learning_rate": 2.237814267248124e-06, "epoch": 0.5567352916326358, "percentage": 55.68, "elapsed_time": "7:27:57", "remaining_time": "5:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2472, "total_steps": 4438, "loss": 0.1477, "learning_rate": 2.2359617143221805e-06, "epoch": 0.5569605993184442, "percentage": 55.7, "elapsed_time": "7:28:08", "remaining_time": "5:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2473, "total_steps": 4438, "loss": 0.1382, "learning_rate": 2.234109308006856e-06, "epoch": 0.5571859070042526, "percentage": 55.72, "elapsed_time": "7:28:18", "remaining_time": "5:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2474, "total_steps": 4438, "loss": 0.1309, "learning_rate": 2.232257049330722e-06, "epoch": 0.5574112146900612, "percentage": 55.75, "elapsed_time": "7:28:29", "remaining_time": "5:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2475, "total_steps": 4438, "loss": 0.143, "learning_rate": 2.2304049393222686e-06, "epoch": 0.5576365223758696, "percentage": 55.77, "elapsed_time": "7:28:40", "remaining_time": "5:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2476, "total_steps": 4438, "loss": 0.1401, "learning_rate": 2.2285529790099034e-06, "epoch": 0.557861830061678, "percentage": 55.79, "elapsed_time": "7:28:50", "remaining_time": "5:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2477, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.2267011694219513e-06, "epoch": 0.5580871377474864, "percentage": 55.81, "elapsed_time": "7:29:02", "remaining_time": "5:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2478, "total_steps": 4438, "loss": 0.138, "learning_rate": 2.224849511586652e-06, "epoch": 0.5583124454332948, "percentage": 55.84, "elapsed_time": "7:29:13", "remaining_time": "5:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2479, "total_steps": 4438, "loss": 0.1294, "learning_rate": 2.2229980065321636e-06, "epoch": 0.5585377531191033, "percentage": 55.86, "elapsed_time": "7:29:23", "remaining_time": "5:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 4438, "loss": 0.1561, "learning_rate": 2.221146655286558e-06, "epoch": 0.5587630608049117, "percentage": 55.88, "elapsed_time": "7:29:34", "remaining_time": "5:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2481, "total_steps": 4438, "loss": 0.1476, "learning_rate": 2.2192954588778195e-06, "epoch": 0.5589883684907201, "percentage": 55.9, "elapsed_time": "7:29:44", "remaining_time": "5:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2482, "total_steps": 4438, "loss": 0.1479, "learning_rate": 2.21744441833385e-06, "epoch": 0.5592136761765286, "percentage": 55.93, "elapsed_time": "7:29:55", "remaining_time": "5:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2483, "total_steps": 4438, "loss": 0.1538, "learning_rate": 2.2155935346824634e-06, "epoch": 0.559438983862337, "percentage": 55.95, "elapsed_time": "7:30:07", "remaining_time": "5:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2484, "total_steps": 4438, "loss": 0.1436, "learning_rate": 2.2137428089513857e-06, "epoch": 0.5596642915481455, "percentage": 55.97, "elapsed_time": "7:30:16", "remaining_time": "5:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2485, "total_steps": 4438, "loss": 0.155, "learning_rate": 2.2118922421682563e-06, "epoch": 0.5598895992339539, "percentage": 55.99, "elapsed_time": "7:30:27", "remaining_time": "5:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2486, "total_steps": 4438, "loss": 0.151, "learning_rate": 2.2100418353606262e-06, "epoch": 0.5601149069197623, "percentage": 56.02, "elapsed_time": "7:30:37", "remaining_time": "5:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2487, "total_steps": 4438, "loss": 0.1326, "learning_rate": 2.208191589555956e-06, "epoch": 0.5603402146055707, "percentage": 56.04, "elapsed_time": "7:30:48", "remaining_time": "5:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2488, "total_steps": 4438, "loss": 0.1438, "learning_rate": 2.20634150578162e-06, "epoch": 0.5605655222913791, "percentage": 56.06, "elapsed_time": "7:30:59", "remaining_time": "5:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2489, "total_steps": 4438, "loss": 0.139, "learning_rate": 2.2044915850649e-06, "epoch": 0.5607908299771875, "percentage": 56.08, "elapsed_time": "7:31:10", "remaining_time": "5:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 4438, "loss": 0.1467, "learning_rate": 2.202641828432988e-06, "epoch": 0.5610161376629961, "percentage": 56.11, "elapsed_time": "7:31:20", "remaining_time": "5:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2491, "total_steps": 4438, "loss": 0.1524, "learning_rate": 2.2007922369129854e-06, "epoch": 0.5612414453488045, "percentage": 56.13, "elapsed_time": "7:31:31", "remaining_time": "5:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2492, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.1989428115319005e-06, "epoch": 0.5614667530346129, "percentage": 56.15, "elapsed_time": "7:31:40", "remaining_time": "5:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2493, "total_steps": 4438, "loss": 0.145, "learning_rate": 2.1970935533166505e-06, "epoch": 0.5616920607204213, "percentage": 56.17, "elapsed_time": "7:31:53", "remaining_time": "5:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2494, "total_steps": 4438, "loss": 0.1402, "learning_rate": 2.19524446329406e-06, "epoch": 0.5619173684062297, "percentage": 56.2, "elapsed_time": "7:32:02", "remaining_time": "5:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2495, "total_steps": 4438, "loss": 0.1549, "learning_rate": 2.1933955424908596e-06, "epoch": 0.5621426760920382, "percentage": 56.22, "elapsed_time": "7:32:14", "remaining_time": "5:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2496, "total_steps": 4438, "loss": 0.1262, "learning_rate": 2.1915467919336862e-06, "epoch": 0.5623679837778466, "percentage": 56.24, "elapsed_time": "7:32:25", "remaining_time": "5:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2497, "total_steps": 4438, "loss": 0.1402, "learning_rate": 2.1896982126490825e-06, "epoch": 0.562593291463655, "percentage": 56.26, "elapsed_time": "7:32:35", "remaining_time": "5:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2498, "total_steps": 4438, "loss": 0.1517, "learning_rate": 2.1878498056634946e-06, "epoch": 0.5628185991494635, "percentage": 56.29, "elapsed_time": "7:32:46", "remaining_time": "5:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2499, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.1860015720032747e-06, "epoch": 0.563043906835272, "percentage": 56.31, "elapsed_time": "7:32:56", "remaining_time": "5:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 4438, "loss": 0.1318, "learning_rate": 2.1841535126946777e-06, "epoch": 0.5632692145210804, "percentage": 56.33, "elapsed_time": "7:33:07", "remaining_time": "5:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 4438, "eval_loss": 0.1443219631910324, "epoch": 0.5632692145210804, "percentage": 56.33, "elapsed_time": "7:35:10", "remaining_time": "5:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2501, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.1823056287638623e-06, "epoch": 0.5634945222068888, "percentage": 56.35, "elapsed_time": "7:35:20", "remaining_time": "5:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2502, "total_steps": 4438, "loss": 0.1425, "learning_rate": 2.180457921236889e-06, "epoch": 0.5637198298926972, "percentage": 56.38, "elapsed_time": "7:35:33", "remaining_time": "5:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2503, "total_steps": 4438, "loss": 0.1399, "learning_rate": 2.1786103911397218e-06, "epoch": 0.5639451375785056, "percentage": 56.4, "elapsed_time": "7:35:42", "remaining_time": "5:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2504, "total_steps": 4438, "loss": 0.1396, "learning_rate": 2.176763039498225e-06, "epoch": 0.564170445264314, "percentage": 56.42, "elapsed_time": "7:35:54", "remaining_time": "5:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2505, "total_steps": 4438, "loss": 0.1425, "learning_rate": 2.174915867338164e-06, "epoch": 0.5643957529501226, "percentage": 56.44, "elapsed_time": "7:36:04", "remaining_time": "5:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2506, "total_steps": 4438, "loss": 0.1406, "learning_rate": 2.1730688756852046e-06, "epoch": 0.564621060635931, "percentage": 56.47, "elapsed_time": "7:36:17", "remaining_time": "5:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2507, "total_steps": 4438, "loss": 0.1551, "learning_rate": 2.171222065564913e-06, "epoch": 0.5648463683217394, "percentage": 56.49, "elapsed_time": "7:36:28", "remaining_time": "5:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2508, "total_steps": 4438, "loss": 0.145, "learning_rate": 2.1693754380027533e-06, "epoch": 0.5650716760075478, "percentage": 56.51, "elapsed_time": "7:36:38", "remaining_time": "5:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2509, "total_steps": 4438, "loss": 0.1359, "learning_rate": 2.1675289940240883e-06, "epoch": 0.5652969836933562, "percentage": 56.53, "elapsed_time": "7:36:48", "remaining_time": "5:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 4438, "loss": 0.1217, "learning_rate": 2.165682734654181e-06, "epoch": 0.5655222913791647, "percentage": 56.56, "elapsed_time": "7:36:59", "remaining_time": "5:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2511, "total_steps": 4438, "loss": 0.1487, "learning_rate": 2.16383666091819e-06, "epoch": 0.5657475990649731, "percentage": 56.58, "elapsed_time": "7:37:10", "remaining_time": "5:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2512, "total_steps": 4438, "loss": 0.1445, "learning_rate": 2.161990773841171e-06, "epoch": 0.5659729067507815, "percentage": 56.6, "elapsed_time": "7:37:22", "remaining_time": "5:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2513, "total_steps": 4438, "loss": 0.1401, "learning_rate": 2.1601450744480763e-06, "epoch": 0.56619821443659, "percentage": 56.62, "elapsed_time": "7:37:31", "remaining_time": "5:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2514, "total_steps": 4438, "loss": 0.1473, "learning_rate": 2.1582995637637543e-06, "epoch": 0.5664235221223984, "percentage": 56.65, "elapsed_time": "7:37:41", "remaining_time": "5:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2515, "total_steps": 4438, "loss": 0.1366, "learning_rate": 2.156454242812948e-06, "epoch": 0.5666488298082069, "percentage": 56.67, "elapsed_time": "7:37:53", "remaining_time": "5:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2516, "total_steps": 4438, "loss": 0.1543, "learning_rate": 2.1546091126202955e-06, "epoch": 0.5668741374940153, "percentage": 56.69, "elapsed_time": "7:38:05", "remaining_time": "5:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2517, "total_steps": 4438, "loss": 0.133, "learning_rate": 2.1527641742103282e-06, "epoch": 0.5670994451798237, "percentage": 56.71, "elapsed_time": "7:38:14", "remaining_time": "5:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2518, "total_steps": 4438, "loss": 0.1418, "learning_rate": 2.150919428607472e-06, "epoch": 0.5673247528656321, "percentage": 56.74, "elapsed_time": "7:38:26", "remaining_time": "5:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2519, "total_steps": 4438, "loss": 0.1484, "learning_rate": 2.149074876836045e-06, "epoch": 0.5675500605514405, "percentage": 56.76, "elapsed_time": "7:38:37", "remaining_time": "5:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 4438, "loss": 0.156, "learning_rate": 2.147230519920259e-06, "epoch": 0.567775368237249, "percentage": 56.78, "elapsed_time": "7:38:49", "remaining_time": "5:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2521, "total_steps": 4438, "loss": 0.1373, "learning_rate": 2.1453863588842165e-06, "epoch": 0.5680006759230575, "percentage": 56.8, "elapsed_time": "7:38:59", "remaining_time": "5:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2522, "total_steps": 4438, "loss": 0.1469, "learning_rate": 2.143542394751911e-06, "epoch": 0.5682259836088659, "percentage": 56.83, "elapsed_time": "7:39:09", "remaining_time": "5:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2523, "total_steps": 4438, "loss": 0.1436, "learning_rate": 2.1416986285472268e-06, "epoch": 0.5684512912946743, "percentage": 56.85, "elapsed_time": "7:39:20", "remaining_time": "5:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2524, "total_steps": 4438, "loss": 0.1439, "learning_rate": 2.139855061293939e-06, "epoch": 0.5686765989804827, "percentage": 56.87, "elapsed_time": "7:39:29", "remaining_time": "5:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2525, "total_steps": 4438, "loss": 0.147, "learning_rate": 2.1380116940157107e-06, "epoch": 0.5689019066662911, "percentage": 56.89, "elapsed_time": "7:39:40", "remaining_time": "5:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2526, "total_steps": 4438, "loss": 0.1506, "learning_rate": 2.1361685277360973e-06, "epoch": 0.5691272143520996, "percentage": 56.92, "elapsed_time": "7:39:50", "remaining_time": "5:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2527, "total_steps": 4438, "loss": 0.1451, "learning_rate": 2.1343255634785386e-06, "epoch": 0.569352522037908, "percentage": 56.94, "elapsed_time": "7:40:00", "remaining_time": "5:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2528, "total_steps": 4438, "loss": 0.1164, "learning_rate": 2.132482802266364e-06, "epoch": 0.5695778297237164, "percentage": 56.96, "elapsed_time": "7:40:10", "remaining_time": "5:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2529, "total_steps": 4438, "loss": 0.1406, "learning_rate": 2.1306402451227907e-06, "epoch": 0.5698031374095249, "percentage": 56.99, "elapsed_time": "7:40:21", "remaining_time": "5:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.128797893070922e-06, "epoch": 0.5700284450953333, "percentage": 57.01, "elapsed_time": "7:40:30", "remaining_time": "5:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2531, "total_steps": 4438, "loss": 0.1455, "learning_rate": 2.1269557471337467e-06, "epoch": 0.5702537527811418, "percentage": 57.03, "elapsed_time": "7:40:41", "remaining_time": "5:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2532, "total_steps": 4438, "loss": 0.1499, "learning_rate": 2.1251138083341404e-06, "epoch": 0.5704790604669502, "percentage": 57.05, "elapsed_time": "7:40:51", "remaining_time": "5:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2533, "total_steps": 4438, "loss": 0.1415, "learning_rate": 2.123272077694864e-06, "epoch": 0.5707043681527586, "percentage": 57.08, "elapsed_time": "7:41:01", "remaining_time": "5:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2534, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.1214305562385592e-06, "epoch": 0.570929675838567, "percentage": 57.1, "elapsed_time": "7:41:12", "remaining_time": "5:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2535, "total_steps": 4438, "loss": 0.1359, "learning_rate": 2.1195892449877556e-06, "epoch": 0.5711549835243754, "percentage": 57.12, "elapsed_time": "7:41:24", "remaining_time": "5:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2536, "total_steps": 4438, "loss": 0.147, "learning_rate": 2.117748144964865e-06, "epoch": 0.5713802912101839, "percentage": 57.14, "elapsed_time": "7:41:36", "remaining_time": "5:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2537, "total_steps": 4438, "loss": 0.1416, "learning_rate": 2.115907257192182e-06, "epoch": 0.5716055988959924, "percentage": 57.17, "elapsed_time": "7:41:47", "remaining_time": "5:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2538, "total_steps": 4438, "loss": 0.1305, "learning_rate": 2.1140665826918823e-06, "epoch": 0.5718309065818008, "percentage": 57.19, "elapsed_time": "7:41:58", "remaining_time": "5:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2539, "total_steps": 4438, "loss": 0.152, "learning_rate": 2.1122261224860237e-06, "epoch": 0.5720562142676092, "percentage": 57.21, "elapsed_time": "7:42:08", "remaining_time": "5:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 4438, "loss": 0.1453, "learning_rate": 2.1103858775965455e-06, "epoch": 0.5722815219534176, "percentage": 57.23, "elapsed_time": "7:42:19", "remaining_time": "5:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2541, "total_steps": 4438, "loss": 0.1452, "learning_rate": 2.1085458490452663e-06, "epoch": 0.5725068296392261, "percentage": 57.26, "elapsed_time": "7:42:28", "remaining_time": "5:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2542, "total_steps": 4438, "loss": 0.1294, "learning_rate": 2.106706037853887e-06, "epoch": 0.5727321373250345, "percentage": 57.28, "elapsed_time": "7:42:40", "remaining_time": "5:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2543, "total_steps": 4438, "loss": 0.1323, "learning_rate": 2.1048664450439853e-06, "epoch": 0.5729574450108429, "percentage": 57.3, "elapsed_time": "7:42:49", "remaining_time": "5:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2544, "total_steps": 4438, "loss": 0.144, "learning_rate": 2.103027071637018e-06, "epoch": 0.5731827526966513, "percentage": 57.32, "elapsed_time": "7:42:59", "remaining_time": "5:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2545, "total_steps": 4438, "loss": 0.1326, "learning_rate": 2.101187918654321e-06, "epoch": 0.5734080603824598, "percentage": 57.35, "elapsed_time": "7:43:08", "remaining_time": "5:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2546, "total_steps": 4438, "loss": 0.1519, "learning_rate": 2.099348987117108e-06, "epoch": 0.5736333680682683, "percentage": 57.37, "elapsed_time": "7:43:20", "remaining_time": "5:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2547, "total_steps": 4438, "loss": 0.1456, "learning_rate": 2.0975102780464674e-06, "epoch": 0.5738586757540767, "percentage": 57.39, "elapsed_time": "7:43:30", "remaining_time": "5:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2548, "total_steps": 4438, "loss": 0.1466, "learning_rate": 2.095671792463368e-06, "epoch": 0.5740839834398851, "percentage": 57.41, "elapsed_time": "7:43:42", "remaining_time": "5:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2549, "total_steps": 4438, "loss": 0.1462, "learning_rate": 2.0938335313886513e-06, "epoch": 0.5743092911256935, "percentage": 57.44, "elapsed_time": "7:43:52", "remaining_time": "5:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 4438, "loss": 0.1306, "learning_rate": 2.0919954958430357e-06, "epoch": 0.5745345988115019, "percentage": 57.46, "elapsed_time": "7:44:03", "remaining_time": "5:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2551, "total_steps": 4438, "loss": 0.1499, "learning_rate": 2.0901576868471125e-06, "epoch": 0.5747599064973103, "percentage": 57.48, "elapsed_time": "7:44:13", "remaining_time": "5:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2552, "total_steps": 4438, "loss": 0.1435, "learning_rate": 2.0883201054213493e-06, "epoch": 0.5749852141831189, "percentage": 57.5, "elapsed_time": "7:44:22", "remaining_time": "5:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2553, "total_steps": 4438, "loss": 0.1396, "learning_rate": 2.086482752586087e-06, "epoch": 0.5752105218689273, "percentage": 57.53, "elapsed_time": "7:44:33", "remaining_time": "5:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2554, "total_steps": 4438, "loss": 0.134, "learning_rate": 2.0846456293615384e-06, "epoch": 0.5754358295547357, "percentage": 57.55, "elapsed_time": "7:44:45", "remaining_time": "5:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2555, "total_steps": 4438, "loss": 0.1424, "learning_rate": 2.0828087367677906e-06, "epoch": 0.5756611372405441, "percentage": 57.57, "elapsed_time": "7:44:56", "remaining_time": "5:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2556, "total_steps": 4438, "loss": 0.1521, "learning_rate": 2.0809720758247997e-06, "epoch": 0.5758864449263525, "percentage": 57.59, "elapsed_time": "7:45:06", "remaining_time": "5:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2557, "total_steps": 4438, "loss": 0.1604, "learning_rate": 2.0791356475523967e-06, "epoch": 0.576111752612161, "percentage": 57.62, "elapsed_time": "7:45:16", "remaining_time": "5:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2558, "total_steps": 4438, "loss": 0.1485, "learning_rate": 2.077299452970282e-06, "epoch": 0.5763370602979694, "percentage": 57.64, "elapsed_time": "7:45:28", "remaining_time": "5:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2559, "total_steps": 4438, "loss": 0.1388, "learning_rate": 2.0754634930980245e-06, "epoch": 0.5765623679837778, "percentage": 57.66, "elapsed_time": "7:45:39", "remaining_time": "5:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 4438, "loss": 0.1436, "learning_rate": 2.0736277689550655e-06, "epoch": 0.5767876756695863, "percentage": 57.68, "elapsed_time": "7:45:50", "remaining_time": "5:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2561, "total_steps": 4438, "loss": 0.1475, "learning_rate": 2.0717922815607134e-06, "epoch": 0.5770129833553947, "percentage": 57.71, "elapsed_time": "7:46:00", "remaining_time": "5:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2562, "total_steps": 4438, "loss": 0.1422, "learning_rate": 2.069957031934147e-06, "epoch": 0.5772382910412032, "percentage": 57.73, "elapsed_time": "7:46:11", "remaining_time": "5:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2563, "total_steps": 4438, "loss": 0.1505, "learning_rate": 2.0681220210944106e-06, "epoch": 0.5774635987270116, "percentage": 57.75, "elapsed_time": "7:46:21", "remaining_time": "5:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2564, "total_steps": 4438, "loss": 0.1514, "learning_rate": 2.066287250060418e-06, "epoch": 0.57768890641282, "percentage": 57.77, "elapsed_time": "7:46:32", "remaining_time": "5:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2565, "total_steps": 4438, "loss": 0.1494, "learning_rate": 2.06445271985095e-06, "epoch": 0.5779142140986284, "percentage": 57.8, "elapsed_time": "7:46:44", "remaining_time": "5:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2566, "total_steps": 4438, "loss": 0.1377, "learning_rate": 2.062618431484652e-06, "epoch": 0.5781395217844368, "percentage": 57.82, "elapsed_time": "7:46:54", "remaining_time": "5:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2567, "total_steps": 4438, "loss": 0.1435, "learning_rate": 2.060784385980036e-06, "epoch": 0.5783648294702453, "percentage": 57.84, "elapsed_time": "7:47:04", "remaining_time": "5:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2568, "total_steps": 4438, "loss": 0.1361, "learning_rate": 2.05895058435548e-06, "epoch": 0.5785901371560538, "percentage": 57.86, "elapsed_time": "7:47:13", "remaining_time": "5:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2569, "total_steps": 4438, "loss": 0.1391, "learning_rate": 2.0571170276292233e-06, "epoch": 0.5788154448418622, "percentage": 57.89, "elapsed_time": "7:47:23", "remaining_time": "5:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 4438, "loss": 0.1384, "learning_rate": 2.0552837168193738e-06, "epoch": 0.5790407525276706, "percentage": 57.91, "elapsed_time": "7:47:34", "remaining_time": "5:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2571, "total_steps": 4438, "loss": 0.1378, "learning_rate": 2.0534506529439e-06, "epoch": 0.579266060213479, "percentage": 57.93, "elapsed_time": "7:47:45", "remaining_time": "5:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2572, "total_steps": 4438, "loss": 0.1503, "learning_rate": 2.051617837020633e-06, "epoch": 0.5794913678992875, "percentage": 57.95, "elapsed_time": "7:47:57", "remaining_time": "5:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2573, "total_steps": 4438, "loss": 0.1321, "learning_rate": 2.0497852700672692e-06, "epoch": 0.5797166755850959, "percentage": 57.98, "elapsed_time": "7:48:07", "remaining_time": "5:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2574, "total_steps": 4438, "loss": 0.1541, "learning_rate": 2.047952953101363e-06, "epoch": 0.5799419832709043, "percentage": 58.0, "elapsed_time": "7:48:19", "remaining_time": "5:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2575, "total_steps": 4438, "loss": 0.1344, "learning_rate": 2.0461208871403333e-06, "epoch": 0.5801672909567127, "percentage": 58.02, "elapsed_time": "7:48:30", "remaining_time": "5:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2576, "total_steps": 4438, "loss": 0.1352, "learning_rate": 2.0442890732014563e-06, "epoch": 0.5803925986425212, "percentage": 58.04, "elapsed_time": "7:48:41", "remaining_time": "5:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2577, "total_steps": 4438, "loss": 0.1322, "learning_rate": 2.042457512301871e-06, "epoch": 0.5806179063283297, "percentage": 58.07, "elapsed_time": "7:48:53", "remaining_time": "5:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2578, "total_steps": 4438, "loss": 0.1446, "learning_rate": 2.040626205458574e-06, "epoch": 0.5808432140141381, "percentage": 58.09, "elapsed_time": "7:49:04", "remaining_time": "5:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2579, "total_steps": 4438, "loss": 0.149, "learning_rate": 2.038795153688423e-06, "epoch": 0.5810685216999465, "percentage": 58.11, "elapsed_time": "7:49:16", "remaining_time": "5:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 4438, "loss": 0.1472, "learning_rate": 2.0369643580081326e-06, "epoch": 0.5812938293857549, "percentage": 58.13, "elapsed_time": "7:49:26", "remaining_time": "5:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2581, "total_steps": 4438, "loss": 0.1411, "learning_rate": 2.0351338194342744e-06, "epoch": 0.5815191370715633, "percentage": 58.16, "elapsed_time": "7:49:37", "remaining_time": "5:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2582, "total_steps": 4438, "loss": 0.1372, "learning_rate": 2.0333035389832795e-06, "epoch": 0.5817444447573717, "percentage": 58.18, "elapsed_time": "7:49:47", "remaining_time": "5:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2583, "total_steps": 4438, "loss": 0.1502, "learning_rate": 2.0314735176714336e-06, "epoch": 0.5819697524431802, "percentage": 58.2, "elapsed_time": "7:49:59", "remaining_time": "5:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2584, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.0296437565148786e-06, "epoch": 0.5821950601289887, "percentage": 58.22, "elapsed_time": "7:50:10", "remaining_time": "5:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2585, "total_steps": 4438, "loss": 0.1335, "learning_rate": 2.0278142565296153e-06, "epoch": 0.5824203678147971, "percentage": 58.25, "elapsed_time": "7:50:21", "remaining_time": "5:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2586, "total_steps": 4438, "loss": 0.1482, "learning_rate": 2.025985018731494e-06, "epoch": 0.5826456755006055, "percentage": 58.27, "elapsed_time": "7:50:33", "remaining_time": "5:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2587, "total_steps": 4438, "loss": 0.1424, "learning_rate": 2.0241560441362235e-06, "epoch": 0.582870983186414, "percentage": 58.29, "elapsed_time": "7:50:43", "remaining_time": "5:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2588, "total_steps": 4438, "loss": 0.146, "learning_rate": 2.0223273337593647e-06, "epoch": 0.5830962908722224, "percentage": 58.31, "elapsed_time": "7:50:54", "remaining_time": "5:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2589, "total_steps": 4438, "loss": 0.1524, "learning_rate": 2.020498888616333e-06, "epoch": 0.5833215985580308, "percentage": 58.34, "elapsed_time": "7:51:05", "remaining_time": "5:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 4438, "loss": 0.1433, "learning_rate": 2.0186707097223952e-06, "epoch": 0.5835469062438392, "percentage": 58.36, "elapsed_time": "7:51:15", "remaining_time": "5:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2591, "total_steps": 4438, "loss": 0.1366, "learning_rate": 2.016842798092672e-06, "epoch": 0.5837722139296476, "percentage": 58.38, "elapsed_time": "7:51:26", "remaining_time": "5:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2592, "total_steps": 4438, "loss": 0.1481, "learning_rate": 2.0150151547421333e-06, "epoch": 0.5839975216154561, "percentage": 58.4, "elapsed_time": "7:51:37", "remaining_time": "5:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2593, "total_steps": 4438, "loss": 0.1413, "learning_rate": 2.013187780685602e-06, "epoch": 0.5842228293012646, "percentage": 58.43, "elapsed_time": "7:51:47", "remaining_time": "5:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2594, "total_steps": 4438, "loss": 0.1367, "learning_rate": 2.0113606769377497e-06, "epoch": 0.584448136987073, "percentage": 58.45, "elapsed_time": "7:51:57", "remaining_time": "5:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2595, "total_steps": 4438, "loss": 0.1473, "learning_rate": 2.009533844513101e-06, "epoch": 0.5846734446728814, "percentage": 58.47, "elapsed_time": "7:52:08", "remaining_time": "5:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2596, "total_steps": 4438, "loss": 0.133, "learning_rate": 2.0077072844260267e-06, "epoch": 0.5848987523586898, "percentage": 58.49, "elapsed_time": "7:52:18", "remaining_time": "5:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2597, "total_steps": 4438, "loss": 0.14, "learning_rate": 2.0058809976907475e-06, "epoch": 0.5851240600444982, "percentage": 58.52, "elapsed_time": "7:52:29", "remaining_time": "5:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2598, "total_steps": 4438, "loss": 0.1495, "learning_rate": 2.0040549853213326e-06, "epoch": 0.5853493677303067, "percentage": 58.54, "elapsed_time": "7:52:39", "remaining_time": "5:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2599, "total_steps": 4438, "loss": 0.1406, "learning_rate": 2.0022292483316984e-06, "epoch": 0.5855746754161152, "percentage": 58.56, "elapsed_time": "7:52:50", "remaining_time": "5:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 4438, "loss": 0.1466, "learning_rate": 2.0004037877356085e-06, "epoch": 0.5857999831019236, "percentage": 58.58, "elapsed_time": "7:53:00", "remaining_time": "5:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2601, "total_steps": 4438, "loss": 0.1428, "learning_rate": 1.998578604546674e-06, "epoch": 0.586025290787732, "percentage": 58.61, "elapsed_time": "7:53:11", "remaining_time": "5:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2602, "total_steps": 4438, "loss": 0.1457, "learning_rate": 1.9967536997783495e-06, "epoch": 0.5862505984735404, "percentage": 58.63, "elapsed_time": "7:53:21", "remaining_time": "5:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2603, "total_steps": 4438, "loss": 0.1375, "learning_rate": 1.9949290744439392e-06, "epoch": 0.5864759061593489, "percentage": 58.65, "elapsed_time": "7:53:32", "remaining_time": "5:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2604, "total_steps": 4438, "loss": 0.1475, "learning_rate": 1.9931047295565863e-06, "epoch": 0.5867012138451573, "percentage": 58.68, "elapsed_time": "7:53:44", "remaining_time": "5:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2605, "total_steps": 4438, "loss": 0.1311, "learning_rate": 1.9912806661292838e-06, "epoch": 0.5869265215309657, "percentage": 58.7, "elapsed_time": "7:53:55", "remaining_time": "5:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2606, "total_steps": 4438, "loss": 0.1462, "learning_rate": 1.989456885174865e-06, "epoch": 0.5871518292167741, "percentage": 58.72, "elapsed_time": "7:54:06", "remaining_time": "5:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2607, "total_steps": 4438, "loss": 0.1278, "learning_rate": 1.987633387706008e-06, "epoch": 0.5873771369025826, "percentage": 58.74, "elapsed_time": "7:54:16", "remaining_time": "5:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2608, "total_steps": 4438, "loss": 0.1341, "learning_rate": 1.9858101747352326e-06, "epoch": 0.5876024445883911, "percentage": 58.77, "elapsed_time": "7:54:26", "remaining_time": "5:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2609, "total_steps": 4438, "loss": 0.1415, "learning_rate": 1.9839872472749016e-06, "epoch": 0.5878277522741995, "percentage": 58.79, "elapsed_time": "7:54:36", "remaining_time": "5:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 4438, "loss": 0.123, "learning_rate": 1.9821646063372174e-06, "epoch": 0.5880530599600079, "percentage": 58.81, "elapsed_time": "7:54:47", "remaining_time": "5:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2611, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.9803422529342264e-06, "epoch": 0.5882783676458163, "percentage": 58.83, "elapsed_time": "7:54:57", "remaining_time": "5:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2612, "total_steps": 4438, "loss": 0.1273, "learning_rate": 1.978520188077813e-06, "epoch": 0.5885036753316247, "percentage": 58.86, "elapsed_time": "7:55:08", "remaining_time": "5:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2613, "total_steps": 4438, "loss": 0.1525, "learning_rate": 1.976698412779701e-06, "epoch": 0.5887289830174331, "percentage": 58.88, "elapsed_time": "7:55:20", "remaining_time": "5:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2614, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.9748769280514544e-06, "epoch": 0.5889542907032416, "percentage": 58.9, "elapsed_time": "7:55:29", "remaining_time": "5:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2615, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.973055734904477e-06, "epoch": 0.5891795983890501, "percentage": 58.92, "elapsed_time": "7:55:39", "remaining_time": "5:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2616, "total_steps": 4438, "loss": 0.1366, "learning_rate": 1.971234834350008e-06, "epoch": 0.5894049060748585, "percentage": 58.95, "elapsed_time": "7:55:49", "remaining_time": "5:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2617, "total_steps": 4438, "loss": 0.142, "learning_rate": 1.9694142273991264e-06, "epoch": 0.5896302137606669, "percentage": 58.97, "elapsed_time": "7:56:01", "remaining_time": "5:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2618, "total_steps": 4438, "loss": 0.1442, "learning_rate": 1.967593915062748e-06, "epoch": 0.5898555214464754, "percentage": 58.99, "elapsed_time": "7:56:12", "remaining_time": "5:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2619, "total_steps": 4438, "loss": 0.1457, "learning_rate": 1.9657738983516227e-06, "epoch": 0.5900808291322838, "percentage": 59.01, "elapsed_time": "7:56:22", "remaining_time": "5:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 4438, "loss": 0.1537, "learning_rate": 1.96395417827634e-06, "epoch": 0.5903061368180922, "percentage": 59.04, "elapsed_time": "7:56:33", "remaining_time": "5:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2621, "total_steps": 4438, "loss": 0.1193, "learning_rate": 1.9621347558473216e-06, "epoch": 0.5905314445039006, "percentage": 59.06, "elapsed_time": "7:56:42", "remaining_time": "5:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2622, "total_steps": 4438, "loss": 0.1432, "learning_rate": 1.960315632074824e-06, "epoch": 0.590756752189709, "percentage": 59.08, "elapsed_time": "7:56:55", "remaining_time": "5:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2623, "total_steps": 4438, "loss": 0.1385, "learning_rate": 1.95849680796894e-06, "epoch": 0.5909820598755176, "percentage": 59.1, "elapsed_time": "7:57:07", "remaining_time": "5:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2624, "total_steps": 4438, "loss": 0.1465, "learning_rate": 1.9566782845395945e-06, "epoch": 0.591207367561326, "percentage": 59.13, "elapsed_time": "7:57:18", "remaining_time": "5:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2625, "total_steps": 4438, "loss": 0.1468, "learning_rate": 1.9548600627965454e-06, "epoch": 0.5914326752471344, "percentage": 59.15, "elapsed_time": "7:57:30", "remaining_time": "5:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2626, "total_steps": 4438, "loss": 0.1433, "learning_rate": 1.9530421437493843e-06, "epoch": 0.5916579829329428, "percentage": 59.17, "elapsed_time": "7:57:41", "remaining_time": "5:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2627, "total_steps": 4438, "loss": 0.136, "learning_rate": 1.951224528407534e-06, "epoch": 0.5918832906187512, "percentage": 59.19, "elapsed_time": "7:57:52", "remaining_time": "5:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2628, "total_steps": 4438, "loss": 0.1429, "learning_rate": 1.949407217780247e-06, "epoch": 0.5921085983045596, "percentage": 59.22, "elapsed_time": "7:58:04", "remaining_time": "5:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2629, "total_steps": 4438, "loss": 0.1522, "learning_rate": 1.94759021287661e-06, "epoch": 0.5923339059903681, "percentage": 59.24, "elapsed_time": "7:58:15", "remaining_time": "5:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 4438, "loss": 0.1446, "learning_rate": 1.945773514705537e-06, "epoch": 0.5925592136761765, "percentage": 59.26, "elapsed_time": "7:58:26", "remaining_time": "5:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2631, "total_steps": 4438, "loss": 0.1447, "learning_rate": 1.943957124275773e-06, "epoch": 0.592784521361985, "percentage": 59.28, "elapsed_time": "7:58:38", "remaining_time": "5:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2632, "total_steps": 4438, "loss": 0.1275, "learning_rate": 1.9421410425958915e-06, "epoch": 0.5930098290477934, "percentage": 59.31, "elapsed_time": "7:58:47", "remaining_time": "5:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2633, "total_steps": 4438, "loss": 0.1506, "learning_rate": 1.9403252706742957e-06, "epoch": 0.5932351367336018, "percentage": 59.33, "elapsed_time": "7:58:58", "remaining_time": "5:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2634, "total_steps": 4438, "loss": 0.1351, "learning_rate": 1.938509809519216e-06, "epoch": 0.5934604444194103, "percentage": 59.35, "elapsed_time": "7:59:07", "remaining_time": "5:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2635, "total_steps": 4438, "loss": 0.1388, "learning_rate": 1.9366946601387103e-06, "epoch": 0.5936857521052187, "percentage": 59.37, "elapsed_time": "7:59:20", "remaining_time": "5:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2636, "total_steps": 4438, "loss": 0.1625, "learning_rate": 1.934879823540663e-06, "epoch": 0.5939110597910271, "percentage": 59.4, "elapsed_time": "7:59:30", "remaining_time": "5:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2637, "total_steps": 4438, "loss": 0.1526, "learning_rate": 1.9330653007327852e-06, "epoch": 0.5941363674768355, "percentage": 59.42, "elapsed_time": "7:59:41", "remaining_time": "5:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2638, "total_steps": 4438, "loss": 0.1461, "learning_rate": 1.931251092722615e-06, "epoch": 0.5943616751626439, "percentage": 59.44, "elapsed_time": "7:59:51", "remaining_time": "5:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2639, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.9294372005175125e-06, "epoch": 0.5945869828484525, "percentage": 59.46, "elapsed_time": "8:00:02", "remaining_time": "5:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 4438, "loss": 0.1411, "learning_rate": 1.9276236251246655e-06, "epoch": 0.5948122905342609, "percentage": 59.49, "elapsed_time": "8:00:13", "remaining_time": "5:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2641, "total_steps": 4438, "loss": 0.1361, "learning_rate": 1.9258103675510846e-06, "epoch": 0.5950375982200693, "percentage": 59.51, "elapsed_time": "8:00:24", "remaining_time": "5:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2642, "total_steps": 4438, "loss": 0.1537, "learning_rate": 1.9239974288036044e-06, "epoch": 0.5952629059058777, "percentage": 59.53, "elapsed_time": "8:00:34", "remaining_time": "5:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2643, "total_steps": 4438, "loss": 0.1226, "learning_rate": 1.9221848098888817e-06, "epoch": 0.5954882135916861, "percentage": 59.55, "elapsed_time": "8:00:43", "remaining_time": "5:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2644, "total_steps": 4438, "loss": 0.1327, "learning_rate": 1.920372511813397e-06, "epoch": 0.5957135212774946, "percentage": 59.58, "elapsed_time": "8:00:54", "remaining_time": "5:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2645, "total_steps": 4438, "loss": 0.1424, "learning_rate": 1.9185605355834518e-06, "epoch": 0.595938828963303, "percentage": 59.6, "elapsed_time": "8:01:04", "remaining_time": "5:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2646, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.916748882205168e-06, "epoch": 0.5961641366491115, "percentage": 59.62, "elapsed_time": "8:01:14", "remaining_time": "5:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2647, "total_steps": 4438, "loss": 0.1356, "learning_rate": 1.91493755268449e-06, "epoch": 0.5963894443349199, "percentage": 59.64, "elapsed_time": "8:01:24", "remaining_time": "5:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2648, "total_steps": 4438, "loss": 0.1366, "learning_rate": 1.913126548027181e-06, "epoch": 0.5966147520207283, "percentage": 59.67, "elapsed_time": "8:01:32", "remaining_time": "5:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2649, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.9113158692388253e-06, "epoch": 0.5968400597065368, "percentage": 59.69, "elapsed_time": "8:01:42", "remaining_time": "5:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 4438, "loss": 0.1437, "learning_rate": 1.909505517324825e-06, "epoch": 0.5970653673923452, "percentage": 59.71, "elapsed_time": "8:01:53", "remaining_time": "5:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2651, "total_steps": 4438, "loss": 0.1303, "learning_rate": 1.9076954932904e-06, "epoch": 0.5972906750781536, "percentage": 59.73, "elapsed_time": "8:02:02", "remaining_time": "5:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2652, "total_steps": 4438, "loss": 0.1378, "learning_rate": 1.905885798140591e-06, "epoch": 0.597515982763962, "percentage": 59.76, "elapsed_time": "8:02:12", "remaining_time": "5:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2653, "total_steps": 4438, "loss": 0.1318, "learning_rate": 1.9040764328802523e-06, "epoch": 0.5977412904497704, "percentage": 59.78, "elapsed_time": "8:02:23", "remaining_time": "5:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2654, "total_steps": 4438, "loss": 0.1285, "learning_rate": 1.9022673985140585e-06, "epoch": 0.597966598135579, "percentage": 59.8, "elapsed_time": "8:02:34", "remaining_time": "5:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2655, "total_steps": 4438, "loss": 0.1487, "learning_rate": 1.9004586960464993e-06, "epoch": 0.5981919058213874, "percentage": 59.82, "elapsed_time": "8:02:46", "remaining_time": "5:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2656, "total_steps": 4438, "loss": 0.144, "learning_rate": 1.8986503264818785e-06, "epoch": 0.5984172135071958, "percentage": 59.85, "elapsed_time": "8:02:55", "remaining_time": "5:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2657, "total_steps": 4438, "loss": 0.1454, "learning_rate": 1.8968422908243156e-06, "epoch": 0.5986425211930042, "percentage": 59.87, "elapsed_time": "8:03:07", "remaining_time": "5:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2658, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.895034590077747e-06, "epoch": 0.5988678288788126, "percentage": 59.89, "elapsed_time": "8:03:18", "remaining_time": "5:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2659, "total_steps": 4438, "loss": 0.1525, "learning_rate": 1.8932272252459213e-06, "epoch": 0.599093136564621, "percentage": 59.91, "elapsed_time": "8:03:28", "remaining_time": "5:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 4438, "loss": 0.1492, "learning_rate": 1.8914201973324004e-06, "epoch": 0.5993184442504295, "percentage": 59.94, "elapsed_time": "8:03:38", "remaining_time": "5:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2661, "total_steps": 4438, "loss": 0.1249, "learning_rate": 1.88961350734056e-06, "epoch": 0.5995437519362379, "percentage": 59.96, "elapsed_time": "8:03:49", "remaining_time": "5:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2662, "total_steps": 4438, "loss": 0.1491, "learning_rate": 1.8878071562735873e-06, "epoch": 0.5997690596220464, "percentage": 59.98, "elapsed_time": "8:03:59", "remaining_time": "5:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2663, "total_steps": 4438, "loss": 0.1407, "learning_rate": 1.8860011451344811e-06, "epoch": 0.5999943673078548, "percentage": 60.0, "elapsed_time": "8:04:10", "remaining_time": "5:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2664, "total_steps": 4438, "loss": 0.1463, "learning_rate": 1.8841954749260535e-06, "epoch": 0.6002196749936632, "percentage": 60.03, "elapsed_time": "8:04:21", "remaining_time": "5:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2665, "total_steps": 4438, "loss": 0.1487, "learning_rate": 1.8823901466509253e-06, "epoch": 0.6004449826794717, "percentage": 60.05, "elapsed_time": "8:04:32", "remaining_time": "5:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2666, "total_steps": 4438, "loss": 0.1486, "learning_rate": 1.8805851613115278e-06, "epoch": 0.6006702903652801, "percentage": 60.07, "elapsed_time": "8:04:42", "remaining_time": "5:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2667, "total_steps": 4438, "loss": 0.1306, "learning_rate": 1.878780519910102e-06, "epoch": 0.6008955980510885, "percentage": 60.09, "elapsed_time": "8:04:53", "remaining_time": "5:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2668, "total_steps": 4438, "loss": 0.1296, "learning_rate": 1.8769762234486982e-06, "epoch": 0.6011209057368969, "percentage": 60.12, "elapsed_time": "8:05:03", "remaining_time": "5:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2669, "total_steps": 4438, "loss": 0.1379, "learning_rate": 1.8751722729291747e-06, "epoch": 0.6013462134227053, "percentage": 60.14, "elapsed_time": "8:05:13", "remaining_time": "5:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 4438, "loss": 0.1253, "learning_rate": 1.8733686693531986e-06, "epoch": 0.6015715211085139, "percentage": 60.16, "elapsed_time": "8:05:23", "remaining_time": "5:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2671, "total_steps": 4438, "loss": 0.1326, "learning_rate": 1.8715654137222434e-06, "epoch": 0.6017968287943223, "percentage": 60.18, "elapsed_time": "8:05:36", "remaining_time": "5:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2672, "total_steps": 4438, "loss": 0.1456, "learning_rate": 1.8697625070375893e-06, "epoch": 0.6020221364801307, "percentage": 60.21, "elapsed_time": "8:05:47", "remaining_time": "5:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2673, "total_steps": 4438, "loss": 0.1277, "learning_rate": 1.8679599503003246e-06, "epoch": 0.6022474441659391, "percentage": 60.23, "elapsed_time": "8:05:57", "remaining_time": "5:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2674, "total_steps": 4438, "loss": 0.1371, "learning_rate": 1.8661577445113399e-06, "epoch": 0.6024727518517475, "percentage": 60.25, "elapsed_time": "8:06:07", "remaining_time": "5:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2675, "total_steps": 4438, "loss": 0.1426, "learning_rate": 1.8643558906713344e-06, "epoch": 0.602698059537556, "percentage": 60.27, "elapsed_time": "8:06:18", "remaining_time": "5:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2676, "total_steps": 4438, "loss": 0.1248, "learning_rate": 1.8625543897808094e-06, "epoch": 0.6029233672233644, "percentage": 60.3, "elapsed_time": "8:06:30", "remaining_time": "5:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2677, "total_steps": 4438, "loss": 0.1345, "learning_rate": 1.8607532428400714e-06, "epoch": 0.6031486749091728, "percentage": 60.32, "elapsed_time": "8:06:40", "remaining_time": "5:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2678, "total_steps": 4438, "loss": 0.1523, "learning_rate": 1.8589524508492308e-06, "epoch": 0.6033739825949813, "percentage": 60.34, "elapsed_time": "8:06:50", "remaining_time": "5:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2679, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.8571520148081992e-06, "epoch": 0.6035992902807897, "percentage": 60.37, "elapsed_time": "8:06:59", "remaining_time": "5:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 4438, "loss": 0.1405, "learning_rate": 1.8553519357166927e-06, "epoch": 0.6038245979665982, "percentage": 60.39, "elapsed_time": "8:07:10", "remaining_time": "5:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2681, "total_steps": 4438, "loss": 0.1442, "learning_rate": 1.853552214574228e-06, "epoch": 0.6040499056524066, "percentage": 60.41, "elapsed_time": "8:07:21", "remaining_time": "5:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2682, "total_steps": 4438, "loss": 0.1152, "learning_rate": 1.8517528523801226e-06, "epoch": 0.604275213338215, "percentage": 60.43, "elapsed_time": "8:07:32", "remaining_time": "5:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2683, "total_steps": 4438, "loss": 0.1379, "learning_rate": 1.8499538501334955e-06, "epoch": 0.6045005210240234, "percentage": 60.46, "elapsed_time": "8:07:43", "remaining_time": "5:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2684, "total_steps": 4438, "loss": 0.1419, "learning_rate": 1.8481552088332656e-06, "epoch": 0.6047258287098318, "percentage": 60.48, "elapsed_time": "8:07:52", "remaining_time": "5:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2685, "total_steps": 4438, "loss": 0.1537, "learning_rate": 1.8463569294781509e-06, "epoch": 0.6049511363956402, "percentage": 60.5, "elapsed_time": "8:08:04", "remaining_time": "5:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2686, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.84455901306667e-06, "epoch": 0.6051764440814488, "percentage": 60.52, "elapsed_time": "8:08:14", "remaining_time": "5:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2687, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.842761460597138e-06, "epoch": 0.6054017517672572, "percentage": 60.55, "elapsed_time": "8:08:26", "remaining_time": "5:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2688, "total_steps": 4438, "loss": 0.1402, "learning_rate": 1.8409642730676692e-06, "epoch": 0.6056270594530656, "percentage": 60.57, "elapsed_time": "8:08:37", "remaining_time": "5:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2689, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.8391674514761745e-06, "epoch": 0.605852367138874, "percentage": 60.59, "elapsed_time": "8:08:48", "remaining_time": "5:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 4438, "loss": 0.1378, "learning_rate": 1.8373709968203624e-06, "epoch": 0.6060776748246824, "percentage": 60.61, "elapsed_time": "8:09:00", "remaining_time": "5:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2691, "total_steps": 4438, "loss": 0.1339, "learning_rate": 1.8355749100977371e-06, "epoch": 0.6063029825104909, "percentage": 60.64, "elapsed_time": "8:09:10", "remaining_time": "5:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2692, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.8337791923055983e-06, "epoch": 0.6065282901962993, "percentage": 60.66, "elapsed_time": "8:09:21", "remaining_time": "5:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2693, "total_steps": 4438, "loss": 0.1213, "learning_rate": 1.8319838444410412e-06, "epoch": 0.6067535978821077, "percentage": 60.68, "elapsed_time": "8:09:32", "remaining_time": "5:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2694, "total_steps": 4438, "loss": 0.1345, "learning_rate": 1.8301888675009554e-06, "epoch": 0.6069789055679162, "percentage": 60.7, "elapsed_time": "8:09:43", "remaining_time": "5:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2695, "total_steps": 4438, "loss": 0.157, "learning_rate": 1.8283942624820247e-06, "epoch": 0.6072042132537246, "percentage": 60.73, "elapsed_time": "8:09:54", "remaining_time": "5:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2696, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.8266000303807272e-06, "epoch": 0.6074295209395331, "percentage": 60.75, "elapsed_time": "8:10:04", "remaining_time": "5:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2697, "total_steps": 4438, "loss": 0.1331, "learning_rate": 1.8248061721933325e-06, "epoch": 0.6076548286253415, "percentage": 60.77, "elapsed_time": "8:10:14", "remaining_time": "5:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2698, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.8230126889159027e-06, "epoch": 0.6078801363111499, "percentage": 60.79, "elapsed_time": "8:10:24", "remaining_time": "5:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2699, "total_steps": 4438, "loss": 0.1424, "learning_rate": 1.8212195815442934e-06, "epoch": 0.6081054439969583, "percentage": 60.82, "elapsed_time": "8:10:35", "remaining_time": "5:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 4438, "loss": 0.1287, "learning_rate": 1.8194268510741493e-06, "epoch": 0.6083307516827667, "percentage": 60.84, "elapsed_time": "8:10:46", "remaining_time": "5:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2701, "total_steps": 4438, "loss": 0.1355, "learning_rate": 1.8176344985009064e-06, "epoch": 0.6085560593685753, "percentage": 60.86, "elapsed_time": "8:10:57", "remaining_time": "5:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2702, "total_steps": 4438, "loss": 0.1451, "learning_rate": 1.8158425248197931e-06, "epoch": 0.6087813670543837, "percentage": 60.88, "elapsed_time": "8:11:08", "remaining_time": "5:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2703, "total_steps": 4438, "loss": 0.1338, "learning_rate": 1.8140509310258238e-06, "epoch": 0.6090066747401921, "percentage": 60.91, "elapsed_time": "8:11:19", "remaining_time": "5:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2704, "total_steps": 4438, "loss": 0.1407, "learning_rate": 1.812259718113805e-06, "epoch": 0.6092319824260005, "percentage": 60.93, "elapsed_time": "8:11:30", "remaining_time": "5:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2705, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.8104688870783296e-06, "epoch": 0.6094572901118089, "percentage": 60.95, "elapsed_time": "8:11:42", "remaining_time": "5:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2706, "total_steps": 4438, "loss": 0.1549, "learning_rate": 1.8086784389137796e-06, "epoch": 0.6096825977976174, "percentage": 60.97, "elapsed_time": "8:11:53", "remaining_time": "5:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2707, "total_steps": 4438, "loss": 0.1392, "learning_rate": 1.806888374614324e-06, "epoch": 0.6099079054834258, "percentage": 61.0, "elapsed_time": "8:12:03", "remaining_time": "5:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2708, "total_steps": 4438, "loss": 0.1438, "learning_rate": 1.8050986951739201e-06, "epoch": 0.6101332131692342, "percentage": 61.02, "elapsed_time": "8:12:14", "remaining_time": "5:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2709, "total_steps": 4438, "loss": 0.1392, "learning_rate": 1.8033094015863082e-06, "epoch": 0.6103585208550427, "percentage": 61.04, "elapsed_time": "8:12:24", "remaining_time": "5:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.8015204948450166e-06, "epoch": 0.6105838285408511, "percentage": 61.06, "elapsed_time": "8:12:34", "remaining_time": "5:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2711, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.7997319759433596e-06, "epoch": 0.6108091362266596, "percentage": 61.09, "elapsed_time": "8:12:44", "remaining_time": "5:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2712, "total_steps": 4438, "loss": 0.1396, "learning_rate": 1.7979438458744343e-06, "epoch": 0.611034443912468, "percentage": 61.11, "elapsed_time": "8:12:54", "remaining_time": "5:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2713, "total_steps": 4438, "loss": 0.1398, "learning_rate": 1.7961561056311234e-06, "epoch": 0.6112597515982764, "percentage": 61.13, "elapsed_time": "8:13:06", "remaining_time": "5:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2714, "total_steps": 4438, "loss": 0.1484, "learning_rate": 1.7943687562060919e-06, "epoch": 0.6114850592840848, "percentage": 61.15, "elapsed_time": "8:13:17", "remaining_time": "5:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2715, "total_steps": 4438, "loss": 0.1428, "learning_rate": 1.792581798591788e-06, "epoch": 0.6117103669698932, "percentage": 61.18, "elapsed_time": "8:13:28", "remaining_time": "5:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2716, "total_steps": 4438, "loss": 0.137, "learning_rate": 1.7907952337804429e-06, "epoch": 0.6119356746557016, "percentage": 61.2, "elapsed_time": "8:13:38", "remaining_time": "5:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2717, "total_steps": 4438, "loss": 0.1533, "learning_rate": 1.7890090627640699e-06, "epoch": 0.6121609823415102, "percentage": 61.22, "elapsed_time": "8:13:48", "remaining_time": "5:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2718, "total_steps": 4438, "loss": 0.1479, "learning_rate": 1.787223286534463e-06, "epoch": 0.6123862900273186, "percentage": 61.24, "elapsed_time": "8:13:57", "remaining_time": "5:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2719, "total_steps": 4438, "loss": 0.1455, "learning_rate": 1.785437906083197e-06, "epoch": 0.612611597713127, "percentage": 61.27, "elapsed_time": "8:14:09", "remaining_time": "5:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 4438, "loss": 0.1526, "learning_rate": 1.783652922401627e-06, "epoch": 0.6128369053989354, "percentage": 61.29, "elapsed_time": "8:14:20", "remaining_time": "5:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2721, "total_steps": 4438, "loss": 0.1322, "learning_rate": 1.7818683364808883e-06, "epoch": 0.6130622130847438, "percentage": 61.31, "elapsed_time": "8:14:30", "remaining_time": "5:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2722, "total_steps": 4438, "loss": 0.1317, "learning_rate": 1.7800841493118942e-06, "epoch": 0.6132875207705523, "percentage": 61.33, "elapsed_time": "8:14:41", "remaining_time": "5:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2723, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.7783003618853384e-06, "epoch": 0.6135128284563607, "percentage": 61.36, "elapsed_time": "8:14:53", "remaining_time": "5:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2724, "total_steps": 4438, "loss": 0.1408, "learning_rate": 1.776516975191691e-06, "epoch": 0.6137381361421691, "percentage": 61.38, "elapsed_time": "8:15:05", "remaining_time": "5:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2725, "total_steps": 4438, "loss": 0.1285, "learning_rate": 1.7747339902212e-06, "epoch": 0.6139634438279776, "percentage": 61.4, "elapsed_time": "8:15:16", "remaining_time": "5:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2726, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.7729514079638915e-06, "epoch": 0.614188751513786, "percentage": 61.42, "elapsed_time": "8:15:26", "remaining_time": "5:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2727, "total_steps": 4438, "loss": 0.1482, "learning_rate": 1.7711692294095654e-06, "epoch": 0.6144140591995945, "percentage": 61.45, "elapsed_time": "8:15:37", "remaining_time": "5:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2728, "total_steps": 4438, "loss": 0.1521, "learning_rate": 1.7693874555477996e-06, "epoch": 0.6146393668854029, "percentage": 61.47, "elapsed_time": "8:15:48", "remaining_time": "5:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2729, "total_steps": 4438, "loss": 0.1359, "learning_rate": 1.7676060873679473e-06, "epoch": 0.6148646745712113, "percentage": 61.49, "elapsed_time": "8:15:58", "remaining_time": "5:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 4438, "loss": 0.1443, "learning_rate": 1.7658251258591352e-06, "epoch": 0.6150899822570197, "percentage": 61.51, "elapsed_time": "8:16:11", "remaining_time": "5:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2731, "total_steps": 4438, "loss": 0.1448, "learning_rate": 1.764044572010265e-06, "epoch": 0.6153152899428281, "percentage": 61.54, "elapsed_time": "8:16:22", "remaining_time": "5:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2732, "total_steps": 4438, "loss": 0.1565, "learning_rate": 1.7622644268100116e-06, "epoch": 0.6155405976286366, "percentage": 61.56, "elapsed_time": "8:16:31", "remaining_time": "5:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2733, "total_steps": 4438, "loss": 0.1506, "learning_rate": 1.7604846912468243e-06, "epoch": 0.6157659053144451, "percentage": 61.58, "elapsed_time": "8:16:43", "remaining_time": "5:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2734, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.7587053663089233e-06, "epoch": 0.6159912130002535, "percentage": 61.6, "elapsed_time": "8:16:53", "remaining_time": "5:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2735, "total_steps": 4438, "loss": 0.144, "learning_rate": 1.7569264529843009e-06, "epoch": 0.6162165206860619, "percentage": 61.63, "elapsed_time": "8:17:04", "remaining_time": "5:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2736, "total_steps": 4438, "loss": 0.1383, "learning_rate": 1.755147952260722e-06, "epoch": 0.6164418283718703, "percentage": 61.65, "elapsed_time": "8:17:14", "remaining_time": "5:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2737, "total_steps": 4438, "loss": 0.1453, "learning_rate": 1.753369865125722e-06, "epoch": 0.6166671360576788, "percentage": 61.67, "elapsed_time": "8:17:24", "remaining_time": "5:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2738, "total_steps": 4438, "loss": 0.1474, "learning_rate": 1.7515921925666053e-06, "epoch": 0.6168924437434872, "percentage": 61.69, "elapsed_time": "8:17:35", "remaining_time": "5:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2739, "total_steps": 4438, "loss": 0.1505, "learning_rate": 1.749814935570448e-06, "epoch": 0.6171177514292956, "percentage": 61.72, "elapsed_time": "8:17:44", "remaining_time": "5:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 4438, "loss": 0.137, "learning_rate": 1.748038095124095e-06, "epoch": 0.617343059115104, "percentage": 61.74, "elapsed_time": "8:17:54", "remaining_time": "5:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2741, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.746261672214159e-06, "epoch": 0.6175683668009125, "percentage": 61.76, "elapsed_time": "8:18:04", "remaining_time": "5:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2742, "total_steps": 4438, "loss": 0.1432, "learning_rate": 1.7444856678270218e-06, "epoch": 0.617793674486721, "percentage": 61.78, "elapsed_time": "8:18:15", "remaining_time": "5:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2743, "total_steps": 4438, "loss": 0.1371, "learning_rate": 1.7427100829488325e-06, "epoch": 0.6180189821725294, "percentage": 61.81, "elapsed_time": "8:18:27", "remaining_time": "5:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2744, "total_steps": 4438, "loss": 0.1459, "learning_rate": 1.7409349185655067e-06, "epoch": 0.6182442898583378, "percentage": 61.83, "elapsed_time": "8:18:36", "remaining_time": "5:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2745, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.739160175662727e-06, "epoch": 0.6184695975441462, "percentage": 61.85, "elapsed_time": "8:18:46", "remaining_time": "5:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2746, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.7373858552259421e-06, "epoch": 0.6186949052299546, "percentage": 61.87, "elapsed_time": "8:18:57", "remaining_time": "5:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2747, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.7356119582403663e-06, "epoch": 0.618920212915763, "percentage": 61.9, "elapsed_time": "8:19:07", "remaining_time": "5:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2748, "total_steps": 4438, "loss": 0.1386, "learning_rate": 1.733838485690978e-06, "epoch": 0.6191455206015716, "percentage": 61.92, "elapsed_time": "8:19:17", "remaining_time": "5:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2749, "total_steps": 4438, "loss": 0.1266, "learning_rate": 1.7320654385625208e-06, "epoch": 0.61937082828738, "percentage": 61.94, "elapsed_time": "8:19:28", "remaining_time": "5:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 4438, "loss": 0.1342, "learning_rate": 1.7302928178395018e-06, "epoch": 0.6195961359731884, "percentage": 61.96, "elapsed_time": "8:19:37", "remaining_time": "5:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2751, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.7285206245061908e-06, "epoch": 0.6198214436589968, "percentage": 61.99, "elapsed_time": "8:19:47", "remaining_time": "5:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2752, "total_steps": 4438, "loss": 0.1315, "learning_rate": 1.726748859546621e-06, "epoch": 0.6200467513448052, "percentage": 62.01, "elapsed_time": "8:19:58", "remaining_time": "5:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2753, "total_steps": 4438, "loss": 0.1217, "learning_rate": 1.7249775239445875e-06, "epoch": 0.6202720590306137, "percentage": 62.03, "elapsed_time": "8:20:09", "remaining_time": "5:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2754, "total_steps": 4438, "loss": 0.1245, "learning_rate": 1.723206618683646e-06, "epoch": 0.6204973667164221, "percentage": 62.05, "elapsed_time": "8:20:20", "remaining_time": "5:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2755, "total_steps": 4438, "loss": 0.1352, "learning_rate": 1.7214361447471156e-06, "epoch": 0.6207226744022305, "percentage": 62.08, "elapsed_time": "8:20:31", "remaining_time": "5:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2756, "total_steps": 4438, "loss": 0.1503, "learning_rate": 1.7196661031180738e-06, "epoch": 0.620947982088039, "percentage": 62.1, "elapsed_time": "8:20:41", "remaining_time": "5:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2757, "total_steps": 4438, "loss": 0.1338, "learning_rate": 1.7178964947793591e-06, "epoch": 0.6211732897738474, "percentage": 62.12, "elapsed_time": "8:20:52", "remaining_time": "5:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2758, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.716127320713568e-06, "epoch": 0.6213985974596559, "percentage": 62.15, "elapsed_time": "8:21:01", "remaining_time": "5:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2759, "total_steps": 4438, "loss": 0.1309, "learning_rate": 1.7143585819030583e-06, "epoch": 0.6216239051454643, "percentage": 62.17, "elapsed_time": "8:21:12", "remaining_time": "5:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 4438, "loss": 0.1296, "learning_rate": 1.7125902793299434e-06, "epoch": 0.6218492128312727, "percentage": 62.19, "elapsed_time": "8:21:22", "remaining_time": "5:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2761, "total_steps": 4438, "loss": 0.1194, "learning_rate": 1.7108224139760982e-06, "epoch": 0.6220745205170811, "percentage": 62.21, "elapsed_time": "8:21:31", "remaining_time": "5:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2762, "total_steps": 4438, "loss": 0.1209, "learning_rate": 1.7090549868231492e-06, "epoch": 0.6222998282028895, "percentage": 62.24, "elapsed_time": "8:21:42", "remaining_time": "5:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2763, "total_steps": 4438, "loss": 0.1433, "learning_rate": 1.707287998852485e-06, "epoch": 0.622525135888698, "percentage": 62.26, "elapsed_time": "8:21:52", "remaining_time": "5:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2764, "total_steps": 4438, "loss": 0.1295, "learning_rate": 1.7055214510452462e-06, "epoch": 0.6227504435745065, "percentage": 62.28, "elapsed_time": "8:22:03", "remaining_time": "5:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2765, "total_steps": 4438, "loss": 0.1366, "learning_rate": 1.7037553443823332e-06, "epoch": 0.6229757512603149, "percentage": 62.3, "elapsed_time": "8:22:13", "remaining_time": "5:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2766, "total_steps": 4438, "loss": 0.1305, "learning_rate": 1.7019896798443984e-06, "epoch": 0.6232010589461233, "percentage": 62.33, "elapsed_time": "8:22:23", "remaining_time": "5:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2767, "total_steps": 4438, "loss": 0.1522, "learning_rate": 1.700224458411849e-06, "epoch": 0.6234263666319317, "percentage": 62.35, "elapsed_time": "8:22:34", "remaining_time": "5:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2768, "total_steps": 4438, "loss": 0.1457, "learning_rate": 1.6984596810648475e-06, "epoch": 0.6236516743177402, "percentage": 62.37, "elapsed_time": "8:22:44", "remaining_time": "5:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2769, "total_steps": 4438, "loss": 0.1494, "learning_rate": 1.6966953487833078e-06, "epoch": 0.6238769820035486, "percentage": 62.39, "elapsed_time": "8:22:56", "remaining_time": "5:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 4438, "loss": 0.1412, "learning_rate": 1.6949314625468985e-06, "epoch": 0.624102289689357, "percentage": 62.42, "elapsed_time": "8:23:07", "remaining_time": "5:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2771, "total_steps": 4438, "loss": 0.1439, "learning_rate": 1.6931680233350404e-06, "epoch": 0.6243275973751654, "percentage": 62.44, "elapsed_time": "8:23:17", "remaining_time": "5:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2772, "total_steps": 4438, "loss": 0.1353, "learning_rate": 1.6914050321269049e-06, "epoch": 0.6245529050609739, "percentage": 62.46, "elapsed_time": "8:23:28", "remaining_time": "5:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2773, "total_steps": 4438, "loss": 0.1289, "learning_rate": 1.6896424899014158e-06, "epoch": 0.6247782127467824, "percentage": 62.48, "elapsed_time": "8:23:39", "remaining_time": "5:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2774, "total_steps": 4438, "loss": 0.1551, "learning_rate": 1.6878803976372465e-06, "epoch": 0.6250035204325908, "percentage": 62.51, "elapsed_time": "8:23:50", "remaining_time": "5:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2775, "total_steps": 4438, "loss": 0.1461, "learning_rate": 1.6861187563128217e-06, "epoch": 0.6252288281183992, "percentage": 62.53, "elapsed_time": "8:24:00", "remaining_time": "5:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2776, "total_steps": 4438, "loss": 0.1318, "learning_rate": 1.6843575669063142e-06, "epoch": 0.6254541358042076, "percentage": 62.55, "elapsed_time": "8:24:12", "remaining_time": "5:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2777, "total_steps": 4438, "loss": 0.131, "learning_rate": 1.682596830395648e-06, "epoch": 0.625679443490016, "percentage": 62.57, "elapsed_time": "8:24:23", "remaining_time": "5:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2778, "total_steps": 4438, "loss": 0.1427, "learning_rate": 1.6808365477584953e-06, "epoch": 0.6259047511758244, "percentage": 62.6, "elapsed_time": "8:24:35", "remaining_time": "5:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2779, "total_steps": 4438, "loss": 0.1518, "learning_rate": 1.6790767199722724e-06, "epoch": 0.6261300588616329, "percentage": 62.62, "elapsed_time": "8:24:46", "remaining_time": "5:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 4438, "loss": 0.138, "learning_rate": 1.6773173480141487e-06, "epoch": 0.6263553665474414, "percentage": 62.64, "elapsed_time": "8:24:58", "remaining_time": "5:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2781, "total_steps": 4438, "loss": 0.1393, "learning_rate": 1.6755584328610364e-06, "epoch": 0.6265806742332498, "percentage": 62.66, "elapsed_time": "8:25:07", "remaining_time": "5:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2782, "total_steps": 4438, "loss": 0.1369, "learning_rate": 1.6737999754895965e-06, "epoch": 0.6268059819190582, "percentage": 62.69, "elapsed_time": "8:25:18", "remaining_time": "5:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2783, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.6720419768762343e-06, "epoch": 0.6270312896048666, "percentage": 62.71, "elapsed_time": "8:25:29", "remaining_time": "5:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2784, "total_steps": 4438, "loss": 0.1332, "learning_rate": 1.6702844379971012e-06, "epoch": 0.6272565972906751, "percentage": 62.73, "elapsed_time": "8:25:40", "remaining_time": "5:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2785, "total_steps": 4438, "loss": 0.1412, "learning_rate": 1.668527359828092e-06, "epoch": 0.6274819049764835, "percentage": 62.75, "elapsed_time": "8:25:50", "remaining_time": "5:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2786, "total_steps": 4438, "loss": 0.1425, "learning_rate": 1.6667707433448482e-06, "epoch": 0.6277072126622919, "percentage": 62.78, "elapsed_time": "8:26:01", "remaining_time": "5:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2787, "total_steps": 4438, "loss": 0.144, "learning_rate": 1.6650145895227532e-06, "epoch": 0.6279325203481003, "percentage": 62.8, "elapsed_time": "8:26:12", "remaining_time": "4:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2788, "total_steps": 4438, "loss": 0.1461, "learning_rate": 1.663258899336933e-06, "epoch": 0.6281578280339088, "percentage": 62.82, "elapsed_time": "8:26:24", "remaining_time": "4:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2789, "total_steps": 4438, "loss": 0.1345, "learning_rate": 1.6615036737622574e-06, "epoch": 0.6283831357197173, "percentage": 62.84, "elapsed_time": "8:26:33", "remaining_time": "4:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 4438, "loss": 0.1478, "learning_rate": 1.6597489137733377e-06, "epoch": 0.6286084434055257, "percentage": 62.87, "elapsed_time": "8:26:44", "remaining_time": "4:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2791, "total_steps": 4438, "loss": 0.1389, "learning_rate": 1.6579946203445269e-06, "epoch": 0.6288337510913341, "percentage": 62.89, "elapsed_time": "8:26:54", "remaining_time": "4:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2792, "total_steps": 4438, "loss": 0.1318, "learning_rate": 1.6562407944499175e-06, "epoch": 0.6290590587771425, "percentage": 62.91, "elapsed_time": "8:27:04", "remaining_time": "4:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2793, "total_steps": 4438, "loss": 0.1257, "learning_rate": 1.6544874370633456e-06, "epoch": 0.6292843664629509, "percentage": 62.93, "elapsed_time": "8:27:14", "remaining_time": "4:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2794, "total_steps": 4438, "loss": 0.1426, "learning_rate": 1.652734549158384e-06, "epoch": 0.6295096741487594, "percentage": 62.96, "elapsed_time": "8:27:25", "remaining_time": "4:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2795, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.6509821317083466e-06, "epoch": 0.6297349818345679, "percentage": 62.98, "elapsed_time": "8:27:35", "remaining_time": "4:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2796, "total_steps": 4438, "loss": 0.1256, "learning_rate": 1.6492301856862855e-06, "epoch": 0.6299602895203763, "percentage": 63.0, "elapsed_time": "8:27:47", "remaining_time": "4:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2797, "total_steps": 4438, "loss": 0.1424, "learning_rate": 1.6474787120649903e-06, "epoch": 0.6301855972061847, "percentage": 63.02, "elapsed_time": "8:28:00", "remaining_time": "4:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2798, "total_steps": 4438, "loss": 0.138, "learning_rate": 1.6457277118169893e-06, "epoch": 0.6304109048919931, "percentage": 63.05, "elapsed_time": "8:28:09", "remaining_time": "4:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2799, "total_steps": 4438, "loss": 0.136, "learning_rate": 1.6439771859145476e-06, "epoch": 0.6306362125778016, "percentage": 63.07, "elapsed_time": "8:28:21", "remaining_time": "4:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 4438, "loss": 0.1386, "learning_rate": 1.6422271353296675e-06, "epoch": 0.63086152026361, "percentage": 63.09, "elapsed_time": "8:28:31", "remaining_time": "4:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2801, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.640477561034086e-06, "epoch": 0.6310868279494184, "percentage": 63.11, "elapsed_time": "8:28:41", "remaining_time": "4:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2802, "total_steps": 4438, "loss": 0.1344, "learning_rate": 1.6387284639992773e-06, "epoch": 0.6313121356352268, "percentage": 63.14, "elapsed_time": "8:28:54", "remaining_time": "4:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2803, "total_steps": 4438, "loss": 0.1335, "learning_rate": 1.6369798451964496e-06, "epoch": 0.6315374433210353, "percentage": 63.16, "elapsed_time": "8:29:04", "remaining_time": "4:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2804, "total_steps": 4438, "loss": 0.1455, "learning_rate": 1.6352317055965458e-06, "epoch": 0.6317627510068438, "percentage": 63.18, "elapsed_time": "8:29:17", "remaining_time": "4:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2805, "total_steps": 4438, "loss": 0.1401, "learning_rate": 1.6334840461702422e-06, "epoch": 0.6319880586926522, "percentage": 63.2, "elapsed_time": "8:29:28", "remaining_time": "4:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2806, "total_steps": 4438, "loss": 0.1255, "learning_rate": 1.6317368678879497e-06, "epoch": 0.6322133663784606, "percentage": 63.23, "elapsed_time": "8:29:39", "remaining_time": "4:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2807, "total_steps": 4438, "loss": 0.1287, "learning_rate": 1.6299901717198102e-06, "epoch": 0.632438674064269, "percentage": 63.25, "elapsed_time": "8:29:49", "remaining_time": "4:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2808, "total_steps": 4438, "loss": 0.1378, "learning_rate": 1.6282439586356999e-06, "epoch": 0.6326639817500774, "percentage": 63.27, "elapsed_time": "8:30:00", "remaining_time": "4:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2809, "total_steps": 4438, "loss": 0.1373, "learning_rate": 1.6264982296052256e-06, "epoch": 0.6328892894358858, "percentage": 63.29, "elapsed_time": "8:30:10", "remaining_time": "4:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 4438, "loss": 0.124, "learning_rate": 1.6247529855977256e-06, "epoch": 0.6331145971216943, "percentage": 63.32, "elapsed_time": "8:30:21", "remaining_time": "4:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2811, "total_steps": 4438, "loss": 0.1468, "learning_rate": 1.6230082275822687e-06, "epoch": 0.6333399048075028, "percentage": 63.34, "elapsed_time": "8:30:30", "remaining_time": "4:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2812, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.6212639565276538e-06, "epoch": 0.6335652124933112, "percentage": 63.36, "elapsed_time": "8:30:40", "remaining_time": "4:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2813, "total_steps": 4438, "loss": 0.1298, "learning_rate": 1.6195201734024096e-06, "epoch": 0.6337905201791196, "percentage": 63.38, "elapsed_time": "8:30:49", "remaining_time": "4:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2814, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.6177768791747957e-06, "epoch": 0.634015827864928, "percentage": 63.41, "elapsed_time": "8:31:00", "remaining_time": "4:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2815, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.6160340748127959e-06, "epoch": 0.6342411355507365, "percentage": 63.43, "elapsed_time": "8:31:09", "remaining_time": "4:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2816, "total_steps": 4438, "loss": 0.1257, "learning_rate": 1.6142917612841252e-06, "epoch": 0.6344664432365449, "percentage": 63.45, "elapsed_time": "8:31:20", "remaining_time": "4:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2817, "total_steps": 4438, "loss": 0.1297, "learning_rate": 1.612549939556225e-06, "epoch": 0.6346917509223533, "percentage": 63.47, "elapsed_time": "8:31:31", "remaining_time": "4:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2818, "total_steps": 4438, "loss": 0.1249, "learning_rate": 1.610808610596265e-06, "epoch": 0.6349170586081617, "percentage": 63.5, "elapsed_time": "8:31:42", "remaining_time": "4:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2819, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.6090677753711403e-06, "epoch": 0.6351423662939703, "percentage": 63.52, "elapsed_time": "8:31:52", "remaining_time": "4:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 4438, "loss": 0.1449, "learning_rate": 1.607327434847471e-06, "epoch": 0.6353676739797787, "percentage": 63.54, "elapsed_time": "8:32:04", "remaining_time": "4:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2821, "total_steps": 4438, "loss": 0.1447, "learning_rate": 1.6055875899916034e-06, "epoch": 0.6355929816655871, "percentage": 63.56, "elapsed_time": "8:32:15", "remaining_time": "4:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2822, "total_steps": 4438, "loss": 0.1418, "learning_rate": 1.6038482417696095e-06, "epoch": 0.6358182893513955, "percentage": 63.59, "elapsed_time": "8:32:26", "remaining_time": "4:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2823, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.6021093911472825e-06, "epoch": 0.6360435970372039, "percentage": 63.61, "elapsed_time": "8:32:38", "remaining_time": "4:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2824, "total_steps": 4438, "loss": 0.1426, "learning_rate": 1.6003710390901434e-06, "epoch": 0.6362689047230123, "percentage": 63.63, "elapsed_time": "8:32:48", "remaining_time": "4:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2825, "total_steps": 4438, "loss": 0.1525, "learning_rate": 1.5986331865634335e-06, "epoch": 0.6364942124088208, "percentage": 63.65, "elapsed_time": "8:32:59", "remaining_time": "4:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2826, "total_steps": 4438, "loss": 0.1458, "learning_rate": 1.5968958345321178e-06, "epoch": 0.6367195200946292, "percentage": 63.68, "elapsed_time": "8:33:10", "remaining_time": "4:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2827, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.5951589839608828e-06, "epoch": 0.6369448277804377, "percentage": 63.7, "elapsed_time": "8:33:21", "remaining_time": "4:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2828, "total_steps": 4438, "loss": 0.1328, "learning_rate": 1.5934226358141368e-06, "epoch": 0.6371701354662461, "percentage": 63.72, "elapsed_time": "8:33:30", "remaining_time": "4:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2829, "total_steps": 4438, "loss": 0.1325, "learning_rate": 1.5916867910560092e-06, "epoch": 0.6373954431520545, "percentage": 63.74, "elapsed_time": "8:33:40", "remaining_time": "4:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 4438, "loss": 0.1496, "learning_rate": 1.5899514506503499e-06, "epoch": 0.637620750837863, "percentage": 63.77, "elapsed_time": "8:33:51", "remaining_time": "4:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2831, "total_steps": 4438, "loss": 0.1484, "learning_rate": 1.5882166155607306e-06, "epoch": 0.6378460585236714, "percentage": 63.79, "elapsed_time": "8:34:02", "remaining_time": "4:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2832, "total_steps": 4438, "loss": 0.1412, "learning_rate": 1.5864822867504376e-06, "epoch": 0.6380713662094798, "percentage": 63.81, "elapsed_time": "8:34:13", "remaining_time": "4:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2833, "total_steps": 4438, "loss": 0.1415, "learning_rate": 1.58474846518248e-06, "epoch": 0.6382966738952882, "percentage": 63.84, "elapsed_time": "8:34:25", "remaining_time": "4:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2834, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.5830151518195846e-06, "epoch": 0.6385219815810966, "percentage": 63.86, "elapsed_time": "8:34:36", "remaining_time": "4:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2835, "total_steps": 4438, "loss": 0.1264, "learning_rate": 1.5812823476241962e-06, "epoch": 0.6387472892669052, "percentage": 63.88, "elapsed_time": "8:34:47", "remaining_time": "4:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2836, "total_steps": 4438, "loss": 0.1417, "learning_rate": 1.5795500535584758e-06, "epoch": 0.6389725969527136, "percentage": 63.9, "elapsed_time": "8:34:58", "remaining_time": "4:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2837, "total_steps": 4438, "loss": 0.1433, "learning_rate": 1.5778182705843017e-06, "epoch": 0.639197904638522, "percentage": 63.93, "elapsed_time": "8:35:09", "remaining_time": "4:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2838, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.5760869996632685e-06, "epoch": 0.6394232123243304, "percentage": 63.95, "elapsed_time": "8:35:21", "remaining_time": "4:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2839, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.574356241756686e-06, "epoch": 0.6396485200101388, "percentage": 63.97, "elapsed_time": "8:35:34", "remaining_time": "4:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 4438, "loss": 0.141, "learning_rate": 1.572625997825581e-06, "epoch": 0.6398738276959473, "percentage": 63.99, "elapsed_time": "8:35:46", "remaining_time": "4:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2841, "total_steps": 4438, "loss": 0.1489, "learning_rate": 1.5708962688306916e-06, "epoch": 0.6400991353817557, "percentage": 64.02, "elapsed_time": "8:35:56", "remaining_time": "4:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2842, "total_steps": 4438, "loss": 0.1439, "learning_rate": 1.5691670557324734e-06, "epoch": 0.6403244430675642, "percentage": 64.04, "elapsed_time": "8:36:06", "remaining_time": "4:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2843, "total_steps": 4438, "loss": 0.1411, "learning_rate": 1.5674383594910931e-06, "epoch": 0.6405497507533726, "percentage": 64.06, "elapsed_time": "8:36:16", "remaining_time": "4:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2844, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.5657101810664314e-06, "epoch": 0.640775058439181, "percentage": 64.08, "elapsed_time": "8:36:27", "remaining_time": "4:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2845, "total_steps": 4438, "loss": 0.1257, "learning_rate": 1.5639825214180808e-06, "epoch": 0.6410003661249895, "percentage": 64.11, "elapsed_time": "8:36:36", "remaining_time": "4:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2846, "total_steps": 4438, "loss": 0.1446, "learning_rate": 1.5622553815053476e-06, "epoch": 0.6412256738107979, "percentage": 64.13, "elapsed_time": "8:36:48", "remaining_time": "4:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2847, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.5605287622872478e-06, "epoch": 0.6414509814966063, "percentage": 64.15, "elapsed_time": "8:36:57", "remaining_time": "4:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2848, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.558802664722508e-06, "epoch": 0.6416762891824147, "percentage": 64.17, "elapsed_time": "8:37:09", "remaining_time": "4:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2849, "total_steps": 4438, "loss": 0.1318, "learning_rate": 1.5570770897695672e-06, "epoch": 0.6419015968682231, "percentage": 64.2, "elapsed_time": "8:37:20", "remaining_time": "4:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 4438, "loss": 0.1415, "learning_rate": 1.555352038386571e-06, "epoch": 0.6421269045540317, "percentage": 64.22, "elapsed_time": "8:37:30", "remaining_time": "4:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2851, "total_steps": 4438, "loss": 0.1271, "learning_rate": 1.5536275115313776e-06, "epoch": 0.6423522122398401, "percentage": 64.24, "elapsed_time": "8:37:41", "remaining_time": "4:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2852, "total_steps": 4438, "loss": 0.1426, "learning_rate": 1.5519035101615518e-06, "epoch": 0.6425775199256485, "percentage": 64.26, "elapsed_time": "8:37:52", "remaining_time": "4:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2853, "total_steps": 4438, "loss": 0.1451, "learning_rate": 1.5501800352343673e-06, "epoch": 0.6428028276114569, "percentage": 64.29, "elapsed_time": "8:38:03", "remaining_time": "4:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2854, "total_steps": 4438, "loss": 0.1453, "learning_rate": 1.5484570877068055e-06, "epoch": 0.6430281352972653, "percentage": 64.31, "elapsed_time": "8:38:14", "remaining_time": "4:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2855, "total_steps": 4438, "loss": 0.1553, "learning_rate": 1.5467346685355553e-06, "epoch": 0.6432534429830737, "percentage": 64.33, "elapsed_time": "8:38:24", "remaining_time": "4:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2856, "total_steps": 4438, "loss": 0.1465, "learning_rate": 1.5450127786770116e-06, "epoch": 0.6434787506688822, "percentage": 64.35, "elapsed_time": "8:38:36", "remaining_time": "4:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2857, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.5432914190872757e-06, "epoch": 0.6437040583546906, "percentage": 64.38, "elapsed_time": "8:38:46", "remaining_time": "4:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2858, "total_steps": 4438, "loss": 0.1238, "learning_rate": 1.5415705907221545e-06, "epoch": 0.6439293660404991, "percentage": 64.4, "elapsed_time": "8:38:56", "remaining_time": "4:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2859, "total_steps": 4438, "loss": 0.1332, "learning_rate": 1.53985029453716e-06, "epoch": 0.6441546737263075, "percentage": 64.42, "elapsed_time": "8:39:07", "remaining_time": "4:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 4438, "loss": 0.1414, "learning_rate": 1.5381305314875084e-06, "epoch": 0.6443799814121159, "percentage": 64.44, "elapsed_time": "8:39:17", "remaining_time": "4:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2861, "total_steps": 4438, "loss": 0.1355, "learning_rate": 1.536411302528119e-06, "epoch": 0.6446052890979244, "percentage": 64.47, "elapsed_time": "8:39:28", "remaining_time": "4:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2862, "total_steps": 4438, "loss": 0.1383, "learning_rate": 1.5346926086136171e-06, "epoch": 0.6448305967837328, "percentage": 64.49, "elapsed_time": "8:39:39", "remaining_time": "4:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2863, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.5329744506983292e-06, "epoch": 0.6450559044695412, "percentage": 64.51, "elapsed_time": "8:39:50", "remaining_time": "4:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2864, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.5312568297362834e-06, "epoch": 0.6452812121553496, "percentage": 64.53, "elapsed_time": "8:40:01", "remaining_time": "4:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2865, "total_steps": 4438, "loss": 0.1438, "learning_rate": 1.5295397466812115e-06, "epoch": 0.645506519841158, "percentage": 64.56, "elapsed_time": "8:40:13", "remaining_time": "4:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2866, "total_steps": 4438, "loss": 0.1275, "learning_rate": 1.5278232024865458e-06, "epoch": 0.6457318275269666, "percentage": 64.58, "elapsed_time": "8:40:22", "remaining_time": "4:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2867, "total_steps": 4438, "loss": 0.1387, "learning_rate": 1.5261071981054183e-06, "epoch": 0.645957135212775, "percentage": 64.6, "elapsed_time": "8:40:32", "remaining_time": "4:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2868, "total_steps": 4438, "loss": 0.1369, "learning_rate": 1.5243917344906625e-06, "epoch": 0.6461824428985834, "percentage": 64.62, "elapsed_time": "8:40:42", "remaining_time": "4:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2869, "total_steps": 4438, "loss": 0.1223, "learning_rate": 1.5226768125948122e-06, "epoch": 0.6464077505843918, "percentage": 64.65, "elapsed_time": "8:40:54", "remaining_time": "4:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 4438, "loss": 0.1254, "learning_rate": 1.5209624333700985e-06, "epoch": 0.6466330582702002, "percentage": 64.67, "elapsed_time": "8:41:05", "remaining_time": "4:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2871, "total_steps": 4438, "loss": 0.1373, "learning_rate": 1.5192485977684528e-06, "epoch": 0.6468583659560087, "percentage": 64.69, "elapsed_time": "8:41:18", "remaining_time": "4:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2872, "total_steps": 4438, "loss": 0.1363, "learning_rate": 1.517535306741505e-06, "epoch": 0.6470836736418171, "percentage": 64.71, "elapsed_time": "8:41:29", "remaining_time": "4:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2873, "total_steps": 4438, "loss": 0.1315, "learning_rate": 1.5158225612405808e-06, "epoch": 0.6473089813276255, "percentage": 64.74, "elapsed_time": "8:41:40", "remaining_time": "4:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2874, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.5141103622167042e-06, "epoch": 0.647534289013434, "percentage": 64.76, "elapsed_time": "8:41:49", "remaining_time": "4:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2875, "total_steps": 4438, "loss": 0.1336, "learning_rate": 1.512398710620595e-06, "epoch": 0.6477595966992424, "percentage": 64.78, "elapsed_time": "8:41:59", "remaining_time": "4:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2876, "total_steps": 4438, "loss": 0.124, "learning_rate": 1.51068760740267e-06, "epoch": 0.6479849043850509, "percentage": 64.8, "elapsed_time": "8:42:11", "remaining_time": "4:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2877, "total_steps": 4438, "loss": 0.1267, "learning_rate": 1.508977053513041e-06, "epoch": 0.6482102120708593, "percentage": 64.83, "elapsed_time": "8:42:22", "remaining_time": "4:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2878, "total_steps": 4438, "loss": 0.1311, "learning_rate": 1.5072670499015151e-06, "epoch": 0.6484355197566677, "percentage": 64.85, "elapsed_time": "8:42:34", "remaining_time": "4:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2879, "total_steps": 4438, "loss": 0.1498, "learning_rate": 1.5055575975175929e-06, "epoch": 0.6486608274424761, "percentage": 64.87, "elapsed_time": "8:42:45", "remaining_time": "4:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 4438, "loss": 0.154, "learning_rate": 1.5038486973104704e-06, "epoch": 0.6488861351282845, "percentage": 64.89, "elapsed_time": "8:42:55", "remaining_time": "4:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2881, "total_steps": 4438, "loss": 0.1253, "learning_rate": 1.5021403502290354e-06, "epoch": 0.6491114428140929, "percentage": 64.92, "elapsed_time": "8:43:04", "remaining_time": "4:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2882, "total_steps": 4438, "loss": 0.127, "learning_rate": 1.5004325572218698e-06, "epoch": 0.6493367504999015, "percentage": 64.94, "elapsed_time": "8:43:14", "remaining_time": "4:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2883, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.4987253192372471e-06, "epoch": 0.6495620581857099, "percentage": 64.96, "elapsed_time": "8:43:25", "remaining_time": "4:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2884, "total_steps": 4438, "loss": 0.1413, "learning_rate": 1.4970186372231347e-06, "epoch": 0.6497873658715183, "percentage": 64.98, "elapsed_time": "8:43:36", "remaining_time": "4:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2885, "total_steps": 4438, "loss": 0.1423, "learning_rate": 1.4953125121271866e-06, "epoch": 0.6500126735573267, "percentage": 65.01, "elapsed_time": "8:43:45", "remaining_time": "4:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2886, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.493606944896751e-06, "epoch": 0.6502379812431351, "percentage": 65.03, "elapsed_time": "8:43:56", "remaining_time": "4:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2887, "total_steps": 4438, "loss": 0.1241, "learning_rate": 1.4919019364788678e-06, "epoch": 0.6504632889289436, "percentage": 65.05, "elapsed_time": "8:44:07", "remaining_time": "4:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2888, "total_steps": 4438, "loss": 0.1426, "learning_rate": 1.490197487820263e-06, "epoch": 0.650688596614752, "percentage": 65.07, "elapsed_time": "8:44:18", "remaining_time": "4:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2889, "total_steps": 4438, "loss": 0.1377, "learning_rate": 1.4884935998673539e-06, "epoch": 0.6509139043005604, "percentage": 65.1, "elapsed_time": "8:44:27", "remaining_time": "4:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 4438, "loss": 0.1449, "learning_rate": 1.486790273566246e-06, "epoch": 0.6511392119863689, "percentage": 65.12, "elapsed_time": "8:44:39", "remaining_time": "4:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2891, "total_steps": 4438, "loss": 0.1336, "learning_rate": 1.4850875098627326e-06, "epoch": 0.6513645196721773, "percentage": 65.14, "elapsed_time": "8:44:50", "remaining_time": "4:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2892, "total_steps": 4438, "loss": 0.1459, "learning_rate": 1.483385309702295e-06, "epoch": 0.6515898273579858, "percentage": 65.16, "elapsed_time": "8:45:00", "remaining_time": "4:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2893, "total_steps": 4438, "loss": 0.1391, "learning_rate": 1.4816836740301019e-06, "epoch": 0.6518151350437942, "percentage": 65.19, "elapsed_time": "8:45:10", "remaining_time": "4:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2894, "total_steps": 4438, "loss": 0.159, "learning_rate": 1.4799826037910082e-06, "epoch": 0.6520404427296026, "percentage": 65.21, "elapsed_time": "8:45:22", "remaining_time": "4:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2895, "total_steps": 4438, "loss": 0.1222, "learning_rate": 1.478282099929554e-06, "epoch": 0.652265750415411, "percentage": 65.23, "elapsed_time": "8:45:32", "remaining_time": "4:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2896, "total_steps": 4438, "loss": 0.1396, "learning_rate": 1.4765821633899663e-06, "epoch": 0.6524910581012194, "percentage": 65.25, "elapsed_time": "8:45:43", "remaining_time": "4:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2897, "total_steps": 4438, "loss": 0.1316, "learning_rate": 1.4748827951161566e-06, "epoch": 0.652716365787028, "percentage": 65.28, "elapsed_time": "8:45:54", "remaining_time": "4:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2898, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.4731839960517202e-06, "epoch": 0.6529416734728364, "percentage": 65.3, "elapsed_time": "8:46:05", "remaining_time": "4:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2899, "total_steps": 4438, "loss": 0.1489, "learning_rate": 1.4714857671399374e-06, "epoch": 0.6531669811586448, "percentage": 65.32, "elapsed_time": "8:46:15", "remaining_time": "4:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 4438, "loss": 0.1345, "learning_rate": 1.4697881093237714e-06, "epoch": 0.6533922888444532, "percentage": 65.34, "elapsed_time": "8:46:26", "remaining_time": "4:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2901, "total_steps": 4438, "loss": 0.1385, "learning_rate": 1.4680910235458692e-06, "epoch": 0.6536175965302616, "percentage": 65.37, "elapsed_time": "8:46:36", "remaining_time": "4:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2902, "total_steps": 4438, "loss": 0.1326, "learning_rate": 1.4663945107485567e-06, "epoch": 0.65384290421607, "percentage": 65.39, "elapsed_time": "8:46:45", "remaining_time": "4:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2903, "total_steps": 4438, "loss": 0.1378, "learning_rate": 1.4646985718738466e-06, "epoch": 0.6540682119018785, "percentage": 65.41, "elapsed_time": "8:46:55", "remaining_time": "4:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2904, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.4630032078634293e-06, "epoch": 0.6542935195876869, "percentage": 65.43, "elapsed_time": "8:47:06", "remaining_time": "4:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2905, "total_steps": 4438, "loss": 0.1367, "learning_rate": 1.461308419658678e-06, "epoch": 0.6545188272734954, "percentage": 65.46, "elapsed_time": "8:47:16", "remaining_time": "4:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2906, "total_steps": 4438, "loss": 0.1286, "learning_rate": 1.4596142082006448e-06, "epoch": 0.6547441349593038, "percentage": 65.48, "elapsed_time": "8:47:27", "remaining_time": "4:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2907, "total_steps": 4438, "loss": 0.1609, "learning_rate": 1.457920574430062e-06, "epoch": 0.6549694426451123, "percentage": 65.5, "elapsed_time": "8:47:39", "remaining_time": "4:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2908, "total_steps": 4438, "loss": 0.1459, "learning_rate": 1.456227519287343e-06, "epoch": 0.6551947503309207, "percentage": 65.53, "elapsed_time": "8:47:49", "remaining_time": "4:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2909, "total_steps": 4438, "loss": 0.1355, "learning_rate": 1.4545350437125755e-06, "epoch": 0.6554200580167291, "percentage": 65.55, "elapsed_time": "8:47:59", "remaining_time": "4:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 4438, "loss": 0.1406, "learning_rate": 1.4528431486455311e-06, "epoch": 0.6556453657025375, "percentage": 65.57, "elapsed_time": "8:48:11", "remaining_time": "4:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2911, "total_steps": 4438, "loss": 0.1372, "learning_rate": 1.451151835025653e-06, "epoch": 0.6558706733883459, "percentage": 65.59, "elapsed_time": "8:48:22", "remaining_time": "4:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2912, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.4494611037920667e-06, "epoch": 0.6560959810741543, "percentage": 65.62, "elapsed_time": "8:48:32", "remaining_time": "4:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2913, "total_steps": 4438, "loss": 0.1396, "learning_rate": 1.4477709558835724e-06, "epoch": 0.6563212887599629, "percentage": 65.64, "elapsed_time": "8:48:44", "remaining_time": "4:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2914, "total_steps": 4438, "loss": 0.134, "learning_rate": 1.4460813922386446e-06, "epoch": 0.6565465964457713, "percentage": 65.66, "elapsed_time": "8:48:55", "remaining_time": "4:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2915, "total_steps": 4438, "loss": 0.1266, "learning_rate": 1.4443924137954368e-06, "epoch": 0.6567719041315797, "percentage": 65.68, "elapsed_time": "8:49:06", "remaining_time": "4:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2916, "total_steps": 4438, "loss": 0.1371, "learning_rate": 1.4427040214917742e-06, "epoch": 0.6569972118173881, "percentage": 65.71, "elapsed_time": "8:49:16", "remaining_time": "4:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2917, "total_steps": 4438, "loss": 0.1346, "learning_rate": 1.4410162162651586e-06, "epoch": 0.6572225195031965, "percentage": 65.73, "elapsed_time": "8:49:27", "remaining_time": "4:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2918, "total_steps": 4438, "loss": 0.1236, "learning_rate": 1.4393289990527665e-06, "epoch": 0.657447827189005, "percentage": 65.75, "elapsed_time": "8:49:36", "remaining_time": "4:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2919, "total_steps": 4438, "loss": 0.1408, "learning_rate": 1.4376423707914462e-06, "epoch": 0.6576731348748134, "percentage": 65.77, "elapsed_time": "8:49:47", "remaining_time": "4:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 4438, "loss": 0.1316, "learning_rate": 1.4359563324177176e-06, "epoch": 0.6578984425606218, "percentage": 65.8, "elapsed_time": "8:50:00", "remaining_time": "4:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2921, "total_steps": 4438, "loss": 0.1321, "learning_rate": 1.4342708848677774e-06, "epoch": 0.6581237502464303, "percentage": 65.82, "elapsed_time": "8:50:10", "remaining_time": "4:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2922, "total_steps": 4438, "loss": 0.1365, "learning_rate": 1.43258602907749e-06, "epoch": 0.6583490579322387, "percentage": 65.84, "elapsed_time": "8:50:19", "remaining_time": "4:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2923, "total_steps": 4438, "loss": 0.1401, "learning_rate": 1.430901765982395e-06, "epoch": 0.6585743656180472, "percentage": 65.86, "elapsed_time": "8:50:30", "remaining_time": "4:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2924, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.429218096517699e-06, "epoch": 0.6587996733038556, "percentage": 65.89, "elapsed_time": "8:50:41", "remaining_time": "4:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2925, "total_steps": 4438, "loss": 0.1113, "learning_rate": 1.4275350216182824e-06, "epoch": 0.659024980989664, "percentage": 65.91, "elapsed_time": "8:50:52", "remaining_time": "4:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2926, "total_steps": 4438, "loss": 0.1479, "learning_rate": 1.425852542218692e-06, "epoch": 0.6592502886754724, "percentage": 65.93, "elapsed_time": "8:51:04", "remaining_time": "4:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2927, "total_steps": 4438, "loss": 0.1398, "learning_rate": 1.4241706592531473e-06, "epoch": 0.6594755963612808, "percentage": 65.95, "elapsed_time": "8:51:15", "remaining_time": "4:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2928, "total_steps": 4438, "loss": 0.1381, "learning_rate": 1.4224893736555364e-06, "epoch": 0.6597009040470893, "percentage": 65.98, "elapsed_time": "8:51:25", "remaining_time": "4:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2929, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.420808686359412e-06, "epoch": 0.6599262117328978, "percentage": 66.0, "elapsed_time": "8:51:36", "remaining_time": "4:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 4438, "loss": 0.124, "learning_rate": 1.4191285982979992e-06, "epoch": 0.6601515194187062, "percentage": 66.02, "elapsed_time": "8:51:46", "remaining_time": "4:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2931, "total_steps": 4438, "loss": 0.1394, "learning_rate": 1.4174491104041866e-06, "epoch": 0.6603768271045146, "percentage": 66.04, "elapsed_time": "8:51:56", "remaining_time": "4:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2932, "total_steps": 4438, "loss": 0.1444, "learning_rate": 1.4157702236105326e-06, "epoch": 0.660602134790323, "percentage": 66.07, "elapsed_time": "8:52:07", "remaining_time": "4:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2933, "total_steps": 4438, "loss": 0.1379, "learning_rate": 1.414091938849259e-06, "epoch": 0.6608274424761315, "percentage": 66.09, "elapsed_time": "8:52:18", "remaining_time": "4:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2934, "total_steps": 4438, "loss": 0.1307, "learning_rate": 1.412414257052256e-06, "epoch": 0.6610527501619399, "percentage": 66.11, "elapsed_time": "8:52:30", "remaining_time": "4:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2935, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.410737179151078e-06, "epoch": 0.6612780578477483, "percentage": 66.13, "elapsed_time": "8:52:40", "remaining_time": "4:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2936, "total_steps": 4438, "loss": 0.1256, "learning_rate": 1.4090607060769423e-06, "epoch": 0.6615033655335567, "percentage": 66.16, "elapsed_time": "8:52:50", "remaining_time": "4:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2937, "total_steps": 4438, "loss": 0.1427, "learning_rate": 1.407384838760734e-06, "epoch": 0.6617286732193652, "percentage": 66.18, "elapsed_time": "8:53:00", "remaining_time": "4:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2938, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.4057095781329983e-06, "epoch": 0.6619539809051737, "percentage": 66.2, "elapsed_time": "8:53:11", "remaining_time": "4:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2939, "total_steps": 4438, "loss": 0.1159, "learning_rate": 1.4040349251239444e-06, "epoch": 0.6621792885909821, "percentage": 66.22, "elapsed_time": "8:53:23", "remaining_time": "4:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.402360880663447e-06, "epoch": 0.6624045962767905, "percentage": 66.25, "elapsed_time": "8:53:34", "remaining_time": "4:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2941, "total_steps": 4438, "loss": 0.1359, "learning_rate": 1.4006874456810377e-06, "epoch": 0.6626299039625989, "percentage": 66.27, "elapsed_time": "8:53:46", "remaining_time": "4:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2942, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.3990146211059141e-06, "epoch": 0.6628552116484073, "percentage": 66.29, "elapsed_time": "8:53:57", "remaining_time": "4:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2943, "total_steps": 4438, "loss": 0.1346, "learning_rate": 1.3973424078669346e-06, "epoch": 0.6630805193342157, "percentage": 66.31, "elapsed_time": "8:54:10", "remaining_time": "4:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2944, "total_steps": 4438, "loss": 0.1504, "learning_rate": 1.3956708068926141e-06, "epoch": 0.6633058270200243, "percentage": 66.34, "elapsed_time": "8:54:20", "remaining_time": "4:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2945, "total_steps": 4438, "loss": 0.138, "learning_rate": 1.393999819111133e-06, "epoch": 0.6635311347058327, "percentage": 66.36, "elapsed_time": "8:54:30", "remaining_time": "4:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2946, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.3923294454503263e-06, "epoch": 0.6637564423916411, "percentage": 66.38, "elapsed_time": "8:54:40", "remaining_time": "4:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2947, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.3906596868376923e-06, "epoch": 0.6639817500774495, "percentage": 66.4, "elapsed_time": "8:54:52", "remaining_time": "4:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2948, "total_steps": 4438, "loss": 0.1147, "learning_rate": 1.3889905442003836e-06, "epoch": 0.664207057763258, "percentage": 66.43, "elapsed_time": "8:55:00", "remaining_time": "4:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2949, "total_steps": 4438, "loss": 0.1419, "learning_rate": 1.3873220184652143e-06, "epoch": 0.6644323654490664, "percentage": 66.45, "elapsed_time": "8:55:13", "remaining_time": "4:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 4438, "loss": 0.1393, "learning_rate": 1.3856541105586545e-06, "epoch": 0.6646576731348748, "percentage": 66.47, "elapsed_time": "8:55:22", "remaining_time": "4:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2951, "total_steps": 4438, "loss": 0.1395, "learning_rate": 1.3839868214068303e-06, "epoch": 0.6648829808206832, "percentage": 66.49, "elapsed_time": "8:55:33", "remaining_time": "4:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2952, "total_steps": 4438, "loss": 0.1245, "learning_rate": 1.382320151935527e-06, "epoch": 0.6651082885064917, "percentage": 66.52, "elapsed_time": "8:55:43", "remaining_time": "4:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2953, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.380654103070182e-06, "epoch": 0.6653335961923001, "percentage": 66.54, "elapsed_time": "8:55:54", "remaining_time": "4:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2954, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.3789886757358916e-06, "epoch": 0.6655589038781086, "percentage": 66.56, "elapsed_time": "8:56:04", "remaining_time": "4:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2955, "total_steps": 4438, "loss": 0.1447, "learning_rate": 1.3773238708574054e-06, "epoch": 0.665784211563917, "percentage": 66.58, "elapsed_time": "8:56:15", "remaining_time": "4:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2956, "total_steps": 4438, "loss": 0.132, "learning_rate": 1.375659689359126e-06, "epoch": 0.6660095192497254, "percentage": 66.61, "elapsed_time": "8:56:26", "remaining_time": "4:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2957, "total_steps": 4438, "loss": 0.1349, "learning_rate": 1.3739961321651139e-06, "epoch": 0.6662348269355338, "percentage": 66.63, "elapsed_time": "8:56:37", "remaining_time": "4:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2958, "total_steps": 4438, "loss": 0.1261, "learning_rate": 1.3723332001990774e-06, "epoch": 0.6664601346213422, "percentage": 66.65, "elapsed_time": "8:56:48", "remaining_time": "4:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2959, "total_steps": 4438, "loss": 0.1148, "learning_rate": 1.3706708943843822e-06, "epoch": 0.6666854423071507, "percentage": 66.67, "elapsed_time": "8:56:57", "remaining_time": "4:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 4438, "loss": 0.1295, "learning_rate": 1.369009215644046e-06, "epoch": 0.6669107499929592, "percentage": 66.7, "elapsed_time": "8:57:08", "remaining_time": "4:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2961, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.3673481649007347e-06, "epoch": 0.6671360576787676, "percentage": 66.72, "elapsed_time": "8:57:19", "remaining_time": "4:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2962, "total_steps": 4438, "loss": 0.1212, "learning_rate": 1.36568774307677e-06, "epoch": 0.667361365364576, "percentage": 66.74, "elapsed_time": "8:57:29", "remaining_time": "4:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2963, "total_steps": 4438, "loss": 0.132, "learning_rate": 1.36402795109412e-06, "epoch": 0.6675866730503844, "percentage": 66.76, "elapsed_time": "8:57:40", "remaining_time": "4:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2964, "total_steps": 4438, "loss": 0.1253, "learning_rate": 1.362368789874407e-06, "epoch": 0.6678119807361929, "percentage": 66.79, "elapsed_time": "8:57:52", "remaining_time": "4:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2965, "total_steps": 4438, "loss": 0.1313, "learning_rate": 1.3607102603389016e-06, "epoch": 0.6680372884220013, "percentage": 66.81, "elapsed_time": "8:58:02", "remaining_time": "4:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2966, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.3590523634085218e-06, "epoch": 0.6682625961078097, "percentage": 66.83, "elapsed_time": "8:58:13", "remaining_time": "4:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2967, "total_steps": 4438, "loss": 0.1261, "learning_rate": 1.3573951000038376e-06, "epoch": 0.6684879037936181, "percentage": 66.85, "elapsed_time": "8:58:24", "remaining_time": "4:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2968, "total_steps": 4438, "loss": 0.1428, "learning_rate": 1.3557384710450644e-06, "epoch": 0.6687132114794266, "percentage": 66.88, "elapsed_time": "8:58:35", "remaining_time": "4:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2969, "total_steps": 4438, "loss": 0.1395, "learning_rate": 1.3540824774520678e-06, "epoch": 0.6689385191652351, "percentage": 66.9, "elapsed_time": "8:58:44", "remaining_time": "4:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 4438, "loss": 0.1306, "learning_rate": 1.3524271201443578e-06, "epoch": 0.6691638268510435, "percentage": 66.92, "elapsed_time": "8:58:55", "remaining_time": "4:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2971, "total_steps": 4438, "loss": 0.1474, "learning_rate": 1.3507724000410933e-06, "epoch": 0.6693891345368519, "percentage": 66.94, "elapsed_time": "8:59:05", "remaining_time": "4:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2972, "total_steps": 4438, "loss": 0.129, "learning_rate": 1.3491183180610807e-06, "epoch": 0.6696144422226603, "percentage": 66.97, "elapsed_time": "8:59:16", "remaining_time": "4:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2973, "total_steps": 4438, "loss": 0.1219, "learning_rate": 1.347464875122766e-06, "epoch": 0.6698397499084687, "percentage": 66.99, "elapsed_time": "8:59:28", "remaining_time": "4:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2974, "total_steps": 4438, "loss": 0.1206, "learning_rate": 1.3458120721442464e-06, "epoch": 0.6700650575942771, "percentage": 67.01, "elapsed_time": "8:59:38", "remaining_time": "4:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2975, "total_steps": 4438, "loss": 0.1254, "learning_rate": 1.3441599100432635e-06, "epoch": 0.6702903652800856, "percentage": 67.03, "elapsed_time": "8:59:48", "remaining_time": "4:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2976, "total_steps": 4438, "loss": 0.1294, "learning_rate": 1.3425083897371983e-06, "epoch": 0.6705156729658941, "percentage": 67.06, "elapsed_time": "9:00:00", "remaining_time": "4:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2977, "total_steps": 4438, "loss": 0.1341, "learning_rate": 1.3408575121430812e-06, "epoch": 0.6707409806517025, "percentage": 67.08, "elapsed_time": "9:00:11", "remaining_time": "4:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2978, "total_steps": 4438, "loss": 0.1329, "learning_rate": 1.3392072781775806e-06, "epoch": 0.6709662883375109, "percentage": 67.1, "elapsed_time": "9:00:21", "remaining_time": "4:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2979, "total_steps": 4438, "loss": 0.1219, "learning_rate": 1.337557688757012e-06, "epoch": 0.6711915960233193, "percentage": 67.12, "elapsed_time": "9:00:32", "remaining_time": "4:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.335908744797329e-06, "epoch": 0.6714169037091278, "percentage": 67.15, "elapsed_time": "9:00:43", "remaining_time": "4:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2981, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.3342604472141296e-06, "epoch": 0.6716422113949362, "percentage": 67.17, "elapsed_time": "9:00:54", "remaining_time": "4:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2982, "total_steps": 4438, "loss": 0.1419, "learning_rate": 1.3326127969226535e-06, "epoch": 0.6718675190807446, "percentage": 67.19, "elapsed_time": "9:01:05", "remaining_time": "4:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2983, "total_steps": 4438, "loss": 0.1315, "learning_rate": 1.3309657948377768e-06, "epoch": 0.672092826766553, "percentage": 67.21, "elapsed_time": "9:01:17", "remaining_time": "4:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2984, "total_steps": 4438, "loss": 0.1363, "learning_rate": 1.3293194418740207e-06, "epoch": 0.6723181344523615, "percentage": 67.24, "elapsed_time": "9:01:28", "remaining_time": "4:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2985, "total_steps": 4438, "loss": 0.1346, "learning_rate": 1.3276737389455416e-06, "epoch": 0.67254344213817, "percentage": 67.26, "elapsed_time": "9:01:39", "remaining_time": "4:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2986, "total_steps": 4438, "loss": 0.1294, "learning_rate": 1.3260286869661378e-06, "epoch": 0.6727687498239784, "percentage": 67.28, "elapsed_time": "9:01:50", "remaining_time": "4:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2987, "total_steps": 4438, "loss": 0.1286, "learning_rate": 1.3243842868492468e-06, "epoch": 0.6729940575097868, "percentage": 67.31, "elapsed_time": "9:02:02", "remaining_time": "4:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2988, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.32274053950794e-06, "epoch": 0.6732193651955952, "percentage": 67.33, "elapsed_time": "9:02:14", "remaining_time": "4:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2989, "total_steps": 4438, "loss": 0.1403, "learning_rate": 1.3210974458549318e-06, "epoch": 0.6734446728814036, "percentage": 67.35, "elapsed_time": "9:02:25", "remaining_time": "4:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 4438, "loss": 0.1347, "learning_rate": 1.3194550068025697e-06, "epoch": 0.6736699805672121, "percentage": 67.37, "elapsed_time": "9:02:35", "remaining_time": "4:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2991, "total_steps": 4438, "loss": 0.1313, "learning_rate": 1.3178132232628374e-06, "epoch": 0.6738952882530206, "percentage": 67.4, "elapsed_time": "9:02:46", "remaining_time": "4:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2992, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.3161720961473583e-06, "epoch": 0.674120595938829, "percentage": 67.42, "elapsed_time": "9:02:57", "remaining_time": "4:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2993, "total_steps": 4438, "loss": 0.123, "learning_rate": 1.3145316263673874e-06, "epoch": 0.6743459036246374, "percentage": 67.44, "elapsed_time": "9:03:06", "remaining_time": "4:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2994, "total_steps": 4438, "loss": 0.1402, "learning_rate": 1.3128918148338183e-06, "epoch": 0.6745712113104458, "percentage": 67.46, "elapsed_time": "9:03:15", "remaining_time": "4:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2995, "total_steps": 4438, "loss": 0.1424, "learning_rate": 1.3112526624571753e-06, "epoch": 0.6747965189962543, "percentage": 67.49, "elapsed_time": "9:03:27", "remaining_time": "4:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2996, "total_steps": 4438, "loss": 0.1413, "learning_rate": 1.3096141701476189e-06, "epoch": 0.6750218266820627, "percentage": 67.51, "elapsed_time": "9:03:37", "remaining_time": "4:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2997, "total_steps": 4438, "loss": 0.1431, "learning_rate": 1.307976338814945e-06, "epoch": 0.6752471343678711, "percentage": 67.53, "elapsed_time": "9:03:49", "remaining_time": "4:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2998, "total_steps": 4438, "loss": 0.1577, "learning_rate": 1.3063391693685773e-06, "epoch": 0.6754724420536795, "percentage": 67.55, "elapsed_time": "9:04:00", "remaining_time": "4:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2999, "total_steps": 4438, "loss": 0.1264, "learning_rate": 1.3047026627175774e-06, "epoch": 0.675697749739488, "percentage": 67.58, "elapsed_time": "9:04:09", "remaining_time": "4:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 4438, "loss": 0.1324, "learning_rate": 1.3030668197706347e-06, "epoch": 0.6759230574252965, "percentage": 67.6, "elapsed_time": "9:04:22", "remaining_time": "4:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 4438, "eval_loss": 0.13576775789260864, "epoch": 0.6759230574252965, "percentage": 67.6, "elapsed_time": "9:06:24", "remaining_time": "4:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3001, "total_steps": 4438, "loss": 0.1237, "learning_rate": 1.3014316414360732e-06, "epoch": 0.6761483651111049, "percentage": 67.62, "elapsed_time": "9:06:36", "remaining_time": "4:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3002, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.2997971286218448e-06, "epoch": 0.6763736727969133, "percentage": 67.64, "elapsed_time": "9:06:44", "remaining_time": "4:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3003, "total_steps": 4438, "loss": 0.131, "learning_rate": 1.2981632822355344e-06, "epoch": 0.6765989804827217, "percentage": 67.67, "elapsed_time": "9:06:55", "remaining_time": "4:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3004, "total_steps": 4438, "loss": 0.1322, "learning_rate": 1.2965301031843574e-06, "epoch": 0.6768242881685301, "percentage": 67.69, "elapsed_time": "9:07:06", "remaining_time": "4:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3005, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.294897592375155e-06, "epoch": 0.6770495958543385, "percentage": 67.71, "elapsed_time": "9:07:16", "remaining_time": "4:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3006, "total_steps": 4438, "loss": 0.1362, "learning_rate": 1.2932657507144014e-06, "epoch": 0.677274903540147, "percentage": 67.73, "elapsed_time": "9:07:26", "remaining_time": "4:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3007, "total_steps": 4438, "loss": 0.1349, "learning_rate": 1.2916345791081964e-06, "epoch": 0.6775002112259555, "percentage": 67.76, "elapsed_time": "9:07:36", "remaining_time": "4:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3008, "total_steps": 4438, "loss": 0.1358, "learning_rate": 1.2900040784622686e-06, "epoch": 0.6777255189117639, "percentage": 67.78, "elapsed_time": "9:07:47", "remaining_time": "4:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3009, "total_steps": 4438, "loss": 0.1271, "learning_rate": 1.2883742496819751e-06, "epoch": 0.6779508265975723, "percentage": 67.8, "elapsed_time": "9:07:58", "remaining_time": "4:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 4438, "loss": 0.134, "learning_rate": 1.286745093672298e-06, "epoch": 0.6781761342833807, "percentage": 67.82, "elapsed_time": "9:08:08", "remaining_time": "4:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3011, "total_steps": 4438, "loss": 0.1381, "learning_rate": 1.2851166113378471e-06, "epoch": 0.6784014419691892, "percentage": 67.85, "elapsed_time": "9:08:18", "remaining_time": "4:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3012, "total_steps": 4438, "loss": 0.1225, "learning_rate": 1.2834888035828597e-06, "epoch": 0.6786267496549976, "percentage": 67.87, "elapsed_time": "9:08:30", "remaining_time": "4:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3013, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.2818616713111945e-06, "epoch": 0.678852057340806, "percentage": 67.89, "elapsed_time": "9:08:41", "remaining_time": "4:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3014, "total_steps": 4438, "loss": 0.1278, "learning_rate": 1.2802352154263392e-06, "epoch": 0.6790773650266144, "percentage": 67.91, "elapsed_time": "9:08:51", "remaining_time": "4:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3015, "total_steps": 4438, "loss": 0.127, "learning_rate": 1.2786094368314023e-06, "epoch": 0.679302672712423, "percentage": 67.94, "elapsed_time": "9:09:02", "remaining_time": "4:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3016, "total_steps": 4438, "loss": 0.1448, "learning_rate": 1.2769843364291202e-06, "epoch": 0.6795279803982314, "percentage": 67.96, "elapsed_time": "9:09:13", "remaining_time": "4:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3017, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.2753599151218483e-06, "epoch": 0.6797532880840398, "percentage": 67.98, "elapsed_time": "9:09:25", "remaining_time": "4:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3018, "total_steps": 4438, "loss": 0.1192, "learning_rate": 1.2737361738115681e-06, "epoch": 0.6799785957698482, "percentage": 68.0, "elapsed_time": "9:09:35", "remaining_time": "4:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3019, "total_steps": 4438, "loss": 0.1357, "learning_rate": 1.2721131133998837e-06, "epoch": 0.6802039034556566, "percentage": 68.03, "elapsed_time": "9:09:46", "remaining_time": "4:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 4438, "loss": 0.1358, "learning_rate": 1.2704907347880185e-06, "epoch": 0.680429211141465, "percentage": 68.05, "elapsed_time": "9:09:57", "remaining_time": "4:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3021, "total_steps": 4438, "loss": 0.1462, "learning_rate": 1.2688690388768205e-06, "epoch": 0.6806545188272735, "percentage": 68.07, "elapsed_time": "9:10:07", "remaining_time": "4:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3022, "total_steps": 4438, "loss": 0.1376, "learning_rate": 1.2672480265667553e-06, "epoch": 0.6808798265130819, "percentage": 68.09, "elapsed_time": "9:10:17", "remaining_time": "4:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3023, "total_steps": 4438, "loss": 0.14, "learning_rate": 1.2656276987579118e-06, "epoch": 0.6811051341988904, "percentage": 68.12, "elapsed_time": "9:10:28", "remaining_time": "4:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3024, "total_steps": 4438, "loss": 0.1285, "learning_rate": 1.2640080563499977e-06, "epoch": 0.6813304418846988, "percentage": 68.14, "elapsed_time": "9:10:40", "remaining_time": "4:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3025, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.2623891002423383e-06, "epoch": 0.6815557495705072, "percentage": 68.16, "elapsed_time": "9:10:50", "remaining_time": "4:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3026, "total_steps": 4438, "loss": 0.1473, "learning_rate": 1.2607708313338818e-06, "epoch": 0.6817810572563157, "percentage": 68.18, "elapsed_time": "9:10:59", "remaining_time": "4:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3027, "total_steps": 4438, "loss": 0.1489, "learning_rate": 1.2591532505231906e-06, "epoch": 0.6820063649421241, "percentage": 68.21, "elapsed_time": "9:11:10", "remaining_time": "4:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3028, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.2575363587084486e-06, "epoch": 0.6822316726279325, "percentage": 68.23, "elapsed_time": "9:11:22", "remaining_time": "4:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3029, "total_steps": 4438, "loss": 0.1307, "learning_rate": 1.2559201567874554e-06, "epoch": 0.6824569803137409, "percentage": 68.25, "elapsed_time": "9:11:33", "remaining_time": "4:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 4438, "loss": 0.1388, "learning_rate": 1.2543046456576267e-06, "epoch": 0.6826822879995493, "percentage": 68.27, "elapsed_time": "9:11:44", "remaining_time": "4:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3031, "total_steps": 4438, "loss": 0.1262, "learning_rate": 1.252689826215997e-06, "epoch": 0.6829075956853579, "percentage": 68.3, "elapsed_time": "9:11:54", "remaining_time": "4:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3032, "total_steps": 4438, "loss": 0.1263, "learning_rate": 1.2510756993592138e-06, "epoch": 0.6831329033711663, "percentage": 68.32, "elapsed_time": "9:12:04", "remaining_time": "4:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3033, "total_steps": 4438, "loss": 0.1225, "learning_rate": 1.2494622659835421e-06, "epoch": 0.6833582110569747, "percentage": 68.34, "elapsed_time": "9:12:16", "remaining_time": "4:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3034, "total_steps": 4438, "loss": 0.1291, "learning_rate": 1.2478495269848626e-06, "epoch": 0.6835835187427831, "percentage": 68.36, "elapsed_time": "9:12:26", "remaining_time": "4:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3035, "total_steps": 4438, "loss": 0.14, "learning_rate": 1.246237483258667e-06, "epoch": 0.6838088264285915, "percentage": 68.39, "elapsed_time": "9:12:35", "remaining_time": "4:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3036, "total_steps": 4438, "loss": 0.1187, "learning_rate": 1.2446261357000655e-06, "epoch": 0.6840341341144, "percentage": 68.41, "elapsed_time": "9:12:46", "remaining_time": "4:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3037, "total_steps": 4438, "loss": 0.1272, "learning_rate": 1.243015485203777e-06, "epoch": 0.6842594418002084, "percentage": 68.43, "elapsed_time": "9:12:56", "remaining_time": "4:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3038, "total_steps": 4438, "loss": 0.14, "learning_rate": 1.2414055326641378e-06, "epoch": 0.6844847494860169, "percentage": 68.45, "elapsed_time": "9:13:07", "remaining_time": "4:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3039, "total_steps": 4438, "loss": 0.1235, "learning_rate": 1.2397962789750923e-06, "epoch": 0.6847100571718253, "percentage": 68.48, "elapsed_time": "9:13:18", "remaining_time": "4:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 4438, "loss": 0.1472, "learning_rate": 1.2381877250302002e-06, "epoch": 0.6849353648576337, "percentage": 68.5, "elapsed_time": "9:13:29", "remaining_time": "4:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3041, "total_steps": 4438, "loss": 0.1458, "learning_rate": 1.236579871722633e-06, "epoch": 0.6851606725434422, "percentage": 68.52, "elapsed_time": "9:13:39", "remaining_time": "4:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3042, "total_steps": 4438, "loss": 0.1483, "learning_rate": 1.2349727199451696e-06, "epoch": 0.6853859802292506, "percentage": 68.54, "elapsed_time": "9:13:50", "remaining_time": "4:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3043, "total_steps": 4438, "loss": 0.1313, "learning_rate": 1.233366270590202e-06, "epoch": 0.685611287915059, "percentage": 68.57, "elapsed_time": "9:14:00", "remaining_time": "4:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3044, "total_steps": 4438, "loss": 0.1287, "learning_rate": 1.2317605245497324e-06, "epoch": 0.6858365956008674, "percentage": 68.59, "elapsed_time": "9:14:10", "remaining_time": "4:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3045, "total_steps": 4438, "loss": 0.1344, "learning_rate": 1.2301554827153703e-06, "epoch": 0.6860619032866758, "percentage": 68.61, "elapsed_time": "9:14:20", "remaining_time": "4:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3046, "total_steps": 4438, "loss": 0.1459, "learning_rate": 1.2285511459783373e-06, "epoch": 0.6862872109724844, "percentage": 68.63, "elapsed_time": "9:14:30", "remaining_time": "4:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3047, "total_steps": 4438, "loss": 0.1203, "learning_rate": 1.2269475152294601e-06, "epoch": 0.6865125186582928, "percentage": 68.66, "elapsed_time": "9:14:40", "remaining_time": "4:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3048, "total_steps": 4438, "loss": 0.134, "learning_rate": 1.225344591359177e-06, "epoch": 0.6867378263441012, "percentage": 68.68, "elapsed_time": "9:14:50", "remaining_time": "4:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3049, "total_steps": 4438, "loss": 0.1394, "learning_rate": 1.2237423752575297e-06, "epoch": 0.6869631340299096, "percentage": 68.7, "elapsed_time": "9:15:01", "remaining_time": "4:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 4438, "loss": 0.1391, "learning_rate": 1.2221408678141702e-06, "epoch": 0.687188441715718, "percentage": 68.72, "elapsed_time": "9:15:13", "remaining_time": "4:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3051, "total_steps": 4438, "loss": 0.1418, "learning_rate": 1.220540069918357e-06, "epoch": 0.6874137494015264, "percentage": 68.75, "elapsed_time": "9:15:24", "remaining_time": "4:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3052, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.2189399824589513e-06, "epoch": 0.6876390570873349, "percentage": 68.77, "elapsed_time": "9:15:34", "remaining_time": "4:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3053, "total_steps": 4438, "loss": 0.1465, "learning_rate": 1.217340606324424e-06, "epoch": 0.6878643647731433, "percentage": 68.79, "elapsed_time": "9:15:45", "remaining_time": "4:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3054, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.2157419424028473e-06, "epoch": 0.6880896724589518, "percentage": 68.81, "elapsed_time": "9:15:57", "remaining_time": "4:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3055, "total_steps": 4438, "loss": 0.1349, "learning_rate": 1.2141439915819008e-06, "epoch": 0.6883149801447602, "percentage": 68.84, "elapsed_time": "9:16:07", "remaining_time": "4:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3056, "total_steps": 4438, "loss": 0.156, "learning_rate": 1.2125467547488676e-06, "epoch": 0.6885402878305686, "percentage": 68.86, "elapsed_time": "9:16:19", "remaining_time": "4:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3057, "total_steps": 4438, "loss": 0.1413, "learning_rate": 1.210950232790632e-06, "epoch": 0.6887655955163771, "percentage": 68.88, "elapsed_time": "9:16:30", "remaining_time": "4:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3058, "total_steps": 4438, "loss": 0.1361, "learning_rate": 1.2093544265936848e-06, "epoch": 0.6889909032021855, "percentage": 68.9, "elapsed_time": "9:16:41", "remaining_time": "4:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3059, "total_steps": 4438, "loss": 0.1325, "learning_rate": 1.2077593370441165e-06, "epoch": 0.6892162108879939, "percentage": 68.93, "elapsed_time": "9:16:51", "remaining_time": "4:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 4438, "loss": 0.1346, "learning_rate": 1.206164965027622e-06, "epoch": 0.6894415185738023, "percentage": 68.95, "elapsed_time": "9:17:02", "remaining_time": "4:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3061, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.204571311429496e-06, "epoch": 0.6896668262596107, "percentage": 68.97, "elapsed_time": "9:17:13", "remaining_time": "4:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3062, "total_steps": 4438, "loss": 0.1396, "learning_rate": 1.2029783771346344e-06, "epoch": 0.6898921339454193, "percentage": 69.0, "elapsed_time": "9:17:24", "remaining_time": "4:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3063, "total_steps": 4438, "loss": 0.1394, "learning_rate": 1.2013861630275353e-06, "epoch": 0.6901174416312277, "percentage": 69.02, "elapsed_time": "9:17:36", "remaining_time": "4:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3064, "total_steps": 4438, "loss": 0.1312, "learning_rate": 1.1997946699922946e-06, "epoch": 0.6903427493170361, "percentage": 69.04, "elapsed_time": "9:17:47", "remaining_time": "4:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3065, "total_steps": 4438, "loss": 0.1353, "learning_rate": 1.1982038989126096e-06, "epoch": 0.6905680570028445, "percentage": 69.06, "elapsed_time": "9:17:58", "remaining_time": "4:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3066, "total_steps": 4438, "loss": 0.1377, "learning_rate": 1.1966138506717776e-06, "epoch": 0.6907933646886529, "percentage": 69.09, "elapsed_time": "9:18:09", "remaining_time": "4:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3067, "total_steps": 4438, "loss": 0.14, "learning_rate": 1.195024526152691e-06, "epoch": 0.6910186723744614, "percentage": 69.11, "elapsed_time": "9:18:20", "remaining_time": "4:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3068, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.1934359262378443e-06, "epoch": 0.6912439800602698, "percentage": 69.13, "elapsed_time": "9:18:32", "remaining_time": "4:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3069, "total_steps": 4438, "loss": 0.1326, "learning_rate": 1.1918480518093259e-06, "epoch": 0.6914692877460782, "percentage": 69.15, "elapsed_time": "9:18:42", "remaining_time": "4:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 4438, "loss": 0.1141, "learning_rate": 1.190260903748825e-06, "epoch": 0.6916945954318867, "percentage": 69.18, "elapsed_time": "9:18:52", "remaining_time": "4:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3071, "total_steps": 4438, "loss": 0.1316, "learning_rate": 1.1886744829376243e-06, "epoch": 0.6919199031176951, "percentage": 69.2, "elapsed_time": "9:19:04", "remaining_time": "4:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3072, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.187088790256605e-06, "epoch": 0.6921452108035036, "percentage": 69.22, "elapsed_time": "9:19:15", "remaining_time": "4:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3073, "total_steps": 4438, "loss": 0.1528, "learning_rate": 1.185503826586244e-06, "epoch": 0.692370518489312, "percentage": 69.24, "elapsed_time": "9:19:26", "remaining_time": "4:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3074, "total_steps": 4438, "loss": 0.1328, "learning_rate": 1.1839195928066101e-06, "epoch": 0.6925958261751204, "percentage": 69.27, "elapsed_time": "9:19:35", "remaining_time": "4:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3075, "total_steps": 4438, "loss": 0.1526, "learning_rate": 1.1823360897973723e-06, "epoch": 0.6928211338609288, "percentage": 69.29, "elapsed_time": "9:19:47", "remaining_time": "4:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3076, "total_steps": 4438, "loss": 0.1266, "learning_rate": 1.1807533184377882e-06, "epoch": 0.6930464415467372, "percentage": 69.31, "elapsed_time": "9:19:58", "remaining_time": "4:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3077, "total_steps": 4438, "loss": 0.1164, "learning_rate": 1.1791712796067134e-06, "epoch": 0.6932717492325456, "percentage": 69.33, "elapsed_time": "9:20:07", "remaining_time": "4:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3078, "total_steps": 4438, "loss": 0.1359, "learning_rate": 1.1775899741825947e-06, "epoch": 0.6934970569183542, "percentage": 69.36, "elapsed_time": "9:20:18", "remaining_time": "4:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3079, "total_steps": 4438, "loss": 0.1373, "learning_rate": 1.176009403043471e-06, "epoch": 0.6937223646041626, "percentage": 69.38, "elapsed_time": "9:20:30", "remaining_time": "4:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 4438, "loss": 0.1386, "learning_rate": 1.1744295670669752e-06, "epoch": 0.693947672289971, "percentage": 69.4, "elapsed_time": "9:20:42", "remaining_time": "4:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3081, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.1728504671303326e-06, "epoch": 0.6941729799757794, "percentage": 69.42, "elapsed_time": "9:20:52", "remaining_time": "4:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3082, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.171272104110356e-06, "epoch": 0.6943982876615878, "percentage": 69.45, "elapsed_time": "9:21:03", "remaining_time": "4:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3083, "total_steps": 4438, "loss": 0.1338, "learning_rate": 1.1696944788834546e-06, "epoch": 0.6946235953473963, "percentage": 69.47, "elapsed_time": "9:21:12", "remaining_time": "4:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3084, "total_steps": 4438, "loss": 0.137, "learning_rate": 1.168117592325622e-06, "epoch": 0.6948489030332047, "percentage": 69.49, "elapsed_time": "9:21:23", "remaining_time": "4:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3085, "total_steps": 4438, "loss": 0.135, "learning_rate": 1.1665414453124468e-06, "epoch": 0.6950742107190131, "percentage": 69.51, "elapsed_time": "9:21:34", "remaining_time": "4:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3086, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.1649660387191027e-06, "epoch": 0.6952995184048216, "percentage": 69.54, "elapsed_time": "9:21:45", "remaining_time": "4:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3087, "total_steps": 4438, "loss": 0.1325, "learning_rate": 1.1633913734203552e-06, "epoch": 0.69552482609063, "percentage": 69.56, "elapsed_time": "9:21:56", "remaining_time": "4:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3088, "total_steps": 4438, "loss": 0.1278, "learning_rate": 1.1618174502905586e-06, "epoch": 0.6957501337764385, "percentage": 69.58, "elapsed_time": "9:22:07", "remaining_time": "4:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3089, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.1602442702036513e-06, "epoch": 0.6959754414622469, "percentage": 69.6, "elapsed_time": "9:22:16", "remaining_time": "4:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 4438, "loss": 0.1362, "learning_rate": 1.1586718340331634e-06, "epoch": 0.6962007491480553, "percentage": 69.63, "elapsed_time": "9:22:26", "remaining_time": "4:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3091, "total_steps": 4438, "loss": 0.1385, "learning_rate": 1.1571001426522088e-06, "epoch": 0.6964260568338637, "percentage": 69.65, "elapsed_time": "9:22:35", "remaining_time": "4:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3092, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.1555291969334907e-06, "epoch": 0.6966513645196721, "percentage": 69.67, "elapsed_time": "9:22:46", "remaining_time": "4:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3093, "total_steps": 4438, "loss": 0.1121, "learning_rate": 1.1539589977492946e-06, "epoch": 0.6968766722054807, "percentage": 69.69, "elapsed_time": "9:22:55", "remaining_time": "4:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3094, "total_steps": 4438, "loss": 0.1382, "learning_rate": 1.1523895459714948e-06, "epoch": 0.6971019798912891, "percentage": 69.72, "elapsed_time": "9:23:05", "remaining_time": "4:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3095, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.1508208424715511e-06, "epoch": 0.6973272875770975, "percentage": 69.74, "elapsed_time": "9:23:16", "remaining_time": "4:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3096, "total_steps": 4438, "loss": 0.1317, "learning_rate": 1.1492528881205027e-06, "epoch": 0.6975525952629059, "percentage": 69.76, "elapsed_time": "9:23:26", "remaining_time": "4:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3097, "total_steps": 4438, "loss": 0.1405, "learning_rate": 1.1476856837889774e-06, "epoch": 0.6977779029487143, "percentage": 69.78, "elapsed_time": "9:23:37", "remaining_time": "4:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3098, "total_steps": 4438, "loss": 0.1394, "learning_rate": 1.146119230347187e-06, "epoch": 0.6980032106345228, "percentage": 69.81, "elapsed_time": "9:23:47", "remaining_time": "4:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3099, "total_steps": 4438, "loss": 0.1301, "learning_rate": 1.1445535286649223e-06, "epoch": 0.6982285183203312, "percentage": 69.83, "elapsed_time": "9:23:57", "remaining_time": "4:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 4438, "loss": 0.1271, "learning_rate": 1.142988579611561e-06, "epoch": 0.6984538260061396, "percentage": 69.85, "elapsed_time": "9:24:08", "remaining_time": "4:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3101, "total_steps": 4438, "loss": 0.1309, "learning_rate": 1.1414243840560595e-06, "epoch": 0.6986791336919481, "percentage": 69.87, "elapsed_time": "9:24:18", "remaining_time": "4:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3102, "total_steps": 4438, "loss": 0.1397, "learning_rate": 1.1398609428669582e-06, "epoch": 0.6989044413777565, "percentage": 69.9, "elapsed_time": "9:24:29", "remaining_time": "4:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3103, "total_steps": 4438, "loss": 0.1155, "learning_rate": 1.1382982569123781e-06, "epoch": 0.699129749063565, "percentage": 69.92, "elapsed_time": "9:24:39", "remaining_time": "4:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3104, "total_steps": 4438, "loss": 0.1281, "learning_rate": 1.136736327060019e-06, "epoch": 0.6993550567493734, "percentage": 69.94, "elapsed_time": "9:24:48", "remaining_time": "4:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3105, "total_steps": 4438, "loss": 0.1415, "learning_rate": 1.1351751541771644e-06, "epoch": 0.6995803644351818, "percentage": 69.96, "elapsed_time": "9:24:59", "remaining_time": "4:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3106, "total_steps": 4438, "loss": 0.1341, "learning_rate": 1.133614739130673e-06, "epoch": 0.6998056721209902, "percentage": 69.99, "elapsed_time": "9:25:10", "remaining_time": "4:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3107, "total_steps": 4438, "loss": 0.1454, "learning_rate": 1.1320550827869875e-06, "epoch": 0.7000309798067986, "percentage": 70.01, "elapsed_time": "9:25:21", "remaining_time": "4:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3108, "total_steps": 4438, "loss": 0.1499, "learning_rate": 1.1304961860121246e-06, "epoch": 0.700256287492607, "percentage": 70.03, "elapsed_time": "9:25:32", "remaining_time": "4:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3109, "total_steps": 4438, "loss": 0.144, "learning_rate": 1.128938049671683e-06, "epoch": 0.7004815951784156, "percentage": 70.05, "elapsed_time": "9:25:44", "remaining_time": "4:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 4438, "loss": 0.1376, "learning_rate": 1.127380674630838e-06, "epoch": 0.700706902864224, "percentage": 70.08, "elapsed_time": "9:25:55", "remaining_time": "4:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3111, "total_steps": 4438, "loss": 0.1384, "learning_rate": 1.1258240617543407e-06, "epoch": 0.7009322105500324, "percentage": 70.1, "elapsed_time": "9:26:05", "remaining_time": "4:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3112, "total_steps": 4438, "loss": 0.1286, "learning_rate": 1.1242682119065217e-06, "epoch": 0.7011575182358408, "percentage": 70.12, "elapsed_time": "9:26:16", "remaining_time": "4:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3113, "total_steps": 4438, "loss": 0.1441, "learning_rate": 1.1227131259512857e-06, "epoch": 0.7013828259216492, "percentage": 70.14, "elapsed_time": "9:26:25", "remaining_time": "4:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3114, "total_steps": 4438, "loss": 0.1365, "learning_rate": 1.121158804752113e-06, "epoch": 0.7016081336074577, "percentage": 70.17, "elapsed_time": "9:26:35", "remaining_time": "4:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3115, "total_steps": 4438, "loss": 0.1384, "learning_rate": 1.119605249172062e-06, "epoch": 0.7018334412932661, "percentage": 70.19, "elapsed_time": "9:26:46", "remaining_time": "4:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3116, "total_steps": 4438, "loss": 0.1324, "learning_rate": 1.1180524600737624e-06, "epoch": 0.7020587489790745, "percentage": 70.21, "elapsed_time": "9:26:56", "remaining_time": "4:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3117, "total_steps": 4438, "loss": 0.1391, "learning_rate": 1.1165004383194218e-06, "epoch": 0.702284056664883, "percentage": 70.23, "elapsed_time": "9:27:06", "remaining_time": "4:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3118, "total_steps": 4438, "loss": 0.1332, "learning_rate": 1.1149491847708186e-06, "epoch": 0.7025093643506914, "percentage": 70.26, "elapsed_time": "9:27:17", "remaining_time": "4:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3119, "total_steps": 4438, "loss": 0.128, "learning_rate": 1.1133987002893062e-06, "epoch": 0.7027346720364999, "percentage": 70.28, "elapsed_time": "9:27:27", "remaining_time": "3:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 4438, "loss": 0.1308, "learning_rate": 1.1118489857358129e-06, "epoch": 0.7029599797223083, "percentage": 70.3, "elapsed_time": "9:27:37", "remaining_time": "3:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3121, "total_steps": 4438, "loss": 0.1303, "learning_rate": 1.1103000419708347e-06, "epoch": 0.7031852874081167, "percentage": 70.32, "elapsed_time": "9:27:48", "remaining_time": "3:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3122, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.1087518698544444e-06, "epoch": 0.7034105950939251, "percentage": 70.35, "elapsed_time": "9:27:59", "remaining_time": "3:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3123, "total_steps": 4438, "loss": 0.1462, "learning_rate": 1.1072044702462825e-06, "epoch": 0.7036359027797335, "percentage": 70.37, "elapsed_time": "9:28:10", "remaining_time": "3:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3124, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.1056578440055631e-06, "epoch": 0.703861210465542, "percentage": 70.39, "elapsed_time": "9:28:20", "remaining_time": "3:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3125, "total_steps": 4438, "loss": 0.1372, "learning_rate": 1.1041119919910715e-06, "epoch": 0.7040865181513505, "percentage": 70.41, "elapsed_time": "9:28:32", "remaining_time": "3:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3126, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.1025669150611594e-06, "epoch": 0.7043118258371589, "percentage": 70.44, "elapsed_time": "9:28:43", "remaining_time": "3:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3127, "total_steps": 4438, "loss": 0.1298, "learning_rate": 1.101022614073752e-06, "epoch": 0.7045371335229673, "percentage": 70.46, "elapsed_time": "9:28:53", "remaining_time": "3:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3128, "total_steps": 4438, "loss": 0.1385, "learning_rate": 1.0994790898863409e-06, "epoch": 0.7047624412087757, "percentage": 70.48, "elapsed_time": "9:29:04", "remaining_time": "3:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3129, "total_steps": 4438, "loss": 0.1297, "learning_rate": 1.0979363433559892e-06, "epoch": 0.7049877488945842, "percentage": 70.5, "elapsed_time": "9:29:16", "remaining_time": "3:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.0963943753393252e-06, "epoch": 0.7052130565803926, "percentage": 70.53, "elapsed_time": "9:29:25", "remaining_time": "3:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3131, "total_steps": 4438, "loss": 0.119, "learning_rate": 1.094853186692546e-06, "epoch": 0.705438364266201, "percentage": 70.55, "elapsed_time": "9:29:36", "remaining_time": "3:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3132, "total_steps": 4438, "loss": 0.1203, "learning_rate": 1.0933127782714175e-06, "epoch": 0.7056636719520094, "percentage": 70.57, "elapsed_time": "9:29:47", "remaining_time": "3:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3133, "total_steps": 4438, "loss": 0.1266, "learning_rate": 1.0917731509312696e-06, "epoch": 0.7058889796378179, "percentage": 70.59, "elapsed_time": "9:29:57", "remaining_time": "3:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3134, "total_steps": 4438, "loss": 0.1428, "learning_rate": 1.0902343055270006e-06, "epoch": 0.7061142873236264, "percentage": 70.62, "elapsed_time": "9:30:08", "remaining_time": "3:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3135, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.0886962429130754e-06, "epoch": 0.7063395950094348, "percentage": 70.64, "elapsed_time": "9:30:18", "remaining_time": "3:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3136, "total_steps": 4438, "loss": 0.1314, "learning_rate": 1.0871589639435204e-06, "epoch": 0.7065649026952432, "percentage": 70.66, "elapsed_time": "9:30:29", "remaining_time": "3:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3137, "total_steps": 4438, "loss": 0.1366, "learning_rate": 1.0856224694719313e-06, "epoch": 0.7067902103810516, "percentage": 70.68, "elapsed_time": "9:30:41", "remaining_time": "3:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3138, "total_steps": 4438, "loss": 0.1518, "learning_rate": 1.0840867603514648e-06, "epoch": 0.70701551806686, "percentage": 70.71, "elapsed_time": "9:30:51", "remaining_time": "3:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3139, "total_steps": 4438, "loss": 0.1446, "learning_rate": 1.0825518374348442e-06, "epoch": 0.7072408257526684, "percentage": 70.73, "elapsed_time": "9:31:02", "remaining_time": "3:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 4438, "loss": 0.1282, "learning_rate": 1.0810177015743536e-06, "epoch": 0.707466133438477, "percentage": 70.75, "elapsed_time": "9:31:12", "remaining_time": "3:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3141, "total_steps": 4438, "loss": 0.1348, "learning_rate": 1.079484353621842e-06, "epoch": 0.7076914411242854, "percentage": 70.78, "elapsed_time": "9:31:23", "remaining_time": "3:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3142, "total_steps": 4438, "loss": 0.1282, "learning_rate": 1.0779517944287216e-06, "epoch": 0.7079167488100938, "percentage": 70.8, "elapsed_time": "9:31:34", "remaining_time": "3:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3143, "total_steps": 4438, "loss": 0.114, "learning_rate": 1.0764200248459633e-06, "epoch": 0.7081420564959022, "percentage": 70.82, "elapsed_time": "9:31:44", "remaining_time": "3:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3144, "total_steps": 4438, "loss": 0.1252, "learning_rate": 1.0748890457241037e-06, "epoch": 0.7083673641817106, "percentage": 70.84, "elapsed_time": "9:31:54", "remaining_time": "3:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3145, "total_steps": 4438, "loss": 0.1383, "learning_rate": 1.0733588579132365e-06, "epoch": 0.7085926718675191, "percentage": 70.87, "elapsed_time": "9:32:06", "remaining_time": "3:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3146, "total_steps": 4438, "loss": 0.1332, "learning_rate": 1.0718294622630188e-06, "epoch": 0.7088179795533275, "percentage": 70.89, "elapsed_time": "9:32:18", "remaining_time": "3:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3147, "total_steps": 4438, "loss": 0.1215, "learning_rate": 1.0703008596226692e-06, "epoch": 0.7090432872391359, "percentage": 70.91, "elapsed_time": "9:32:29", "remaining_time": "3:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3148, "total_steps": 4438, "loss": 0.1429, "learning_rate": 1.0687730508409594e-06, "epoch": 0.7092685949249444, "percentage": 70.93, "elapsed_time": "9:32:41", "remaining_time": "3:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3149, "total_steps": 4438, "loss": 0.134, "learning_rate": 1.0672460367662271e-06, "epoch": 0.7094939026107528, "percentage": 70.96, "elapsed_time": "9:32:52", "remaining_time": "3:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 4438, "loss": 0.1352, "learning_rate": 1.065719818246367e-06, "epoch": 0.7097192102965613, "percentage": 70.98, "elapsed_time": "9:33:02", "remaining_time": "3:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3151, "total_steps": 4438, "loss": 0.1361, "learning_rate": 1.0641943961288298e-06, "epoch": 0.7099445179823697, "percentage": 71.0, "elapsed_time": "9:33:13", "remaining_time": "3:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3152, "total_steps": 4438, "loss": 0.1398, "learning_rate": 1.062669771260627e-06, "epoch": 0.7101698256681781, "percentage": 71.02, "elapsed_time": "9:33:25", "remaining_time": "3:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3153, "total_steps": 4438, "loss": 0.1285, "learning_rate": 1.0611459444883243e-06, "epoch": 0.7103951333539865, "percentage": 71.05, "elapsed_time": "9:33:36", "remaining_time": "3:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3154, "total_steps": 4438, "loss": 0.1395, "learning_rate": 1.0596229166580477e-06, "epoch": 0.7106204410397949, "percentage": 71.07, "elapsed_time": "9:33:46", "remaining_time": "3:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3155, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.0581006886154758e-06, "epoch": 0.7108457487256034, "percentage": 71.09, "elapsed_time": "9:33:57", "remaining_time": "3:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3156, "total_steps": 4438, "loss": 0.1385, "learning_rate": 1.0565792612058462e-06, "epoch": 0.7110710564114119, "percentage": 71.11, "elapsed_time": "9:34:08", "remaining_time": "3:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3157, "total_steps": 4438, "loss": 0.1349, "learning_rate": 1.0550586352739519e-06, "epoch": 0.7112963640972203, "percentage": 71.14, "elapsed_time": "9:34:19", "remaining_time": "3:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3158, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.0535388116641376e-06, "epoch": 0.7115216717830287, "percentage": 71.16, "elapsed_time": "9:34:31", "remaining_time": "3:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3159, "total_steps": 4438, "loss": 0.115, "learning_rate": 1.0520197912203067e-06, "epoch": 0.7117469794688371, "percentage": 71.18, "elapsed_time": "9:34:41", "remaining_time": "3:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 4438, "loss": 0.1431, "learning_rate": 1.050501574785913e-06, "epoch": 0.7119722871546456, "percentage": 71.2, "elapsed_time": "9:34:53", "remaining_time": "3:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3161, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.048984163203967e-06, "epoch": 0.712197594840454, "percentage": 71.23, "elapsed_time": "9:35:04", "remaining_time": "3:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3162, "total_steps": 4438, "loss": 0.1347, "learning_rate": 1.0474675573170293e-06, "epoch": 0.7124229025262624, "percentage": 71.25, "elapsed_time": "9:35:14", "remaining_time": "3:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3163, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.045951757967215e-06, "epoch": 0.7126482102120708, "percentage": 71.27, "elapsed_time": "9:35:25", "remaining_time": "3:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3164, "total_steps": 4438, "loss": 0.1406, "learning_rate": 1.0444367659961927e-06, "epoch": 0.7128735178978793, "percentage": 71.29, "elapsed_time": "9:35:35", "remaining_time": "3:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3165, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.0429225822451792e-06, "epoch": 0.7130988255836878, "percentage": 71.32, "elapsed_time": "9:35:46", "remaining_time": "3:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3166, "total_steps": 4438, "loss": 0.1371, "learning_rate": 1.041409207554944e-06, "epoch": 0.7133241332694962, "percentage": 71.34, "elapsed_time": "9:35:56", "remaining_time": "3:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3167, "total_steps": 4438, "loss": 0.129, "learning_rate": 1.0398966427658091e-06, "epoch": 0.7135494409553046, "percentage": 71.36, "elapsed_time": "9:36:07", "remaining_time": "3:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3168, "total_steps": 4438, "loss": 0.1435, "learning_rate": 1.0383848887176437e-06, "epoch": 0.713774748641113, "percentage": 71.38, "elapsed_time": "9:36:19", "remaining_time": "3:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3169, "total_steps": 4438, "loss": 0.1246, "learning_rate": 1.0368739462498704e-06, "epoch": 0.7140000563269214, "percentage": 71.41, "elapsed_time": "9:36:29", "remaining_time": "3:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 4438, "loss": 0.1339, "learning_rate": 1.035363816201457e-06, "epoch": 0.7142253640127298, "percentage": 71.43, "elapsed_time": "9:36:42", "remaining_time": "3:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3171, "total_steps": 4438, "loss": 0.1268, "learning_rate": 1.033854499410924e-06, "epoch": 0.7144506716985383, "percentage": 71.45, "elapsed_time": "9:36:51", "remaining_time": "3:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3172, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.032345996716339e-06, "epoch": 0.7146759793843468, "percentage": 71.47, "elapsed_time": "9:37:01", "remaining_time": "3:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3173, "total_steps": 4438, "loss": 0.1204, "learning_rate": 1.030838308955316e-06, "epoch": 0.7149012870701552, "percentage": 71.5, "elapsed_time": "9:37:12", "remaining_time": "3:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3174, "total_steps": 4438, "loss": 0.1446, "learning_rate": 1.0293314369650193e-06, "epoch": 0.7151265947559636, "percentage": 71.52, "elapsed_time": "9:37:23", "remaining_time": "3:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3175, "total_steps": 4438, "loss": 0.1137, "learning_rate": 1.027825381582157e-06, "epoch": 0.715351902441772, "percentage": 71.54, "elapsed_time": "9:37:33", "remaining_time": "3:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3176, "total_steps": 4438, "loss": 0.1334, "learning_rate": 1.0263201436429873e-06, "epoch": 0.7155772101275805, "percentage": 71.56, "elapsed_time": "9:37:45", "remaining_time": "3:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3177, "total_steps": 4438, "loss": 0.1249, "learning_rate": 1.0248157239833111e-06, "epoch": 0.7158025178133889, "percentage": 71.59, "elapsed_time": "9:37:56", "remaining_time": "3:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3178, "total_steps": 4438, "loss": 0.1351, "learning_rate": 1.0233121234384777e-06, "epoch": 0.7160278254991973, "percentage": 71.61, "elapsed_time": "9:38:05", "remaining_time": "3:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3179, "total_steps": 4438, "loss": 0.1407, "learning_rate": 1.0218093428433807e-06, "epoch": 0.7162531331850057, "percentage": 71.63, "elapsed_time": "9:38:17", "remaining_time": "3:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 4438, "loss": 0.1381, "learning_rate": 1.0203073830324566e-06, "epoch": 0.7164784408708142, "percentage": 71.65, "elapsed_time": "9:38:28", "remaining_time": "3:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3181, "total_steps": 4438, "loss": 0.1336, "learning_rate": 1.0188062448396897e-06, "epoch": 0.7167037485566227, "percentage": 71.68, "elapsed_time": "9:38:39", "remaining_time": "3:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3182, "total_steps": 4438, "loss": 0.1245, "learning_rate": 1.0173059290986048e-06, "epoch": 0.7169290562424311, "percentage": 71.7, "elapsed_time": "9:38:49", "remaining_time": "3:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3183, "total_steps": 4438, "loss": 0.14, "learning_rate": 1.015806436642271e-06, "epoch": 0.7171543639282395, "percentage": 71.72, "elapsed_time": "9:39:01", "remaining_time": "3:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3184, "total_steps": 4438, "loss": 0.1312, "learning_rate": 1.0143077683033017e-06, "epoch": 0.7173796716140479, "percentage": 71.74, "elapsed_time": "9:39:09", "remaining_time": "3:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3185, "total_steps": 4438, "loss": 0.1466, "learning_rate": 1.0128099249138502e-06, "epoch": 0.7176049792998563, "percentage": 71.77, "elapsed_time": "9:39:21", "remaining_time": "3:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3186, "total_steps": 4438, "loss": 0.1416, "learning_rate": 1.0113129073056149e-06, "epoch": 0.7178302869856648, "percentage": 71.79, "elapsed_time": "9:39:32", "remaining_time": "3:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3187, "total_steps": 4438, "loss": 0.1371, "learning_rate": 1.0098167163098319e-06, "epoch": 0.7180555946714733, "percentage": 71.81, "elapsed_time": "9:39:42", "remaining_time": "3:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3188, "total_steps": 4438, "loss": 0.1444, "learning_rate": 1.008321352757281e-06, "epoch": 0.7182809023572817, "percentage": 71.83, "elapsed_time": "9:39:53", "remaining_time": "3:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3189, "total_steps": 4438, "loss": 0.146, "learning_rate": 1.0068268174782833e-06, "epoch": 0.7185062100430901, "percentage": 71.86, "elapsed_time": "9:40:03", "remaining_time": "3:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 4438, "loss": 0.1305, "learning_rate": 1.0053331113026962e-06, "epoch": 0.7187315177288985, "percentage": 71.88, "elapsed_time": "9:40:14", "remaining_time": "3:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3191, "total_steps": 4438, "loss": 0.1288, "learning_rate": 1.0038402350599214e-06, "epoch": 0.718956825414707, "percentage": 71.9, "elapsed_time": "9:40:25", "remaining_time": "3:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3192, "total_steps": 4438, "loss": 0.1396, "learning_rate": 1.002348189578895e-06, "epoch": 0.7191821331005154, "percentage": 71.92, "elapsed_time": "9:40:37", "remaining_time": "3:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3193, "total_steps": 4438, "loss": 0.1246, "learning_rate": 1.0008569756880956e-06, "epoch": 0.7194074407863238, "percentage": 71.95, "elapsed_time": "9:40:46", "remaining_time": "3:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3194, "total_steps": 4438, "loss": 0.1299, "learning_rate": 9.993665942155395e-07, "epoch": 0.7196327484721322, "percentage": 71.97, "elapsed_time": "9:40:56", "remaining_time": "3:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3195, "total_steps": 4438, "loss": 0.1301, "learning_rate": 9.978770459887778e-07, "epoch": 0.7198580561579407, "percentage": 71.99, "elapsed_time": "9:41:07", "remaining_time": "3:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3196, "total_steps": 4438, "loss": 0.1445, "learning_rate": 9.963883318349039e-07, "epoch": 0.7200833638437492, "percentage": 72.01, "elapsed_time": "9:41:17", "remaining_time": "3:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3197, "total_steps": 4438, "loss": 0.1235, "learning_rate": 9.949004525805423e-07, "epoch": 0.7203086715295576, "percentage": 72.04, "elapsed_time": "9:41:28", "remaining_time": "3:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3198, "total_steps": 4438, "loss": 0.1074, "learning_rate": 9.934134090518593e-07, "epoch": 0.720533979215366, "percentage": 72.06, "elapsed_time": "9:41:38", "remaining_time": "3:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3199, "total_steps": 4438, "loss": 0.1336, "learning_rate": 9.919272020745529e-07, "epoch": 0.7207592869011744, "percentage": 72.08, "elapsed_time": "9:41:48", "remaining_time": "3:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 4438, "loss": 0.1298, "learning_rate": 9.904418324738605e-07, "epoch": 0.7209845945869828, "percentage": 72.1, "elapsed_time": "9:42:00", "remaining_time": "3:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3201, "total_steps": 4438, "loss": 0.1378, "learning_rate": 9.889573010745507e-07, "epoch": 0.7212099022727912, "percentage": 72.13, "elapsed_time": "9:42:10", "remaining_time": "3:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3202, "total_steps": 4438, "loss": 0.1281, "learning_rate": 9.874736087009285e-07, "epoch": 0.7214352099585997, "percentage": 72.15, "elapsed_time": "9:42:22", "remaining_time": "3:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3203, "total_steps": 4438, "loss": 0.1286, "learning_rate": 9.859907561768335e-07, "epoch": 0.7216605176444082, "percentage": 72.17, "elapsed_time": "9:42:32", "remaining_time": "3:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3204, "total_steps": 4438, "loss": 0.1239, "learning_rate": 9.84508744325639e-07, "epoch": 0.7218858253302166, "percentage": 72.19, "elapsed_time": "9:42:42", "remaining_time": "3:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3205, "total_steps": 4438, "loss": 0.1271, "learning_rate": 9.830275739702497e-07, "epoch": 0.722111133016025, "percentage": 72.22, "elapsed_time": "9:42:53", "remaining_time": "3:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3206, "total_steps": 4438, "loss": 0.1324, "learning_rate": 9.815472459331061e-07, "epoch": 0.7223364407018334, "percentage": 72.24, "elapsed_time": "9:43:04", "remaining_time": "3:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3207, "total_steps": 4438, "loss": 0.1261, "learning_rate": 9.800677610361768e-07, "epoch": 0.7225617483876419, "percentage": 72.26, "elapsed_time": "9:43:16", "remaining_time": "3:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3208, "total_steps": 4438, "loss": 0.118, "learning_rate": 9.785891201009667e-07, "epoch": 0.7227870560734503, "percentage": 72.28, "elapsed_time": "9:43:26", "remaining_time": "3:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3209, "total_steps": 4438, "loss": 0.1392, "learning_rate": 9.771113239485084e-07, "epoch": 0.7230123637592587, "percentage": 72.31, "elapsed_time": "9:43:37", "remaining_time": "3:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 4438, "loss": 0.1414, "learning_rate": 9.756343733993679e-07, "epoch": 0.7232376714450671, "percentage": 72.33, "elapsed_time": "9:43:47", "remaining_time": "3:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3211, "total_steps": 4438, "loss": 0.1277, "learning_rate": 9.741582692736412e-07, "epoch": 0.7234629791308756, "percentage": 72.35, "elapsed_time": "9:43:57", "remaining_time": "3:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3212, "total_steps": 4438, "loss": 0.1414, "learning_rate": 9.726830123909527e-07, "epoch": 0.7236882868166841, "percentage": 72.37, "elapsed_time": "9:44:06", "remaining_time": "3:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3213, "total_steps": 4438, "loss": 0.1326, "learning_rate": 9.71208603570459e-07, "epoch": 0.7239135945024925, "percentage": 72.4, "elapsed_time": "9:44:19", "remaining_time": "3:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3214, "total_steps": 4438, "loss": 0.1322, "learning_rate": 9.697350436308428e-07, "epoch": 0.7241389021883009, "percentage": 72.42, "elapsed_time": "9:44:30", "remaining_time": "3:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3215, "total_steps": 4438, "loss": 0.1243, "learning_rate": 9.68262333390318e-07, "epoch": 0.7243642098741093, "percentage": 72.44, "elapsed_time": "9:44:41", "remaining_time": "3:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3216, "total_steps": 4438, "loss": 0.1445, "learning_rate": 9.667904736666258e-07, "epoch": 0.7245895175599177, "percentage": 72.47, "elapsed_time": "9:44:53", "remaining_time": "3:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3217, "total_steps": 4438, "loss": 0.1253, "learning_rate": 9.653194652770343e-07, "epoch": 0.7248148252457262, "percentage": 72.49, "elapsed_time": "9:45:03", "remaining_time": "3:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3218, "total_steps": 4438, "loss": 0.1229, "learning_rate": 9.638493090383408e-07, "epoch": 0.7250401329315346, "percentage": 72.51, "elapsed_time": "9:45:15", "remaining_time": "3:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3219, "total_steps": 4438, "loss": 0.1329, "learning_rate": 9.623800057668675e-07, "epoch": 0.7252654406173431, "percentage": 72.53, "elapsed_time": "9:45:25", "remaining_time": "3:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 4438, "loss": 0.132, "learning_rate": 9.60911556278463e-07, "epoch": 0.7254907483031515, "percentage": 72.56, "elapsed_time": "9:45:37", "remaining_time": "3:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3221, "total_steps": 4438, "loss": 0.1293, "learning_rate": 9.594439613885044e-07, "epoch": 0.7257160559889599, "percentage": 72.58, "elapsed_time": "9:45:48", "remaining_time": "3:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3222, "total_steps": 4438, "loss": 0.1206, "learning_rate": 9.579772219118899e-07, "epoch": 0.7259413636747684, "percentage": 72.6, "elapsed_time": "9:45:59", "remaining_time": "3:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3223, "total_steps": 4438, "loss": 0.1332, "learning_rate": 9.565113386630482e-07, "epoch": 0.7261666713605768, "percentage": 72.62, "elapsed_time": "9:46:08", "remaining_time": "3:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3224, "total_steps": 4438, "loss": 0.1386, "learning_rate": 9.550463124559267e-07, "epoch": 0.7263919790463852, "percentage": 72.65, "elapsed_time": "9:46:19", "remaining_time": "3:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3225, "total_steps": 4438, "loss": 0.1369, "learning_rate": 9.535821441040017e-07, "epoch": 0.7266172867321936, "percentage": 72.67, "elapsed_time": "9:46:30", "remaining_time": "3:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3226, "total_steps": 4438, "loss": 0.1411, "learning_rate": 9.521188344202717e-07, "epoch": 0.726842594418002, "percentage": 72.69, "elapsed_time": "9:46:42", "remaining_time": "3:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3227, "total_steps": 4438, "loss": 0.1333, "learning_rate": 9.506563842172565e-07, "epoch": 0.7270679021038106, "percentage": 72.71, "elapsed_time": "9:46:52", "remaining_time": "3:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3228, "total_steps": 4438, "loss": 0.1347, "learning_rate": 9.491947943070015e-07, "epoch": 0.727293209789619, "percentage": 72.74, "elapsed_time": "9:47:02", "remaining_time": "3:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3229, "total_steps": 4438, "loss": 0.1278, "learning_rate": 9.477340655010717e-07, "epoch": 0.7275185174754274, "percentage": 72.76, "elapsed_time": "9:47:14", "remaining_time": "3:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 4438, "loss": 0.1394, "learning_rate": 9.462741986105573e-07, "epoch": 0.7277438251612358, "percentage": 72.78, "elapsed_time": "9:47:25", "remaining_time": "3:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3231, "total_steps": 4438, "loss": 0.1297, "learning_rate": 9.448151944460657e-07, "epoch": 0.7279691328470442, "percentage": 72.8, "elapsed_time": "9:47:36", "remaining_time": "3:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3232, "total_steps": 4438, "loss": 0.1188, "learning_rate": 9.433570538177289e-07, "epoch": 0.7281944405328526, "percentage": 72.83, "elapsed_time": "9:47:46", "remaining_time": "3:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3233, "total_steps": 4438, "loss": 0.1431, "learning_rate": 9.418997775351985e-07, "epoch": 0.7284197482186611, "percentage": 72.85, "elapsed_time": "9:47:58", "remaining_time": "3:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3234, "total_steps": 4438, "loss": 0.1358, "learning_rate": 9.404433664076442e-07, "epoch": 0.7286450559044696, "percentage": 72.87, "elapsed_time": "9:48:08", "remaining_time": "3:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3235, "total_steps": 4438, "loss": 0.1229, "learning_rate": 9.389878212437586e-07, "epoch": 0.728870363590278, "percentage": 72.89, "elapsed_time": "9:48:18", "remaining_time": "3:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3236, "total_steps": 4438, "loss": 0.1315, "learning_rate": 9.375331428517506e-07, "epoch": 0.7290956712760864, "percentage": 72.92, "elapsed_time": "9:48:29", "remaining_time": "3:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3237, "total_steps": 4438, "loss": 0.1388, "learning_rate": 9.360793320393483e-07, "epoch": 0.7293209789618949, "percentage": 72.94, "elapsed_time": "9:48:40", "remaining_time": "3:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3238, "total_steps": 4438, "loss": 0.1403, "learning_rate": 9.346263896138e-07, "epoch": 0.7295462866477033, "percentage": 72.96, "elapsed_time": "9:48:52", "remaining_time": "3:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3239, "total_steps": 4438, "loss": 0.1386, "learning_rate": 9.33174316381869e-07, "epoch": 0.7297715943335117, "percentage": 72.98, "elapsed_time": "9:49:00", "remaining_time": "3:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 4438, "loss": 0.1297, "learning_rate": 9.317231131498383e-07, "epoch": 0.7299969020193201, "percentage": 73.01, "elapsed_time": "9:49:12", "remaining_time": "3:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3241, "total_steps": 4438, "loss": 0.1446, "learning_rate": 9.302727807235079e-07, "epoch": 0.7302222097051285, "percentage": 73.03, "elapsed_time": "9:49:23", "remaining_time": "3:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3242, "total_steps": 4438, "loss": 0.1479, "learning_rate": 9.288233199081914e-07, "epoch": 0.730447517390937, "percentage": 73.05, "elapsed_time": "9:49:34", "remaining_time": "3:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3243, "total_steps": 4438, "loss": 0.141, "learning_rate": 9.273747315087223e-07, "epoch": 0.7306728250767455, "percentage": 73.07, "elapsed_time": "9:49:46", "remaining_time": "3:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3244, "total_steps": 4438, "loss": 0.1382, "learning_rate": 9.259270163294457e-07, "epoch": 0.7308981327625539, "percentage": 73.1, "elapsed_time": "9:49:56", "remaining_time": "3:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3245, "total_steps": 4438, "loss": 0.1222, "learning_rate": 9.244801751742258e-07, "epoch": 0.7311234404483623, "percentage": 73.12, "elapsed_time": "9:50:07", "remaining_time": "3:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3246, "total_steps": 4438, "loss": 0.136, "learning_rate": 9.230342088464381e-07, "epoch": 0.7313487481341707, "percentage": 73.14, "elapsed_time": "9:50:17", "remaining_time": "3:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3247, "total_steps": 4438, "loss": 0.1437, "learning_rate": 9.215891181489742e-07, "epoch": 0.7315740558199791, "percentage": 73.16, "elapsed_time": "9:50:29", "remaining_time": "3:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3248, "total_steps": 4438, "loss": 0.1425, "learning_rate": 9.201449038842403e-07, "epoch": 0.7317993635057876, "percentage": 73.19, "elapsed_time": "9:50:39", "remaining_time": "3:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3249, "total_steps": 4438, "loss": 0.1336, "learning_rate": 9.187015668541526e-07, "epoch": 0.732024671191596, "percentage": 73.21, "elapsed_time": "9:50:50", "remaining_time": "3:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 4438, "loss": 0.1347, "learning_rate": 9.172591078601448e-07, "epoch": 0.7322499788774045, "percentage": 73.23, "elapsed_time": "9:51:01", "remaining_time": "3:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3251, "total_steps": 4438, "loss": 0.1359, "learning_rate": 9.158175277031584e-07, "epoch": 0.7324752865632129, "percentage": 73.25, "elapsed_time": "9:51:10", "remaining_time": "3:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3252, "total_steps": 4438, "loss": 0.1398, "learning_rate": 9.143768271836506e-07, "epoch": 0.7327005942490213, "percentage": 73.28, "elapsed_time": "9:51:22", "remaining_time": "3:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3253, "total_steps": 4438, "loss": 0.1238, "learning_rate": 9.129370071015886e-07, "epoch": 0.7329259019348298, "percentage": 73.3, "elapsed_time": "9:51:32", "remaining_time": "3:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3254, "total_steps": 4438, "loss": 0.1185, "learning_rate": 9.114980682564492e-07, "epoch": 0.7331512096206382, "percentage": 73.32, "elapsed_time": "9:51:42", "remaining_time": "3:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3255, "total_steps": 4438, "loss": 0.1413, "learning_rate": 9.100600114472238e-07, "epoch": 0.7333765173064466, "percentage": 73.34, "elapsed_time": "9:51:51", "remaining_time": "3:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3256, "total_steps": 4438, "loss": 0.1372, "learning_rate": 9.086228374724096e-07, "epoch": 0.733601824992255, "percentage": 73.37, "elapsed_time": "9:52:00", "remaining_time": "3:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3257, "total_steps": 4438, "loss": 0.1391, "learning_rate": 9.071865471300168e-07, "epoch": 0.7338271326780634, "percentage": 73.39, "elapsed_time": "9:52:10", "remaining_time": "3:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3258, "total_steps": 4438, "loss": 0.1292, "learning_rate": 9.057511412175646e-07, "epoch": 0.734052440363872, "percentage": 73.41, "elapsed_time": "9:52:20", "remaining_time": "3:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3259, "total_steps": 4438, "loss": 0.1216, "learning_rate": 9.043166205320789e-07, "epoch": 0.7342777480496804, "percentage": 73.43, "elapsed_time": "9:52:29", "remaining_time": "3:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 4438, "loss": 0.135, "learning_rate": 9.028829858700974e-07, "epoch": 0.7345030557354888, "percentage": 73.46, "elapsed_time": "9:52:40", "remaining_time": "3:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3261, "total_steps": 4438, "loss": 0.1288, "learning_rate": 9.014502380276619e-07, "epoch": 0.7347283634212972, "percentage": 73.48, "elapsed_time": "9:52:51", "remaining_time": "3:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3262, "total_steps": 4438, "loss": 0.128, "learning_rate": 9.000183778003246e-07, "epoch": 0.7349536711071056, "percentage": 73.5, "elapsed_time": "9:53:02", "remaining_time": "3:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3263, "total_steps": 4438, "loss": 0.1353, "learning_rate": 8.985874059831456e-07, "epoch": 0.735178978792914, "percentage": 73.52, "elapsed_time": "9:53:14", "remaining_time": "3:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3264, "total_steps": 4438, "loss": 0.1345, "learning_rate": 8.971573233706881e-07, "epoch": 0.7354042864787225, "percentage": 73.55, "elapsed_time": "9:53:25", "remaining_time": "3:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3265, "total_steps": 4438, "loss": 0.1289, "learning_rate": 8.957281307570254e-07, "epoch": 0.7356295941645309, "percentage": 73.57, "elapsed_time": "9:53:34", "remaining_time": "3:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3266, "total_steps": 4438, "loss": 0.129, "learning_rate": 8.942998289357333e-07, "epoch": 0.7358549018503394, "percentage": 73.59, "elapsed_time": "9:53:44", "remaining_time": "3:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3267, "total_steps": 4438, "loss": 0.1216, "learning_rate": 8.928724186998961e-07, "epoch": 0.7360802095361478, "percentage": 73.61, "elapsed_time": "9:53:55", "remaining_time": "3:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3268, "total_steps": 4438, "loss": 0.1407, "learning_rate": 8.914459008421e-07, "epoch": 0.7363055172219563, "percentage": 73.64, "elapsed_time": "9:54:08", "remaining_time": "3:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3269, "total_steps": 4438, "loss": 0.1311, "learning_rate": 8.900202761544377e-07, "epoch": 0.7365308249077647, "percentage": 73.66, "elapsed_time": "9:54:18", "remaining_time": "3:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 4438, "loss": 0.1333, "learning_rate": 8.885955454285078e-07, "epoch": 0.7367561325935731, "percentage": 73.68, "elapsed_time": "9:54:29", "remaining_time": "3:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3271, "total_steps": 4438, "loss": 0.1275, "learning_rate": 8.871717094554058e-07, "epoch": 0.7369814402793815, "percentage": 73.7, "elapsed_time": "9:54:42", "remaining_time": "3:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3272, "total_steps": 4438, "loss": 0.118, "learning_rate": 8.857487690257374e-07, "epoch": 0.7372067479651899, "percentage": 73.73, "elapsed_time": "9:54:54", "remaining_time": "3:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3273, "total_steps": 4438, "loss": 0.1336, "learning_rate": 8.843267249296086e-07, "epoch": 0.7374320556509983, "percentage": 73.75, "elapsed_time": "9:55:05", "remaining_time": "3:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3274, "total_steps": 4438, "loss": 0.143, "learning_rate": 8.829055779566262e-07, "epoch": 0.7376573633368069, "percentage": 73.77, "elapsed_time": "9:55:16", "remaining_time": "3:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3275, "total_steps": 4438, "loss": 0.1346, "learning_rate": 8.814853288959016e-07, "epoch": 0.7378826710226153, "percentage": 73.79, "elapsed_time": "9:55:27", "remaining_time": "3:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3276, "total_steps": 4438, "loss": 0.1391, "learning_rate": 8.800659785360444e-07, "epoch": 0.7381079787084237, "percentage": 73.82, "elapsed_time": "9:55:36", "remaining_time": "3:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3277, "total_steps": 4438, "loss": 0.1277, "learning_rate": 8.786475276651688e-07, "epoch": 0.7383332863942321, "percentage": 73.84, "elapsed_time": "9:55:49", "remaining_time": "3:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3278, "total_steps": 4438, "loss": 0.1152, "learning_rate": 8.772299770708859e-07, "epoch": 0.7385585940800405, "percentage": 73.86, "elapsed_time": "9:55:59", "remaining_time": "3:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3279, "total_steps": 4438, "loss": 0.1374, "learning_rate": 8.758133275403097e-07, "epoch": 0.738783901765849, "percentage": 73.88, "elapsed_time": "9:56:10", "remaining_time": "3:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 4438, "loss": 0.1416, "learning_rate": 8.743975798600535e-07, "epoch": 0.7390092094516574, "percentage": 73.91, "elapsed_time": "9:56:21", "remaining_time": "3:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3281, "total_steps": 4438, "loss": 0.1418, "learning_rate": 8.729827348162278e-07, "epoch": 0.7392345171374658, "percentage": 73.93, "elapsed_time": "9:56:31", "remaining_time": "3:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3282, "total_steps": 4438, "loss": 0.1374, "learning_rate": 8.71568793194445e-07, "epoch": 0.7394598248232743, "percentage": 73.95, "elapsed_time": "9:56:42", "remaining_time": "3:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3283, "total_steps": 4438, "loss": 0.1148, "learning_rate": 8.701557557798121e-07, "epoch": 0.7396851325090827, "percentage": 73.97, "elapsed_time": "9:56:53", "remaining_time": "3:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3284, "total_steps": 4438, "loss": 0.1442, "learning_rate": 8.687436233569375e-07, "epoch": 0.7399104401948912, "percentage": 74.0, "elapsed_time": "9:57:04", "remaining_time": "3:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3285, "total_steps": 4438, "loss": 0.1294, "learning_rate": 8.673323967099259e-07, "epoch": 0.7401357478806996, "percentage": 74.02, "elapsed_time": "9:57:15", "remaining_time": "3:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3286, "total_steps": 4438, "loss": 0.1337, "learning_rate": 8.659220766223778e-07, "epoch": 0.740361055566508, "percentage": 74.04, "elapsed_time": "9:57:27", "remaining_time": "3:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3287, "total_steps": 4438, "loss": 0.1424, "learning_rate": 8.645126638773926e-07, "epoch": 0.7405863632523164, "percentage": 74.06, "elapsed_time": "9:57:37", "remaining_time": "3:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3288, "total_steps": 4438, "loss": 0.1185, "learning_rate": 8.631041592575643e-07, "epoch": 0.7408116709381248, "percentage": 74.09, "elapsed_time": "9:57:48", "remaining_time": "3:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3289, "total_steps": 4438, "loss": 0.1412, "learning_rate": 8.616965635449814e-07, "epoch": 0.7410369786239334, "percentage": 74.11, "elapsed_time": "9:57:59", "remaining_time": "3:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 4438, "loss": 0.1232, "learning_rate": 8.602898775212317e-07, "epoch": 0.7412622863097418, "percentage": 74.13, "elapsed_time": "9:58:10", "remaining_time": "3:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3291, "total_steps": 4438, "loss": 0.1327, "learning_rate": 8.588841019673938e-07, "epoch": 0.7414875939955502, "percentage": 74.16, "elapsed_time": "9:58:20", "remaining_time": "3:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3292, "total_steps": 4438, "loss": 0.1258, "learning_rate": 8.57479237664044e-07, "epoch": 0.7417129016813586, "percentage": 74.18, "elapsed_time": "9:58:30", "remaining_time": "3:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3293, "total_steps": 4438, "loss": 0.131, "learning_rate": 8.560752853912494e-07, "epoch": 0.741938209367167, "percentage": 74.2, "elapsed_time": "9:58:41", "remaining_time": "3:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3294, "total_steps": 4438, "loss": 0.1389, "learning_rate": 8.546722459285727e-07, "epoch": 0.7421635170529755, "percentage": 74.22, "elapsed_time": "9:58:52", "remaining_time": "3:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3295, "total_steps": 4438, "loss": 0.133, "learning_rate": 8.532701200550714e-07, "epoch": 0.7423888247387839, "percentage": 74.25, "elapsed_time": "9:59:04", "remaining_time": "3:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3296, "total_steps": 4438, "loss": 0.1308, "learning_rate": 8.518689085492909e-07, "epoch": 0.7426141324245923, "percentage": 74.27, "elapsed_time": "9:59:15", "remaining_time": "3:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3297, "total_steps": 4438, "loss": 0.1375, "learning_rate": 8.504686121892741e-07, "epoch": 0.7428394401104008, "percentage": 74.29, "elapsed_time": "9:59:25", "remaining_time": "3:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3298, "total_steps": 4438, "loss": 0.1272, "learning_rate": 8.490692317525514e-07, "epoch": 0.7430647477962092, "percentage": 74.31, "elapsed_time": "9:59:36", "remaining_time": "3:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3299, "total_steps": 4438, "loss": 0.135, "learning_rate": 8.476707680161486e-07, "epoch": 0.7432900554820177, "percentage": 74.34, "elapsed_time": "9:59:47", "remaining_time": "3:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 4438, "loss": 0.1281, "learning_rate": 8.462732217565783e-07, "epoch": 0.7435153631678261, "percentage": 74.36, "elapsed_time": "9:59:57", "remaining_time": "3:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3301, "total_steps": 4438, "loss": 0.1319, "learning_rate": 8.448765937498471e-07, "epoch": 0.7437406708536345, "percentage": 74.38, "elapsed_time": "10:00:09", "remaining_time": "3:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3302, "total_steps": 4438, "loss": 0.1333, "learning_rate": 8.434808847714512e-07, "epoch": 0.7439659785394429, "percentage": 74.4, "elapsed_time": "10:00:18", "remaining_time": "3:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3303, "total_steps": 4438, "loss": 0.1361, "learning_rate": 8.420860955963739e-07, "epoch": 0.7441912862252513, "percentage": 74.43, "elapsed_time": "10:00:30", "remaining_time": "3:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3304, "total_steps": 4438, "loss": 0.1464, "learning_rate": 8.406922269990917e-07, "epoch": 0.7444165939110597, "percentage": 74.45, "elapsed_time": "10:00:41", "remaining_time": "3:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3305, "total_steps": 4438, "loss": 0.1357, "learning_rate": 8.392992797535666e-07, "epoch": 0.7446419015968683, "percentage": 74.47, "elapsed_time": "10:00:51", "remaining_time": "3:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3306, "total_steps": 4438, "loss": 0.1236, "learning_rate": 8.379072546332498e-07, "epoch": 0.7448672092826767, "percentage": 74.49, "elapsed_time": "10:01:01", "remaining_time": "3:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3307, "total_steps": 4438, "loss": 0.129, "learning_rate": 8.365161524110823e-07, "epoch": 0.7450925169684851, "percentage": 74.52, "elapsed_time": "10:01:13", "remaining_time": "3:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3308, "total_steps": 4438, "loss": 0.1341, "learning_rate": 8.351259738594902e-07, "epoch": 0.7453178246542935, "percentage": 74.54, "elapsed_time": "10:01:23", "remaining_time": "3:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3309, "total_steps": 4438, "loss": 0.1317, "learning_rate": 8.337367197503881e-07, "epoch": 0.7455431323401019, "percentage": 74.56, "elapsed_time": "10:01:34", "remaining_time": "3:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 4438, "loss": 0.1309, "learning_rate": 8.323483908551783e-07, "epoch": 0.7457684400259104, "percentage": 74.58, "elapsed_time": "10:01:44", "remaining_time": "3:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3311, "total_steps": 4438, "loss": 0.1312, "learning_rate": 8.309609879447458e-07, "epoch": 0.7459937477117188, "percentage": 74.61, "elapsed_time": "10:01:55", "remaining_time": "3:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3312, "total_steps": 4438, "loss": 0.1198, "learning_rate": 8.29574511789466e-07, "epoch": 0.7462190553975272, "percentage": 74.63, "elapsed_time": "10:02:06", "remaining_time": "3:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3313, "total_steps": 4438, "loss": 0.1422, "learning_rate": 8.281889631591955e-07, "epoch": 0.7464443630833357, "percentage": 74.65, "elapsed_time": "10:02:17", "remaining_time": "3:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3314, "total_steps": 4438, "loss": 0.1462, "learning_rate": 8.268043428232798e-07, "epoch": 0.7466696707691441, "percentage": 74.67, "elapsed_time": "10:02:29", "remaining_time": "3:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3315, "total_steps": 4438, "loss": 0.1343, "learning_rate": 8.254206515505444e-07, "epoch": 0.7468949784549526, "percentage": 74.7, "elapsed_time": "10:02:39", "remaining_time": "3:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3316, "total_steps": 4438, "loss": 0.1256, "learning_rate": 8.240378901093035e-07, "epoch": 0.747120286140761, "percentage": 74.72, "elapsed_time": "10:02:50", "remaining_time": "3:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3317, "total_steps": 4438, "loss": 0.1242, "learning_rate": 8.22656059267353e-07, "epoch": 0.7473455938265694, "percentage": 74.74, "elapsed_time": "10:03:02", "remaining_time": "3:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3318, "total_steps": 4438, "loss": 0.1305, "learning_rate": 8.212751597919708e-07, "epoch": 0.7475709015123778, "percentage": 74.76, "elapsed_time": "10:03:13", "remaining_time": "3:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3319, "total_steps": 4438, "loss": 0.1359, "learning_rate": 8.198951924499202e-07, "epoch": 0.7477962091981862, "percentage": 74.79, "elapsed_time": "10:03:24", "remaining_time": "3:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 4438, "loss": 0.1238, "learning_rate": 8.185161580074444e-07, "epoch": 0.7480215168839947, "percentage": 74.81, "elapsed_time": "10:03:34", "remaining_time": "3:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3321, "total_steps": 4438, "loss": 0.1247, "learning_rate": 8.171380572302712e-07, "epoch": 0.7482468245698032, "percentage": 74.83, "elapsed_time": "10:03:44", "remaining_time": "3:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3322, "total_steps": 4438, "loss": 0.1406, "learning_rate": 8.157608908836071e-07, "epoch": 0.7484721322556116, "percentage": 74.85, "elapsed_time": "10:03:54", "remaining_time": "3:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3323, "total_steps": 4438, "loss": 0.1262, "learning_rate": 8.143846597321425e-07, "epoch": 0.74869743994142, "percentage": 74.88, "elapsed_time": "10:04:03", "remaining_time": "3:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3324, "total_steps": 4438, "loss": 0.1457, "learning_rate": 8.130093645400469e-07, "epoch": 0.7489227476272284, "percentage": 74.9, "elapsed_time": "10:04:13", "remaining_time": "3:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3325, "total_steps": 4438, "loss": 0.1284, "learning_rate": 8.116350060709696e-07, "epoch": 0.7491480553130369, "percentage": 74.92, "elapsed_time": "10:04:23", "remaining_time": "3:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3326, "total_steps": 4438, "loss": 0.1138, "learning_rate": 8.102615850880413e-07, "epoch": 0.7493733629988453, "percentage": 74.94, "elapsed_time": "10:04:33", "remaining_time": "3:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3327, "total_steps": 4438, "loss": 0.1175, "learning_rate": 8.088891023538722e-07, "epoch": 0.7495986706846537, "percentage": 74.97, "elapsed_time": "10:04:44", "remaining_time": "3:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3328, "total_steps": 4438, "loss": 0.1526, "learning_rate": 8.075175586305492e-07, "epoch": 0.7498239783704621, "percentage": 74.99, "elapsed_time": "10:04:55", "remaining_time": "3:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3329, "total_steps": 4438, "loss": 0.1461, "learning_rate": 8.061469546796413e-07, "epoch": 0.7500492860562706, "percentage": 75.01, "elapsed_time": "10:05:06", "remaining_time": "3:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 4438, "loss": 0.1325, "learning_rate": 8.047772912621921e-07, "epoch": 0.750274593742079, "percentage": 75.03, "elapsed_time": "10:05:17", "remaining_time": "3:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3331, "total_steps": 4438, "loss": 0.1411, "learning_rate": 8.034085691387253e-07, "epoch": 0.7504999014278875, "percentage": 75.06, "elapsed_time": "10:05:28", "remaining_time": "3:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3332, "total_steps": 4438, "loss": 0.1158, "learning_rate": 8.020407890692419e-07, "epoch": 0.7507252091136959, "percentage": 75.08, "elapsed_time": "10:05:38", "remaining_time": "3:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3333, "total_steps": 4438, "loss": 0.1275, "learning_rate": 8.006739518132179e-07, "epoch": 0.7509505167995043, "percentage": 75.1, "elapsed_time": "10:05:49", "remaining_time": "3:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3334, "total_steps": 4438, "loss": 0.1333, "learning_rate": 7.993080581296087e-07, "epoch": 0.7511758244853127, "percentage": 75.12, "elapsed_time": "10:05:58", "remaining_time": "3:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3335, "total_steps": 4438, "loss": 0.1246, "learning_rate": 7.979431087768424e-07, "epoch": 0.7514011321711211, "percentage": 75.15, "elapsed_time": "10:06:09", "remaining_time": "3:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3336, "total_steps": 4438, "loss": 0.1299, "learning_rate": 7.96579104512826e-07, "epoch": 0.7516264398569297, "percentage": 75.17, "elapsed_time": "10:06:20", "remaining_time": "3:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3337, "total_steps": 4438, "loss": 0.1267, "learning_rate": 7.95216046094939e-07, "epoch": 0.7518517475427381, "percentage": 75.19, "elapsed_time": "10:06:31", "remaining_time": "3:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3338, "total_steps": 4438, "loss": 0.1314, "learning_rate": 7.938539342800373e-07, "epoch": 0.7520770552285465, "percentage": 75.21, "elapsed_time": "10:06:40", "remaining_time": "3:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3339, "total_steps": 4438, "loss": 0.1245, "learning_rate": 7.92492769824452e-07, "epoch": 0.7523023629143549, "percentage": 75.24, "elapsed_time": "10:06:51", "remaining_time": "3:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 4438, "loss": 0.1275, "learning_rate": 7.911325534839851e-07, "epoch": 0.7525276706001633, "percentage": 75.26, "elapsed_time": "10:07:02", "remaining_time": "3:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3341, "total_steps": 4438, "loss": 0.1235, "learning_rate": 7.897732860139157e-07, "epoch": 0.7527529782859718, "percentage": 75.28, "elapsed_time": "10:07:12", "remaining_time": "3:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3342, "total_steps": 4438, "loss": 0.1228, "learning_rate": 7.884149681689937e-07, "epoch": 0.7529782859717802, "percentage": 75.3, "elapsed_time": "10:07:22", "remaining_time": "3:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3343, "total_steps": 4438, "loss": 0.127, "learning_rate": 7.870576007034414e-07, "epoch": 0.7532035936575886, "percentage": 75.33, "elapsed_time": "10:07:33", "remaining_time": "3:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3344, "total_steps": 4438, "loss": 0.1335, "learning_rate": 7.857011843709559e-07, "epoch": 0.7534289013433971, "percentage": 75.35, "elapsed_time": "10:07:45", "remaining_time": "3:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3345, "total_steps": 4438, "loss": 0.1454, "learning_rate": 7.843457199247034e-07, "epoch": 0.7536542090292055, "percentage": 75.37, "elapsed_time": "10:07:55", "remaining_time": "3:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3346, "total_steps": 4438, "loss": 0.1256, "learning_rate": 7.829912081173238e-07, "epoch": 0.753879516715014, "percentage": 75.39, "elapsed_time": "10:08:05", "remaining_time": "3:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3347, "total_steps": 4438, "loss": 0.1236, "learning_rate": 7.816376497009262e-07, "epoch": 0.7541048244008224, "percentage": 75.42, "elapsed_time": "10:08:17", "remaining_time": "3:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3348, "total_steps": 4438, "loss": 0.1316, "learning_rate": 7.802850454270913e-07, "epoch": 0.7543301320866308, "percentage": 75.44, "elapsed_time": "10:08:28", "remaining_time": "3:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3349, "total_steps": 4438, "loss": 0.1311, "learning_rate": 7.789333960468707e-07, "epoch": 0.7545554397724392, "percentage": 75.46, "elapsed_time": "10:08:40", "remaining_time": "3:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 4438, "loss": 0.1385, "learning_rate": 7.775827023107835e-07, "epoch": 0.7547807474582476, "percentage": 75.48, "elapsed_time": "10:08:51", "remaining_time": "3:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3351, "total_steps": 4438, "loss": 0.1205, "learning_rate": 7.762329649688214e-07, "epoch": 0.755006055144056, "percentage": 75.51, "elapsed_time": "10:09:00", "remaining_time": "3:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3352, "total_steps": 4438, "loss": 0.1163, "learning_rate": 7.74884184770441e-07, "epoch": 0.7552313628298646, "percentage": 75.53, "elapsed_time": "10:09:11", "remaining_time": "3:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3353, "total_steps": 4438, "loss": 0.1408, "learning_rate": 7.735363624645712e-07, "epoch": 0.755456670515673, "percentage": 75.55, "elapsed_time": "10:09:22", "remaining_time": "3:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3354, "total_steps": 4438, "loss": 0.1238, "learning_rate": 7.721894987996076e-07, "epoch": 0.7556819782014814, "percentage": 75.57, "elapsed_time": "10:09:33", "remaining_time": "3:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3355, "total_steps": 4438, "loss": 0.1266, "learning_rate": 7.708435945234124e-07, "epoch": 0.7559072858872898, "percentage": 75.6, "elapsed_time": "10:09:43", "remaining_time": "3:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3356, "total_steps": 4438, "loss": 0.1375, "learning_rate": 7.694986503833171e-07, "epoch": 0.7561325935730983, "percentage": 75.62, "elapsed_time": "10:09:54", "remaining_time": "3:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3357, "total_steps": 4438, "loss": 0.1443, "learning_rate": 7.681546671261181e-07, "epoch": 0.7563579012589067, "percentage": 75.64, "elapsed_time": "10:10:04", "remaining_time": "3:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3358, "total_steps": 4438, "loss": 0.1338, "learning_rate": 7.668116454980804e-07, "epoch": 0.7565832089447151, "percentage": 75.66, "elapsed_time": "10:10:13", "remaining_time": "3:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3359, "total_steps": 4438, "loss": 0.1402, "learning_rate": 7.654695862449327e-07, "epoch": 0.7568085166305235, "percentage": 75.69, "elapsed_time": "10:10:24", "remaining_time": "3:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 4438, "loss": 0.1131, "learning_rate": 7.641284901118703e-07, "epoch": 0.757033824316332, "percentage": 75.71, "elapsed_time": "10:10:34", "remaining_time": "3:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3361, "total_steps": 4438, "loss": 0.1373, "learning_rate": 7.627883578435555e-07, "epoch": 0.7572591320021405, "percentage": 75.73, "elapsed_time": "10:10:45", "remaining_time": "3:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3362, "total_steps": 4438, "loss": 0.1278, "learning_rate": 7.614491901841118e-07, "epoch": 0.7574844396879489, "percentage": 75.75, "elapsed_time": "10:10:54", "remaining_time": "3:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3363, "total_steps": 4438, "loss": 0.1287, "learning_rate": 7.601109878771301e-07, "epoch": 0.7577097473737573, "percentage": 75.78, "elapsed_time": "10:11:04", "remaining_time": "3:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3364, "total_steps": 4438, "loss": 0.1345, "learning_rate": 7.587737516656651e-07, "epoch": 0.7579350550595657, "percentage": 75.8, "elapsed_time": "10:11:16", "remaining_time": "3:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3365, "total_steps": 4438, "loss": 0.134, "learning_rate": 7.574374822922323e-07, "epoch": 0.7581603627453741, "percentage": 75.82, "elapsed_time": "10:11:27", "remaining_time": "3:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3366, "total_steps": 4438, "loss": 0.1169, "learning_rate": 7.561021804988141e-07, "epoch": 0.7583856704311825, "percentage": 75.84, "elapsed_time": "10:11:38", "remaining_time": "3:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3367, "total_steps": 4438, "loss": 0.1343, "learning_rate": 7.547678470268526e-07, "epoch": 0.758610978116991, "percentage": 75.87, "elapsed_time": "10:11:48", "remaining_time": "3:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3368, "total_steps": 4438, "loss": 0.1236, "learning_rate": 7.534344826172546e-07, "epoch": 0.7588362858027995, "percentage": 75.89, "elapsed_time": "10:11:59", "remaining_time": "3:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3369, "total_steps": 4438, "loss": 0.1342, "learning_rate": 7.52102088010386e-07, "epoch": 0.7590615934886079, "percentage": 75.91, "elapsed_time": "10:12:10", "remaining_time": "3:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 4438, "loss": 0.1069, "learning_rate": 7.507706639460768e-07, "epoch": 0.7592869011744163, "percentage": 75.94, "elapsed_time": "10:12:22", "remaining_time": "3:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3371, "total_steps": 4438, "loss": 0.1421, "learning_rate": 7.494402111636179e-07, "epoch": 0.7595122088602247, "percentage": 75.96, "elapsed_time": "10:12:33", "remaining_time": "3:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3372, "total_steps": 4438, "loss": 0.1268, "learning_rate": 7.481107304017588e-07, "epoch": 0.7597375165460332, "percentage": 75.98, "elapsed_time": "10:12:42", "remaining_time": "3:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3373, "total_steps": 4438, "loss": 0.1296, "learning_rate": 7.467822223987117e-07, "epoch": 0.7599628242318416, "percentage": 76.0, "elapsed_time": "10:12:52", "remaining_time": "3:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3374, "total_steps": 4438, "loss": 0.1232, "learning_rate": 7.454546878921465e-07, "epoch": 0.76018813191765, "percentage": 76.03, "elapsed_time": "10:13:01", "remaining_time": "3:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3375, "total_steps": 4438, "loss": 0.1189, "learning_rate": 7.441281276191939e-07, "epoch": 0.7604134396034584, "percentage": 76.05, "elapsed_time": "10:13:12", "remaining_time": "3:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3376, "total_steps": 4438, "loss": 0.1203, "learning_rate": 7.428025423164456e-07, "epoch": 0.760638747289267, "percentage": 76.07, "elapsed_time": "10:13:21", "remaining_time": "3:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3377, "total_steps": 4438, "loss": 0.1395, "learning_rate": 7.414779327199461e-07, "epoch": 0.7608640549750754, "percentage": 76.09, "elapsed_time": "10:13:31", "remaining_time": "3:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3378, "total_steps": 4438, "loss": 0.1362, "learning_rate": 7.401542995652033e-07, "epoch": 0.7610893626608838, "percentage": 76.12, "elapsed_time": "10:13:41", "remaining_time": "3:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3379, "total_steps": 4438, "loss": 0.1309, "learning_rate": 7.388316435871825e-07, "epoch": 0.7613146703466922, "percentage": 76.14, "elapsed_time": "10:13:51", "remaining_time": "3:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 4438, "loss": 0.1235, "learning_rate": 7.375099655203033e-07, "epoch": 0.7615399780325006, "percentage": 76.16, "elapsed_time": "10:14:02", "remaining_time": "3:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3381, "total_steps": 4438, "loss": 0.1165, "learning_rate": 7.361892660984459e-07, "epoch": 0.761765285718309, "percentage": 76.18, "elapsed_time": "10:14:12", "remaining_time": "3:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3382, "total_steps": 4438, "loss": 0.121, "learning_rate": 7.348695460549443e-07, "epoch": 0.7619905934041175, "percentage": 76.21, "elapsed_time": "10:14:22", "remaining_time": "3:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3383, "total_steps": 4438, "loss": 0.1297, "learning_rate": 7.335508061225907e-07, "epoch": 0.762215901089926, "percentage": 76.23, "elapsed_time": "10:14:33", "remaining_time": "3:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3384, "total_steps": 4438, "loss": 0.1325, "learning_rate": 7.322330470336314e-07, "epoch": 0.7624412087757344, "percentage": 76.25, "elapsed_time": "10:14:43", "remaining_time": "3:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3385, "total_steps": 4438, "loss": 0.1262, "learning_rate": 7.309162695197692e-07, "epoch": 0.7626665164615428, "percentage": 76.27, "elapsed_time": "10:14:53", "remaining_time": "3:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3386, "total_steps": 4438, "loss": 0.1303, "learning_rate": 7.296004743121627e-07, "epoch": 0.7628918241473512, "percentage": 76.3, "elapsed_time": "10:15:02", "remaining_time": "3:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3387, "total_steps": 4438, "loss": 0.1224, "learning_rate": 7.28285662141422e-07, "epoch": 0.7631171318331597, "percentage": 76.32, "elapsed_time": "10:15:14", "remaining_time": "3:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3388, "total_steps": 4438, "loss": 0.1373, "learning_rate": 7.26971833737615e-07, "epoch": 0.7633424395189681, "percentage": 76.34, "elapsed_time": "10:15:25", "remaining_time": "3:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3389, "total_steps": 4438, "loss": 0.1291, "learning_rate": 7.256589898302599e-07, "epoch": 0.7635677472047765, "percentage": 76.36, "elapsed_time": "10:15:37", "remaining_time": "3:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 4438, "loss": 0.1234, "learning_rate": 7.243471311483322e-07, "epoch": 0.7637930548905849, "percentage": 76.39, "elapsed_time": "10:15:48", "remaining_time": "3:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3391, "total_steps": 4438, "loss": 0.1242, "learning_rate": 7.230362584202557e-07, "epoch": 0.7640183625763934, "percentage": 76.41, "elapsed_time": "10:15:58", "remaining_time": "3:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3392, "total_steps": 4438, "loss": 0.1275, "learning_rate": 7.217263723739107e-07, "epoch": 0.7642436702622019, "percentage": 76.43, "elapsed_time": "10:16:08", "remaining_time": "3:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3393, "total_steps": 4438, "loss": 0.1229, "learning_rate": 7.204174737366293e-07, "epoch": 0.7644689779480103, "percentage": 76.45, "elapsed_time": "10:16:16", "remaining_time": "3:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3394, "total_steps": 4438, "loss": 0.1261, "learning_rate": 7.191095632351908e-07, "epoch": 0.7646942856338187, "percentage": 76.48, "elapsed_time": "10:16:27", "remaining_time": "3:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3395, "total_steps": 4438, "loss": 0.1353, "learning_rate": 7.178026415958311e-07, "epoch": 0.7649195933196271, "percentage": 76.5, "elapsed_time": "10:16:39", "remaining_time": "3:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3396, "total_steps": 4438, "loss": 0.144, "learning_rate": 7.164967095442357e-07, "epoch": 0.7651449010054355, "percentage": 76.52, "elapsed_time": "10:16:49", "remaining_time": "3:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3397, "total_steps": 4438, "loss": 0.1359, "learning_rate": 7.151917678055384e-07, "epoch": 0.765370208691244, "percentage": 76.54, "elapsed_time": "10:17:00", "remaining_time": "3:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3398, "total_steps": 4438, "loss": 0.1259, "learning_rate": 7.138878171043262e-07, "epoch": 0.7655955163770524, "percentage": 76.57, "elapsed_time": "10:17:12", "remaining_time": "3:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3399, "total_steps": 4438, "loss": 0.1379, "learning_rate": 7.125848581646327e-07, "epoch": 0.7658208240628609, "percentage": 76.59, "elapsed_time": "10:17:24", "remaining_time": "3:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 4438, "loss": 0.1209, "learning_rate": 7.112828917099438e-07, "epoch": 0.7660461317486693, "percentage": 76.61, "elapsed_time": "10:17:35", "remaining_time": "3:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3401, "total_steps": 4438, "loss": 0.1266, "learning_rate": 7.099819184631929e-07, "epoch": 0.7662714394344777, "percentage": 76.63, "elapsed_time": "10:17:48", "remaining_time": "3:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 4438, "loss": 0.1276, "learning_rate": 7.086819391467612e-07, "epoch": 0.7664967471202861, "percentage": 76.66, "elapsed_time": "10:18:00", "remaining_time": "3:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3403, "total_steps": 4438, "loss": 0.1317, "learning_rate": 7.073829544824795e-07, "epoch": 0.7667220548060946, "percentage": 76.68, "elapsed_time": "10:18:10", "remaining_time": "3:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3404, "total_steps": 4438, "loss": 0.1271, "learning_rate": 7.060849651916244e-07, "epoch": 0.766947362491903, "percentage": 76.7, "elapsed_time": "10:18:21", "remaining_time": "3:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3405, "total_steps": 4438, "loss": 0.126, "learning_rate": 7.047879719949227e-07, "epoch": 0.7671726701777114, "percentage": 76.72, "elapsed_time": "10:18:32", "remaining_time": "3:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3406, "total_steps": 4438, "loss": 0.1253, "learning_rate": 7.034919756125447e-07, "epoch": 0.7673979778635198, "percentage": 76.75, "elapsed_time": "10:18:42", "remaining_time": "3:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3407, "total_steps": 4438, "loss": 0.1261, "learning_rate": 7.021969767641096e-07, "epoch": 0.7676232855493283, "percentage": 76.77, "elapsed_time": "10:18:54", "remaining_time": "3:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3408, "total_steps": 4438, "loss": 0.1352, "learning_rate": 7.009029761686825e-07, "epoch": 0.7678485932351368, "percentage": 76.79, "elapsed_time": "10:19:03", "remaining_time": "3:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3409, "total_steps": 4438, "loss": 0.1252, "learning_rate": 6.996099745447726e-07, "epoch": 0.7680739009209452, "percentage": 76.81, "elapsed_time": "10:19:14", "remaining_time": "3:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 4438, "loss": 0.1412, "learning_rate": 6.98317972610337e-07, "epoch": 0.7682992086067536, "percentage": 76.84, "elapsed_time": "10:19:24", "remaining_time": "3:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3411, "total_steps": 4438, "loss": 0.1178, "learning_rate": 6.970269710827754e-07, "epoch": 0.768524516292562, "percentage": 76.86, "elapsed_time": "10:19:36", "remaining_time": "3:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3412, "total_steps": 4438, "loss": 0.1257, "learning_rate": 6.957369706789319e-07, "epoch": 0.7687498239783704, "percentage": 76.88, "elapsed_time": "10:19:47", "remaining_time": "3:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3413, "total_steps": 4438, "loss": 0.1268, "learning_rate": 6.944479721150971e-07, "epoch": 0.7689751316641789, "percentage": 76.9, "elapsed_time": "10:19:56", "remaining_time": "3:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3414, "total_steps": 4438, "loss": 0.1396, "learning_rate": 6.931599761070027e-07, "epoch": 0.7692004393499873, "percentage": 76.93, "elapsed_time": "10:20:07", "remaining_time": "3:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3415, "total_steps": 4438, "loss": 0.1369, "learning_rate": 6.91872983369826e-07, "epoch": 0.7694257470357958, "percentage": 76.95, "elapsed_time": "10:20:17", "remaining_time": "3:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3416, "total_steps": 4438, "loss": 0.1372, "learning_rate": 6.905869946181848e-07, "epoch": 0.7696510547216042, "percentage": 76.97, "elapsed_time": "10:20:28", "remaining_time": "3:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3417, "total_steps": 4438, "loss": 0.1249, "learning_rate": 6.893020105661416e-07, "epoch": 0.7698763624074126, "percentage": 76.99, "elapsed_time": "10:20:40", "remaining_time": "3:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3418, "total_steps": 4438, "loss": 0.1296, "learning_rate": 6.880180319272006e-07, "epoch": 0.7701016700932211, "percentage": 77.02, "elapsed_time": "10:20:49", "remaining_time": "3:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3419, "total_steps": 4438, "loss": 0.1411, "learning_rate": 6.867350594143058e-07, "epoch": 0.7703269777790295, "percentage": 77.04, "elapsed_time": "10:21:00", "remaining_time": "3:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 4438, "loss": 0.1313, "learning_rate": 6.854530937398459e-07, "epoch": 0.7705522854648379, "percentage": 77.06, "elapsed_time": "10:21:10", "remaining_time": "3:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3421, "total_steps": 4438, "loss": 0.1339, "learning_rate": 6.841721356156466e-07, "epoch": 0.7707775931506463, "percentage": 77.08, "elapsed_time": "10:21:20", "remaining_time": "3:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3422, "total_steps": 4438, "loss": 0.1205, "learning_rate": 6.828921857529774e-07, "epoch": 0.7710029008364547, "percentage": 77.11, "elapsed_time": "10:21:30", "remaining_time": "3:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3423, "total_steps": 4438, "loss": 0.1258, "learning_rate": 6.816132448625474e-07, "epoch": 0.7712282085222633, "percentage": 77.13, "elapsed_time": "10:21:40", "remaining_time": "3:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3424, "total_steps": 4438, "loss": 0.1238, "learning_rate": 6.803353136545033e-07, "epoch": 0.7714535162080717, "percentage": 77.15, "elapsed_time": "10:21:50", "remaining_time": "3:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3425, "total_steps": 4438, "loss": 0.1357, "learning_rate": 6.790583928384339e-07, "epoch": 0.7716788238938801, "percentage": 77.17, "elapsed_time": "10:22:02", "remaining_time": "3:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3426, "total_steps": 4438, "loss": 0.1404, "learning_rate": 6.777824831233645e-07, "epoch": 0.7719041315796885, "percentage": 77.2, "elapsed_time": "10:22:14", "remaining_time": "3:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3427, "total_steps": 4438, "loss": 0.1299, "learning_rate": 6.765075852177619e-07, "epoch": 0.7721294392654969, "percentage": 77.22, "elapsed_time": "10:22:24", "remaining_time": "3:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3428, "total_steps": 4438, "loss": 0.1308, "learning_rate": 6.752336998295281e-07, "epoch": 0.7723547469513053, "percentage": 77.24, "elapsed_time": "10:22:35", "remaining_time": "3:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3429, "total_steps": 4438, "loss": 0.1297, "learning_rate": 6.739608276660037e-07, "epoch": 0.7725800546371138, "percentage": 77.26, "elapsed_time": "10:22:46", "remaining_time": "3:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 4438, "loss": 0.1289, "learning_rate": 6.726889694339689e-07, "epoch": 0.7728053623229223, "percentage": 77.29, "elapsed_time": "10:22:57", "remaining_time": "3:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3431, "total_steps": 4438, "loss": 0.1463, "learning_rate": 6.714181258396371e-07, "epoch": 0.7730306700087307, "percentage": 77.31, "elapsed_time": "10:23:09", "remaining_time": "3:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3432, "total_steps": 4438, "loss": 0.1447, "learning_rate": 6.701482975886617e-07, "epoch": 0.7732559776945391, "percentage": 77.33, "elapsed_time": "10:23:19", "remaining_time": "3:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3433, "total_steps": 4438, "loss": 0.1383, "learning_rate": 6.688794853861316e-07, "epoch": 0.7734812853803475, "percentage": 77.35, "elapsed_time": "10:23:31", "remaining_time": "3:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3434, "total_steps": 4438, "loss": 0.1355, "learning_rate": 6.676116899365692e-07, "epoch": 0.773706593066156, "percentage": 77.38, "elapsed_time": "10:23:43", "remaining_time": "3:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3435, "total_steps": 4438, "loss": 0.1189, "learning_rate": 6.663449119439358e-07, "epoch": 0.7739319007519644, "percentage": 77.4, "elapsed_time": "10:23:52", "remaining_time": "3:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3436, "total_steps": 4438, "loss": 0.1214, "learning_rate": 6.650791521116243e-07, "epoch": 0.7741572084377728, "percentage": 77.42, "elapsed_time": "10:24:02", "remaining_time": "3:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3437, "total_steps": 4438, "loss": 0.1313, "learning_rate": 6.638144111424655e-07, "epoch": 0.7743825161235812, "percentage": 77.44, "elapsed_time": "10:24:13", "remaining_time": "3:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3438, "total_steps": 4438, "loss": 0.1212, "learning_rate": 6.625506897387215e-07, "epoch": 0.7746078238093898, "percentage": 77.47, "elapsed_time": "10:24:23", "remaining_time": "3:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3439, "total_steps": 4438, "loss": 0.1351, "learning_rate": 6.612879886020907e-07, "epoch": 0.7748331314951982, "percentage": 77.49, "elapsed_time": "10:24:35", "remaining_time": "3:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 4438, "loss": 0.1269, "learning_rate": 6.600263084337041e-07, "epoch": 0.7750584391810066, "percentage": 77.51, "elapsed_time": "10:24:46", "remaining_time": "3:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3441, "total_steps": 4438, "loss": 0.1324, "learning_rate": 6.587656499341247e-07, "epoch": 0.775283746866815, "percentage": 77.53, "elapsed_time": "10:24:55", "remaining_time": "3:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3442, "total_steps": 4438, "loss": 0.1236, "learning_rate": 6.575060138033504e-07, "epoch": 0.7755090545526234, "percentage": 77.56, "elapsed_time": "10:25:05", "remaining_time": "3:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3443, "total_steps": 4438, "loss": 0.1269, "learning_rate": 6.562474007408087e-07, "epoch": 0.7757343622384318, "percentage": 77.58, "elapsed_time": "10:25:16", "remaining_time": "3:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3444, "total_steps": 4438, "loss": 0.1236, "learning_rate": 6.549898114453615e-07, "epoch": 0.7759596699242403, "percentage": 77.6, "elapsed_time": "10:25:27", "remaining_time": "3:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3445, "total_steps": 4438, "loss": 0.1312, "learning_rate": 6.537332466153018e-07, "epoch": 0.7761849776100487, "percentage": 77.63, "elapsed_time": "10:25:37", "remaining_time": "3:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3446, "total_steps": 4438, "loss": 0.1271, "learning_rate": 6.524777069483526e-07, "epoch": 0.7764102852958572, "percentage": 77.65, "elapsed_time": "10:25:48", "remaining_time": "3:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3447, "total_steps": 4438, "loss": 0.1443, "learning_rate": 6.512231931416674e-07, "epoch": 0.7766355929816656, "percentage": 77.67, "elapsed_time": "10:25:58", "remaining_time": "2:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3448, "total_steps": 4438, "loss": 0.1261, "learning_rate": 6.499697058918326e-07, "epoch": 0.776860900667474, "percentage": 77.69, "elapsed_time": "10:26:11", "remaining_time": "2:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3449, "total_steps": 4438, "loss": 0.1321, "learning_rate": 6.487172458948612e-07, "epoch": 0.7770862083532825, "percentage": 77.72, "elapsed_time": "10:26:21", "remaining_time": "2:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 4438, "loss": 0.1394, "learning_rate": 6.474658138461992e-07, "epoch": 0.7773115160390909, "percentage": 77.74, "elapsed_time": "10:26:32", "remaining_time": "2:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3451, "total_steps": 4438, "loss": 0.1341, "learning_rate": 6.462154104407187e-07, "epoch": 0.7775368237248993, "percentage": 77.76, "elapsed_time": "10:26:43", "remaining_time": "2:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3452, "total_steps": 4438, "loss": 0.1125, "learning_rate": 6.449660363727236e-07, "epoch": 0.7777621314107077, "percentage": 77.78, "elapsed_time": "10:26:53", "remaining_time": "2:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3453, "total_steps": 4438, "loss": 0.1264, "learning_rate": 6.437176923359434e-07, "epoch": 0.7779874390965161, "percentage": 77.81, "elapsed_time": "10:27:04", "remaining_time": "2:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3454, "total_steps": 4438, "loss": 0.1316, "learning_rate": 6.424703790235374e-07, "epoch": 0.7782127467823247, "percentage": 77.83, "elapsed_time": "10:27:13", "remaining_time": "2:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3455, "total_steps": 4438, "loss": 0.1358, "learning_rate": 6.41224097128093e-07, "epoch": 0.7784380544681331, "percentage": 77.85, "elapsed_time": "10:27:24", "remaining_time": "2:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3456, "total_steps": 4438, "loss": 0.1431, "learning_rate": 6.399788473416229e-07, "epoch": 0.7786633621539415, "percentage": 77.87, "elapsed_time": "10:27:35", "remaining_time": "2:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3457, "total_steps": 4438, "loss": 0.132, "learning_rate": 6.387346303555691e-07, "epoch": 0.7788886698397499, "percentage": 77.9, "elapsed_time": "10:27:46", "remaining_time": "2:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3458, "total_steps": 4438, "loss": 0.1367, "learning_rate": 6.374914468607976e-07, "epoch": 0.7791139775255583, "percentage": 77.92, "elapsed_time": "10:27:55", "remaining_time": "2:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3459, "total_steps": 4438, "loss": 0.1401, "learning_rate": 6.362492975476033e-07, "epoch": 0.7793392852113668, "percentage": 77.94, "elapsed_time": "10:28:06", "remaining_time": "2:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 4438, "loss": 0.1342, "learning_rate": 6.35008183105704e-07, "epoch": 0.7795645928971752, "percentage": 77.96, "elapsed_time": "10:28:16", "remaining_time": "2:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3461, "total_steps": 4438, "loss": 0.1225, "learning_rate": 6.337681042242447e-07, "epoch": 0.7797899005829836, "percentage": 77.99, "elapsed_time": "10:28:28", "remaining_time": "2:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3462, "total_steps": 4438, "loss": 0.126, "learning_rate": 6.325290615917961e-07, "epoch": 0.7800152082687921, "percentage": 78.01, "elapsed_time": "10:28:38", "remaining_time": "2:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3463, "total_steps": 4438, "loss": 0.1416, "learning_rate": 6.312910558963505e-07, "epoch": 0.7802405159546005, "percentage": 78.03, "elapsed_time": "10:28:50", "remaining_time": "2:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3464, "total_steps": 4438, "loss": 0.1395, "learning_rate": 6.300540878253286e-07, "epoch": 0.780465823640409, "percentage": 78.05, "elapsed_time": "10:29:00", "remaining_time": "2:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3465, "total_steps": 4438, "loss": 0.1256, "learning_rate": 6.288181580655709e-07, "epoch": 0.7806911313262174, "percentage": 78.08, "elapsed_time": "10:29:10", "remaining_time": "2:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3466, "total_steps": 4438, "loss": 0.1241, "learning_rate": 6.27583267303343e-07, "epoch": 0.7809164390120258, "percentage": 78.1, "elapsed_time": "10:29:20", "remaining_time": "2:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3467, "total_steps": 4438, "loss": 0.1368, "learning_rate": 6.263494162243352e-07, "epoch": 0.7811417466978342, "percentage": 78.12, "elapsed_time": "10:29:31", "remaining_time": "2:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3468, "total_steps": 4438, "loss": 0.1417, "learning_rate": 6.251166055136573e-07, "epoch": 0.7813670543836426, "percentage": 78.14, "elapsed_time": "10:29:41", "remaining_time": "2:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3469, "total_steps": 4438, "loss": 0.119, "learning_rate": 6.238848358558439e-07, "epoch": 0.781592362069451, "percentage": 78.17, "elapsed_time": "10:29:51", "remaining_time": "2:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 4438, "loss": 0.1305, "learning_rate": 6.226541079348517e-07, "epoch": 0.7818176697552596, "percentage": 78.19, "elapsed_time": "10:30:02", "remaining_time": "2:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3471, "total_steps": 4438, "loss": 0.1238, "learning_rate": 6.214244224340563e-07, "epoch": 0.782042977441068, "percentage": 78.21, "elapsed_time": "10:30:11", "remaining_time": "2:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3472, "total_steps": 4438, "loss": 0.123, "learning_rate": 6.201957800362579e-07, "epoch": 0.7822682851268764, "percentage": 78.23, "elapsed_time": "10:30:22", "remaining_time": "2:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3473, "total_steps": 4438, "loss": 0.1287, "learning_rate": 6.189681814236742e-07, "epoch": 0.7824935928126848, "percentage": 78.26, "elapsed_time": "10:30:35", "remaining_time": "2:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3474, "total_steps": 4438, "loss": 0.135, "learning_rate": 6.177416272779468e-07, "epoch": 0.7827189004984932, "percentage": 78.28, "elapsed_time": "10:30:45", "remaining_time": "2:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3475, "total_steps": 4438, "loss": 0.1203, "learning_rate": 6.165161182801336e-07, "epoch": 0.7829442081843017, "percentage": 78.3, "elapsed_time": "10:30:55", "remaining_time": "2:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3476, "total_steps": 4438, "loss": 0.132, "learning_rate": 6.152916551107149e-07, "epoch": 0.7831695158701101, "percentage": 78.32, "elapsed_time": "10:31:06", "remaining_time": "2:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3477, "total_steps": 4438, "loss": 0.1293, "learning_rate": 6.140682384495902e-07, "epoch": 0.7833948235559185, "percentage": 78.35, "elapsed_time": "10:31:16", "remaining_time": "2:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3478, "total_steps": 4438, "loss": 0.1346, "learning_rate": 6.12845868976076e-07, "epoch": 0.783620131241727, "percentage": 78.37, "elapsed_time": "10:31:27", "remaining_time": "2:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3479, "total_steps": 4438, "loss": 0.1285, "learning_rate": 6.116245473689094e-07, "epoch": 0.7838454389275354, "percentage": 78.39, "elapsed_time": "10:31:38", "remaining_time": "2:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 4438, "loss": 0.1423, "learning_rate": 6.104042743062439e-07, "epoch": 0.7840707466133439, "percentage": 78.41, "elapsed_time": "10:31:49", "remaining_time": "2:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3481, "total_steps": 4438, "loss": 0.1295, "learning_rate": 6.091850504656527e-07, "epoch": 0.7842960542991523, "percentage": 78.44, "elapsed_time": "10:32:00", "remaining_time": "2:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3482, "total_steps": 4438, "loss": 0.115, "learning_rate": 6.079668765241248e-07, "epoch": 0.7845213619849607, "percentage": 78.46, "elapsed_time": "10:32:11", "remaining_time": "2:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3483, "total_steps": 4438, "loss": 0.1369, "learning_rate": 6.06749753158066e-07, "epoch": 0.7847466696707691, "percentage": 78.48, "elapsed_time": "10:32:21", "remaining_time": "2:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3484, "total_steps": 4438, "loss": 0.133, "learning_rate": 6.05533681043301e-07, "epoch": 0.7849719773565775, "percentage": 78.5, "elapsed_time": "10:32:32", "remaining_time": "2:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3485, "total_steps": 4438, "loss": 0.1186, "learning_rate": 6.04318660855068e-07, "epoch": 0.7851972850423861, "percentage": 78.53, "elapsed_time": "10:32:43", "remaining_time": "2:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3486, "total_steps": 4438, "loss": 0.1286, "learning_rate": 6.031046932680229e-07, "epoch": 0.7854225927281945, "percentage": 78.55, "elapsed_time": "10:32:53", "remaining_time": "2:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3487, "total_steps": 4438, "loss": 0.1439, "learning_rate": 6.018917789562372e-07, "epoch": 0.7856479004140029, "percentage": 78.57, "elapsed_time": "10:33:04", "remaining_time": "2:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3488, "total_steps": 4438, "loss": 0.1231, "learning_rate": 6.006799185931964e-07, "epoch": 0.7858732080998113, "percentage": 78.59, "elapsed_time": "10:33:13", "remaining_time": "2:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3489, "total_steps": 4438, "loss": 0.1293, "learning_rate": 5.994691128518019e-07, "epoch": 0.7860985157856197, "percentage": 78.62, "elapsed_time": "10:33:25", "remaining_time": "2:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 4438, "loss": 0.1389, "learning_rate": 5.982593624043682e-07, "epoch": 0.7863238234714282, "percentage": 78.64, "elapsed_time": "10:33:35", "remaining_time": "2:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3491, "total_steps": 4438, "loss": 0.1343, "learning_rate": 5.970506679226249e-07, "epoch": 0.7865491311572366, "percentage": 78.66, "elapsed_time": "10:33:45", "remaining_time": "2:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3492, "total_steps": 4438, "loss": 0.1329, "learning_rate": 5.958430300777157e-07, "epoch": 0.786774438843045, "percentage": 78.68, "elapsed_time": "10:33:57", "remaining_time": "2:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3493, "total_steps": 4438, "loss": 0.1337, "learning_rate": 5.94636449540196e-07, "epoch": 0.7869997465288535, "percentage": 78.71, "elapsed_time": "10:34:06", "remaining_time": "2:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3494, "total_steps": 4438, "loss": 0.1371, "learning_rate": 5.934309269800359e-07, "epoch": 0.7872250542146619, "percentage": 78.73, "elapsed_time": "10:34:16", "remaining_time": "2:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3495, "total_steps": 4438, "loss": 0.1246, "learning_rate": 5.922264630666161e-07, "epoch": 0.7874503619004704, "percentage": 78.75, "elapsed_time": "10:34:27", "remaining_time": "2:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3496, "total_steps": 4438, "loss": 0.131, "learning_rate": 5.910230584687316e-07, "epoch": 0.7876756695862788, "percentage": 78.77, "elapsed_time": "10:34:38", "remaining_time": "2:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3497, "total_steps": 4438, "loss": 0.1279, "learning_rate": 5.898207138545867e-07, "epoch": 0.7879009772720872, "percentage": 78.8, "elapsed_time": "10:34:49", "remaining_time": "2:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3498, "total_steps": 4438, "loss": 0.1344, "learning_rate": 5.886194298917994e-07, "epoch": 0.7881262849578956, "percentage": 78.82, "elapsed_time": "10:35:00", "remaining_time": "2:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3499, "total_steps": 4438, "loss": 0.134, "learning_rate": 5.874192072473995e-07, "epoch": 0.788351592643704, "percentage": 78.84, "elapsed_time": "10:35:09", "remaining_time": "2:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 4438, "loss": 0.1347, "learning_rate": 5.862200465878228e-07, "epoch": 0.7885769003295124, "percentage": 78.86, "elapsed_time": "10:35:19", "remaining_time": "2:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 4438, "eval_loss": 0.12961439788341522, "epoch": 0.7885769003295124, "percentage": 78.86, "elapsed_time": "10:37:22", "remaining_time": "2:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3501, "total_steps": 4438, "loss": 0.139, "learning_rate": 5.850219485789199e-07, "epoch": 0.788802208015321, "percentage": 78.89, "elapsed_time": "10:37:32", "remaining_time": "2:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3502, "total_steps": 4438, "loss": 0.1292, "learning_rate": 5.838249138859509e-07, "epoch": 0.7890275157011294, "percentage": 78.91, "elapsed_time": "10:37:44", "remaining_time": "2:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3503, "total_steps": 4438, "loss": 0.1318, "learning_rate": 5.826289431735832e-07, "epoch": 0.7892528233869378, "percentage": 78.93, "elapsed_time": "10:37:55", "remaining_time": "2:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3504, "total_steps": 4438, "loss": 0.1206, "learning_rate": 5.814340371058957e-07, "epoch": 0.7894781310727462, "percentage": 78.95, "elapsed_time": "10:38:06", "remaining_time": "2:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3505, "total_steps": 4438, "loss": 0.1255, "learning_rate": 5.802401963463741e-07, "epoch": 0.7897034387585546, "percentage": 78.98, "elapsed_time": "10:38:18", "remaining_time": "2:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3506, "total_steps": 4438, "loss": 0.1438, "learning_rate": 5.79047421557915e-07, "epoch": 0.7899287464443631, "percentage": 79.0, "elapsed_time": "10:38:30", "remaining_time": "2:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3507, "total_steps": 4438, "loss": 0.1264, "learning_rate": 5.778557134028207e-07, "epoch": 0.7901540541301715, "percentage": 79.02, "elapsed_time": "10:38:41", "remaining_time": "2:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3508, "total_steps": 4438, "loss": 0.1272, "learning_rate": 5.766650725428027e-07, "epoch": 0.7903793618159799, "percentage": 79.04, "elapsed_time": "10:38:51", "remaining_time": "2:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3509, "total_steps": 4438, "loss": 0.1118, "learning_rate": 5.754754996389799e-07, "epoch": 0.7906046695017884, "percentage": 79.07, "elapsed_time": "10:39:02", "remaining_time": "2:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 4438, "loss": 0.1451, "learning_rate": 5.742869953518773e-07, "epoch": 0.7908299771875968, "percentage": 79.09, "elapsed_time": "10:39:12", "remaining_time": "2:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3511, "total_steps": 4438, "loss": 0.1249, "learning_rate": 5.730995603414274e-07, "epoch": 0.7910552848734053, "percentage": 79.11, "elapsed_time": "10:39:23", "remaining_time": "2:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3512, "total_steps": 4438, "loss": 0.1413, "learning_rate": 5.719131952669679e-07, "epoch": 0.7912805925592137, "percentage": 79.13, "elapsed_time": "10:39:35", "remaining_time": "2:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3513, "total_steps": 4438, "loss": 0.13, "learning_rate": 5.707279007872435e-07, "epoch": 0.7915059002450221, "percentage": 79.16, "elapsed_time": "10:39:45", "remaining_time": "2:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3514, "total_steps": 4438, "loss": 0.125, "learning_rate": 5.695436775604049e-07, "epoch": 0.7917312079308305, "percentage": 79.18, "elapsed_time": "10:39:56", "remaining_time": "2:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3515, "total_steps": 4438, "loss": 0.1333, "learning_rate": 5.683605262440056e-07, "epoch": 0.7919565156166389, "percentage": 79.2, "elapsed_time": "10:40:06", "remaining_time": "2:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3516, "total_steps": 4438, "loss": 0.1161, "learning_rate": 5.671784474950068e-07, "epoch": 0.7921818233024474, "percentage": 79.22, "elapsed_time": "10:40:16", "remaining_time": "2:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3517, "total_steps": 4438, "loss": 0.1351, "learning_rate": 5.659974419697723e-07, "epoch": 0.7924071309882559, "percentage": 79.25, "elapsed_time": "10:40:27", "remaining_time": "2:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3518, "total_steps": 4438, "loss": 0.1271, "learning_rate": 5.648175103240694e-07, "epoch": 0.7926324386740643, "percentage": 79.27, "elapsed_time": "10:40:37", "remaining_time": "2:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3519, "total_steps": 4438, "loss": 0.1437, "learning_rate": 5.636386532130717e-07, "epoch": 0.7928577463598727, "percentage": 79.29, "elapsed_time": "10:40:48", "remaining_time": "2:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 4438, "loss": 0.1253, "learning_rate": 5.624608712913531e-07, "epoch": 0.7930830540456811, "percentage": 79.32, "elapsed_time": "10:41:00", "remaining_time": "2:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3521, "total_steps": 4438, "loss": 0.1398, "learning_rate": 5.612841652128939e-07, "epoch": 0.7933083617314896, "percentage": 79.34, "elapsed_time": "10:41:10", "remaining_time": "2:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3522, "total_steps": 4438, "loss": 0.1151, "learning_rate": 5.601085356310734e-07, "epoch": 0.793533669417298, "percentage": 79.36, "elapsed_time": "10:41:20", "remaining_time": "2:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3523, "total_steps": 4438, "loss": 0.1405, "learning_rate": 5.589339831986754e-07, "epoch": 0.7937589771031064, "percentage": 79.38, "elapsed_time": "10:41:30", "remaining_time": "2:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3524, "total_steps": 4438, "loss": 0.1379, "learning_rate": 5.577605085678858e-07, "epoch": 0.7939842847889148, "percentage": 79.41, "elapsed_time": "10:41:41", "remaining_time": "2:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3525, "total_steps": 4438, "loss": 0.1229, "learning_rate": 5.565881123902903e-07, "epoch": 0.7942095924747233, "percentage": 79.43, "elapsed_time": "10:41:52", "remaining_time": "2:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3526, "total_steps": 4438, "loss": 0.1316, "learning_rate": 5.554167953168779e-07, "epoch": 0.7944349001605318, "percentage": 79.45, "elapsed_time": "10:42:02", "remaining_time": "2:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3527, "total_steps": 4438, "loss": 0.1365, "learning_rate": 5.542465579980361e-07, "epoch": 0.7946602078463402, "percentage": 79.47, "elapsed_time": "10:42:12", "remaining_time": "2:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3528, "total_steps": 4438, "loss": 0.1392, "learning_rate": 5.530774010835552e-07, "epoch": 0.7948855155321486, "percentage": 79.5, "elapsed_time": "10:42:22", "remaining_time": "2:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3529, "total_steps": 4438, "loss": 0.1215, "learning_rate": 5.519093252226232e-07, "epoch": 0.795110823217957, "percentage": 79.52, "elapsed_time": "10:42:33", "remaining_time": "2:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 4438, "loss": 0.1269, "learning_rate": 5.507423310638299e-07, "epoch": 0.7953361309037654, "percentage": 79.54, "elapsed_time": "10:42:43", "remaining_time": "2:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3531, "total_steps": 4438, "loss": 0.1275, "learning_rate": 5.495764192551642e-07, "epoch": 0.7955614385895738, "percentage": 79.56, "elapsed_time": "10:42:52", "remaining_time": "2:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3532, "total_steps": 4438, "loss": 0.1353, "learning_rate": 5.48411590444012e-07, "epoch": 0.7957867462753824, "percentage": 79.59, "elapsed_time": "10:43:03", "remaining_time": "2:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3533, "total_steps": 4438, "loss": 0.1343, "learning_rate": 5.47247845277161e-07, "epoch": 0.7960120539611908, "percentage": 79.61, "elapsed_time": "10:43:14", "remaining_time": "2:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3534, "total_steps": 4438, "loss": 0.1404, "learning_rate": 5.460851844007945e-07, "epoch": 0.7962373616469992, "percentage": 79.63, "elapsed_time": "10:43:25", "remaining_time": "2:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3535, "total_steps": 4438, "loss": 0.1078, "learning_rate": 5.449236084604942e-07, "epoch": 0.7964626693328076, "percentage": 79.65, "elapsed_time": "10:43:36", "remaining_time": "2:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3536, "total_steps": 4438, "loss": 0.1314, "learning_rate": 5.437631181012415e-07, "epoch": 0.796687977018616, "percentage": 79.68, "elapsed_time": "10:43:46", "remaining_time": "2:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3537, "total_steps": 4438, "loss": 0.1204, "learning_rate": 5.426037139674117e-07, "epoch": 0.7969132847044245, "percentage": 79.7, "elapsed_time": "10:43:57", "remaining_time": "2:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3538, "total_steps": 4438, "loss": 0.1347, "learning_rate": 5.414453967027797e-07, "epoch": 0.7971385923902329, "percentage": 79.72, "elapsed_time": "10:44:08", "remaining_time": "2:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3539, "total_steps": 4438, "loss": 0.1434, "learning_rate": 5.402881669505164e-07, "epoch": 0.7973639000760413, "percentage": 79.74, "elapsed_time": "10:44:20", "remaining_time": "2:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 4438, "loss": 0.1254, "learning_rate": 5.391320253531868e-07, "epoch": 0.7975892077618498, "percentage": 79.77, "elapsed_time": "10:44:30", "remaining_time": "2:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3541, "total_steps": 4438, "loss": 0.1313, "learning_rate": 5.37976972552755e-07, "epoch": 0.7978145154476582, "percentage": 79.79, "elapsed_time": "10:44:40", "remaining_time": "2:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3542, "total_steps": 4438, "loss": 0.1206, "learning_rate": 5.368230091905774e-07, "epoch": 0.7980398231334667, "percentage": 79.81, "elapsed_time": "10:44:51", "remaining_time": "2:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3543, "total_steps": 4438, "loss": 0.1258, "learning_rate": 5.356701359074076e-07, "epoch": 0.7982651308192751, "percentage": 79.83, "elapsed_time": "10:45:03", "remaining_time": "2:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3544, "total_steps": 4438, "loss": 0.1241, "learning_rate": 5.345183533433926e-07, "epoch": 0.7984904385050835, "percentage": 79.86, "elapsed_time": "10:45:13", "remaining_time": "2:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3545, "total_steps": 4438, "loss": 0.1192, "learning_rate": 5.333676621380746e-07, "epoch": 0.7987157461908919, "percentage": 79.88, "elapsed_time": "10:45:23", "remaining_time": "2:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3546, "total_steps": 4438, "loss": 0.1172, "learning_rate": 5.322180629303902e-07, "epoch": 0.7989410538767003, "percentage": 79.9, "elapsed_time": "10:45:33", "remaining_time": "2:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3547, "total_steps": 4438, "loss": 0.1185, "learning_rate": 5.310695563586676e-07, "epoch": 0.7991663615625088, "percentage": 79.92, "elapsed_time": "10:45:44", "remaining_time": "2:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3548, "total_steps": 4438, "loss": 0.137, "learning_rate": 5.299221430606313e-07, "epoch": 0.7993916692483173, "percentage": 79.95, "elapsed_time": "10:45:54", "remaining_time": "2:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3549, "total_steps": 4438, "loss": 0.1322, "learning_rate": 5.287758236733956e-07, "epoch": 0.7996169769341257, "percentage": 79.97, "elapsed_time": "10:46:05", "remaining_time": "2:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 4438, "loss": 0.113, "learning_rate": 5.276305988334701e-07, "epoch": 0.7998422846199341, "percentage": 79.99, "elapsed_time": "10:46:14", "remaining_time": "2:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3551, "total_steps": 4438, "loss": 0.1178, "learning_rate": 5.264864691767551e-07, "epoch": 0.8000675923057425, "percentage": 80.01, "elapsed_time": "10:46:25", "remaining_time": "2:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3552, "total_steps": 4438, "loss": 0.1305, "learning_rate": 5.253434353385422e-07, "epoch": 0.800292899991551, "percentage": 80.04, "elapsed_time": "10:46:35", "remaining_time": "2:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3553, "total_steps": 4438, "loss": 0.1271, "learning_rate": 5.242014979535173e-07, "epoch": 0.8005182076773594, "percentage": 80.06, "elapsed_time": "10:46:45", "remaining_time": "2:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3554, "total_steps": 4438, "loss": 0.1168, "learning_rate": 5.23060657655754e-07, "epoch": 0.8007435153631678, "percentage": 80.08, "elapsed_time": "10:46:55", "remaining_time": "2:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3555, "total_steps": 4438, "loss": 0.1203, "learning_rate": 5.219209150787189e-07, "epoch": 0.8009688230489762, "percentage": 80.1, "elapsed_time": "10:47:07", "remaining_time": "2:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3556, "total_steps": 4438, "loss": 0.1233, "learning_rate": 5.207822708552695e-07, "epoch": 0.8011941307347847, "percentage": 80.13, "elapsed_time": "10:47:18", "remaining_time": "2:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3557, "total_steps": 4438, "loss": 0.1254, "learning_rate": 5.196447256176509e-07, "epoch": 0.8014194384205932, "percentage": 80.15, "elapsed_time": "10:47:28", "remaining_time": "2:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3558, "total_steps": 4438, "loss": 0.1233, "learning_rate": 5.185082799975013e-07, "epoch": 0.8016447461064016, "percentage": 80.17, "elapsed_time": "10:47:39", "remaining_time": "2:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3559, "total_steps": 4438, "loss": 0.1293, "learning_rate": 5.173729346258452e-07, "epoch": 0.80187005379221, "percentage": 80.19, "elapsed_time": "10:47:48", "remaining_time": "2:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 4438, "loss": 0.1319, "learning_rate": 5.162386901330977e-07, "epoch": 0.8020953614780184, "percentage": 80.22, "elapsed_time": "10:48:00", "remaining_time": "2:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3561, "total_steps": 4438, "loss": 0.1274, "learning_rate": 5.151055471490638e-07, "epoch": 0.8023206691638268, "percentage": 80.24, "elapsed_time": "10:48:11", "remaining_time": "2:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3562, "total_steps": 4438, "loss": 0.1194, "learning_rate": 5.139735063029338e-07, "epoch": 0.8025459768496352, "percentage": 80.26, "elapsed_time": "10:48:21", "remaining_time": "2:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3563, "total_steps": 4438, "loss": 0.1286, "learning_rate": 5.128425682232893e-07, "epoch": 0.8027712845354437, "percentage": 80.28, "elapsed_time": "10:48:32", "remaining_time": "2:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3564, "total_steps": 4438, "loss": 0.1292, "learning_rate": 5.117127335380967e-07, "epoch": 0.8029965922212522, "percentage": 80.31, "elapsed_time": "10:48:42", "remaining_time": "2:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3565, "total_steps": 4438, "loss": 0.1223, "learning_rate": 5.105840028747125e-07, "epoch": 0.8032218999070606, "percentage": 80.33, "elapsed_time": "10:48:53", "remaining_time": "2:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3566, "total_steps": 4438, "loss": 0.1099, "learning_rate": 5.094563768598773e-07, "epoch": 0.803447207592869, "percentage": 80.35, "elapsed_time": "10:49:03", "remaining_time": "2:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3567, "total_steps": 4438, "loss": 0.1267, "learning_rate": 5.083298561197205e-07, "epoch": 0.8036725152786774, "percentage": 80.37, "elapsed_time": "10:49:14", "remaining_time": "2:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3568, "total_steps": 4438, "loss": 0.1197, "learning_rate": 5.07204441279758e-07, "epoch": 0.8038978229644859, "percentage": 80.4, "elapsed_time": "10:49:23", "remaining_time": "2:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3569, "total_steps": 4438, "loss": 0.1187, "learning_rate": 5.060801329648896e-07, "epoch": 0.8041231306502943, "percentage": 80.42, "elapsed_time": "10:49:34", "remaining_time": "2:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 4438, "loss": 0.1287, "learning_rate": 5.049569317994013e-07, "epoch": 0.8043484383361027, "percentage": 80.44, "elapsed_time": "10:49:44", "remaining_time": "2:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3571, "total_steps": 4438, "loss": 0.1292, "learning_rate": 5.038348384069663e-07, "epoch": 0.8045737460219111, "percentage": 80.46, "elapsed_time": "10:49:55", "remaining_time": "2:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3572, "total_steps": 4438, "loss": 0.1188, "learning_rate": 5.027138534106399e-07, "epoch": 0.8047990537077196, "percentage": 80.49, "elapsed_time": "10:50:04", "remaining_time": "2:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3573, "total_steps": 4438, "loss": 0.1223, "learning_rate": 5.015939774328643e-07, "epoch": 0.8050243613935281, "percentage": 80.51, "elapsed_time": "10:50:16", "remaining_time": "2:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3574, "total_steps": 4438, "loss": 0.1282, "learning_rate": 5.004752110954642e-07, "epoch": 0.8052496690793365, "percentage": 80.53, "elapsed_time": "10:50:26", "remaining_time": "2:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3575, "total_steps": 4438, "loss": 0.1254, "learning_rate": 4.993575550196495e-07, "epoch": 0.8054749767651449, "percentage": 80.55, "elapsed_time": "10:50:37", "remaining_time": "2:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3576, "total_steps": 4438, "loss": 0.1435, "learning_rate": 4.982410098260118e-07, "epoch": 0.8057002844509533, "percentage": 80.58, "elapsed_time": "10:50:48", "remaining_time": "2:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3577, "total_steps": 4438, "loss": 0.1303, "learning_rate": 4.971255761345278e-07, "epoch": 0.8059255921367617, "percentage": 80.6, "elapsed_time": "10:50:59", "remaining_time": "2:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3578, "total_steps": 4438, "loss": 0.136, "learning_rate": 4.96011254564557e-07, "epoch": 0.8061508998225702, "percentage": 80.62, "elapsed_time": "10:51:09", "remaining_time": "2:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3579, "total_steps": 4438, "loss": 0.1331, "learning_rate": 4.948980457348393e-07, "epoch": 0.8063762075083787, "percentage": 80.64, "elapsed_time": "10:51:19", "remaining_time": "2:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 4438, "loss": 0.1326, "learning_rate": 4.937859502634992e-07, "epoch": 0.8066015151941871, "percentage": 80.67, "elapsed_time": "10:51:31", "remaining_time": "2:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3581, "total_steps": 4438, "loss": 0.1342, "learning_rate": 4.926749687680407e-07, "epoch": 0.8068268228799955, "percentage": 80.69, "elapsed_time": "10:51:42", "remaining_time": "2:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3582, "total_steps": 4438, "loss": 0.1347, "learning_rate": 4.915651018653511e-07, "epoch": 0.8070521305658039, "percentage": 80.71, "elapsed_time": "10:51:53", "remaining_time": "2:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3583, "total_steps": 4438, "loss": 0.1267, "learning_rate": 4.904563501716986e-07, "epoch": 0.8072774382516124, "percentage": 80.73, "elapsed_time": "10:52:05", "remaining_time": "2:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3584, "total_steps": 4438, "loss": 0.14, "learning_rate": 4.893487143027307e-07, "epoch": 0.8075027459374208, "percentage": 80.76, "elapsed_time": "10:52:16", "remaining_time": "2:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3585, "total_steps": 4438, "loss": 0.1241, "learning_rate": 4.88242194873477e-07, "epoch": 0.8077280536232292, "percentage": 80.78, "elapsed_time": "10:52:26", "remaining_time": "2:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3586, "total_steps": 4438, "loss": 0.1129, "learning_rate": 4.871367924983458e-07, "epoch": 0.8079533613090376, "percentage": 80.8, "elapsed_time": "10:52:37", "remaining_time": "2:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3587, "total_steps": 4438, "loss": 0.1171, "learning_rate": 4.860325077911271e-07, "epoch": 0.8081786689948461, "percentage": 80.82, "elapsed_time": "10:52:48", "remaining_time": "2:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3588, "total_steps": 4438, "loss": 0.129, "learning_rate": 4.84929341364988e-07, "epoch": 0.8084039766806546, "percentage": 80.85, "elapsed_time": "10:52:59", "remaining_time": "2:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3589, "total_steps": 4438, "loss": 0.1243, "learning_rate": 4.838272938324753e-07, "epoch": 0.808629284366463, "percentage": 80.87, "elapsed_time": "10:53:10", "remaining_time": "2:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 4438, "loss": 0.1209, "learning_rate": 4.827263658055161e-07, "epoch": 0.8088545920522714, "percentage": 80.89, "elapsed_time": "10:53:21", "remaining_time": "2:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3591, "total_steps": 4438, "loss": 0.1156, "learning_rate": 4.816265578954135e-07, "epoch": 0.8090798997380798, "percentage": 80.91, "elapsed_time": "10:53:33", "remaining_time": "2:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3592, "total_steps": 4438, "loss": 0.1302, "learning_rate": 4.805278707128505e-07, "epoch": 0.8093052074238882, "percentage": 80.94, "elapsed_time": "10:53:44", "remaining_time": "2:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3593, "total_steps": 4438, "loss": 0.125, "learning_rate": 4.794303048678878e-07, "epoch": 0.8095305151096966, "percentage": 80.96, "elapsed_time": "10:53:54", "remaining_time": "2:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3594, "total_steps": 4438, "loss": 0.1267, "learning_rate": 4.783338609699614e-07, "epoch": 0.8097558227955051, "percentage": 80.98, "elapsed_time": "10:54:05", "remaining_time": "2:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3595, "total_steps": 4438, "loss": 0.1278, "learning_rate": 4.772385396278872e-07, "epoch": 0.8099811304813136, "percentage": 81.0, "elapsed_time": "10:54:16", "remaining_time": "2:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3596, "total_steps": 4438, "loss": 0.1324, "learning_rate": 4.7614434144985486e-07, "epoch": 0.810206438167122, "percentage": 81.03, "elapsed_time": "10:54:27", "remaining_time": "2:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3597, "total_steps": 4438, "loss": 0.1276, "learning_rate": 4.750512670434332e-07, "epoch": 0.8104317458529304, "percentage": 81.05, "elapsed_time": "10:54:36", "remaining_time": "2:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3598, "total_steps": 4438, "loss": 0.127, "learning_rate": 4.73959317015564e-07, "epoch": 0.8106570535387388, "percentage": 81.07, "elapsed_time": "10:54:47", "remaining_time": "2:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3599, "total_steps": 4438, "loss": 0.1253, "learning_rate": 4.728684919725679e-07, "epoch": 0.8108823612245473, "percentage": 81.1, "elapsed_time": "10:54:57", "remaining_time": "2:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 4438, "loss": 0.126, "learning_rate": 4.7177879252013945e-07, "epoch": 0.8111076689103557, "percentage": 81.12, "elapsed_time": "10:55:08", "remaining_time": "2:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3601, "total_steps": 4438, "loss": 0.1283, "learning_rate": 4.70690219263347e-07, "epoch": 0.8113329765961641, "percentage": 81.14, "elapsed_time": "10:55:18", "remaining_time": "2:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3602, "total_steps": 4438, "loss": 0.1346, "learning_rate": 4.6960277280663574e-07, "epoch": 0.8115582842819725, "percentage": 81.16, "elapsed_time": "10:55:29", "remaining_time": "2:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3603, "total_steps": 4438, "loss": 0.1218, "learning_rate": 4.685164537538234e-07, "epoch": 0.811783591967781, "percentage": 81.19, "elapsed_time": "10:55:40", "remaining_time": "2:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3604, "total_steps": 4438, "loss": 0.1301, "learning_rate": 4.674312627081032e-07, "epoch": 0.8120088996535895, "percentage": 81.21, "elapsed_time": "10:55:51", "remaining_time": "2:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3605, "total_steps": 4438, "loss": 0.1296, "learning_rate": 4.6634720027204093e-07, "epoch": 0.8122342073393979, "percentage": 81.23, "elapsed_time": "10:56:02", "remaining_time": "2:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3606, "total_steps": 4438, "loss": 0.1218, "learning_rate": 4.6526426704757545e-07, "epoch": 0.8124595150252063, "percentage": 81.25, "elapsed_time": "10:56:13", "remaining_time": "2:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3607, "total_steps": 4438, "loss": 0.1214, "learning_rate": 4.641824636360195e-07, "epoch": 0.8126848227110147, "percentage": 81.28, "elapsed_time": "10:56:25", "remaining_time": "2:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3608, "total_steps": 4438, "loss": 0.1293, "learning_rate": 4.6310179063805916e-07, "epoch": 0.8129101303968231, "percentage": 81.3, "elapsed_time": "10:56:36", "remaining_time": "2:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3609, "total_steps": 4438, "loss": 0.1196, "learning_rate": 4.620222486537507e-07, "epoch": 0.8131354380826316, "percentage": 81.32, "elapsed_time": "10:56:47", "remaining_time": "2:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 4438, "loss": 0.1252, "learning_rate": 4.609438382825246e-07, "epoch": 0.81336074576844, "percentage": 81.34, "elapsed_time": "10:56:58", "remaining_time": "2:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3611, "total_steps": 4438, "loss": 0.1311, "learning_rate": 4.598665601231805e-07, "epoch": 0.8135860534542485, "percentage": 81.37, "elapsed_time": "10:57:07", "remaining_time": "2:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3612, "total_steps": 4438, "loss": 0.1325, "learning_rate": 4.587904147738925e-07, "epoch": 0.8138113611400569, "percentage": 81.39, "elapsed_time": "10:57:19", "remaining_time": "2:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3613, "total_steps": 4438, "loss": 0.1389, "learning_rate": 4.577154028322023e-07, "epoch": 0.8140366688258653, "percentage": 81.41, "elapsed_time": "10:57:29", "remaining_time": "2:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3614, "total_steps": 4438, "loss": 0.1223, "learning_rate": 4.566415248950251e-07, "epoch": 0.8142619765116738, "percentage": 81.43, "elapsed_time": "10:57:39", "remaining_time": "2:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3615, "total_steps": 4438, "loss": 0.122, "learning_rate": 4.555687815586454e-07, "epoch": 0.8144872841974822, "percentage": 81.46, "elapsed_time": "10:57:50", "remaining_time": "2:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3616, "total_steps": 4438, "loss": 0.1281, "learning_rate": 4.5449717341871646e-07, "epoch": 0.8147125918832906, "percentage": 81.48, "elapsed_time": "10:57:59", "remaining_time": "2:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3617, "total_steps": 4438, "loss": 0.1247, "learning_rate": 4.534267010702639e-07, "epoch": 0.814937899569099, "percentage": 81.5, "elapsed_time": "10:58:09", "remaining_time": "2:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3618, "total_steps": 4438, "loss": 0.1328, "learning_rate": 4.5235736510767957e-07, "epoch": 0.8151632072549074, "percentage": 81.52, "elapsed_time": "10:58:20", "remaining_time": "2:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3619, "total_steps": 4438, "loss": 0.1397, "learning_rate": 4.5128916612472735e-07, "epoch": 0.815388514940716, "percentage": 81.55, "elapsed_time": "10:58:31", "remaining_time": "2:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 4438, "loss": 0.1154, "learning_rate": 4.5022210471453664e-07, "epoch": 0.8156138226265244, "percentage": 81.57, "elapsed_time": "10:58:41", "remaining_time": "2:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3621, "total_steps": 4438, "loss": 0.1189, "learning_rate": 4.49156181469608e-07, "epoch": 0.8158391303123328, "percentage": 81.59, "elapsed_time": "10:58:52", "remaining_time": "2:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3622, "total_steps": 4438, "loss": 0.1271, "learning_rate": 4.480913969818099e-07, "epoch": 0.8160644379981412, "percentage": 81.61, "elapsed_time": "10:59:03", "remaining_time": "2:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3623, "total_steps": 4438, "loss": 0.1211, "learning_rate": 4.470277518423749e-07, "epoch": 0.8162897456839496, "percentage": 81.64, "elapsed_time": "10:59:12", "remaining_time": "2:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3624, "total_steps": 4438, "loss": 0.1223, "learning_rate": 4.4596524664190674e-07, "epoch": 0.816515053369758, "percentage": 81.66, "elapsed_time": "10:59:22", "remaining_time": "2:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3625, "total_steps": 4438, "loss": 0.1201, "learning_rate": 4.449038819703758e-07, "epoch": 0.8167403610555665, "percentage": 81.68, "elapsed_time": "10:59:32", "remaining_time": "2:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3626, "total_steps": 4438, "loss": 0.1341, "learning_rate": 4.4384365841711684e-07, "epoch": 0.816965668741375, "percentage": 81.7, "elapsed_time": "10:59:43", "remaining_time": "2:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3627, "total_steps": 4438, "loss": 0.1326, "learning_rate": 4.427845765708341e-07, "epoch": 0.8171909764271834, "percentage": 81.73, "elapsed_time": "10:59:54", "remaining_time": "2:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3628, "total_steps": 4438, "loss": 0.1493, "learning_rate": 4.417266370195944e-07, "epoch": 0.8174162841129918, "percentage": 81.75, "elapsed_time": "11:00:04", "remaining_time": "2:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3629, "total_steps": 4438, "loss": 0.1278, "learning_rate": 4.406698403508333e-07, "epoch": 0.8176415917988002, "percentage": 81.77, "elapsed_time": "11:00:15", "remaining_time": "2:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 4438, "loss": 0.1243, "learning_rate": 4.3961418715135097e-07, "epoch": 0.8178668994846087, "percentage": 81.79, "elapsed_time": "11:00:25", "remaining_time": "2:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3631, "total_steps": 4438, "loss": 0.1235, "learning_rate": 4.385596780073112e-07, "epoch": 0.8180922071704171, "percentage": 81.82, "elapsed_time": "11:00:37", "remaining_time": "2:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3632, "total_steps": 4438, "loss": 0.1203, "learning_rate": 4.3750631350424456e-07, "epoch": 0.8183175148562255, "percentage": 81.84, "elapsed_time": "11:00:49", "remaining_time": "2:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3633, "total_steps": 4438, "loss": 0.1191, "learning_rate": 4.36454094227044e-07, "epoch": 0.8185428225420339, "percentage": 81.86, "elapsed_time": "11:01:01", "remaining_time": "2:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3634, "total_steps": 4438, "loss": 0.1193, "learning_rate": 4.354030207599691e-07, "epoch": 0.8187681302278424, "percentage": 81.88, "elapsed_time": "11:01:12", "remaining_time": "2:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3635, "total_steps": 4438, "loss": 0.134, "learning_rate": 4.3435309368664024e-07, "epoch": 0.8189934379136509, "percentage": 81.91, "elapsed_time": "11:01:24", "remaining_time": "2:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3636, "total_steps": 4438, "loss": 0.1253, "learning_rate": 4.333043135900436e-07, "epoch": 0.8192187455994593, "percentage": 81.93, "elapsed_time": "11:01:35", "remaining_time": "2:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3637, "total_steps": 4438, "loss": 0.1211, "learning_rate": 4.3225668105252834e-07, "epoch": 0.8194440532852677, "percentage": 81.95, "elapsed_time": "11:01:47", "remaining_time": "2:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3638, "total_steps": 4438, "loss": 0.1188, "learning_rate": 4.312101966558044e-07, "epoch": 0.8196693609710761, "percentage": 81.97, "elapsed_time": "11:01:57", "remaining_time": "2:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3639, "total_steps": 4438, "loss": 0.1314, "learning_rate": 4.3016486098094667e-07, "epoch": 0.8198946686568845, "percentage": 82.0, "elapsed_time": "11:02:07", "remaining_time": "2:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 4438, "loss": 0.1226, "learning_rate": 4.2912067460839066e-07, "epoch": 0.820119976342693, "percentage": 82.02, "elapsed_time": "11:02:17", "remaining_time": "2:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3641, "total_steps": 4438, "loss": 0.1404, "learning_rate": 4.280776381179336e-07, "epoch": 0.8203452840285014, "percentage": 82.04, "elapsed_time": "11:02:28", "remaining_time": "2:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3642, "total_steps": 4438, "loss": 0.1231, "learning_rate": 4.2703575208873585e-07, "epoch": 0.8205705917143099, "percentage": 82.06, "elapsed_time": "11:02:38", "remaining_time": "2:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3643, "total_steps": 4438, "loss": 0.129, "learning_rate": 4.259950170993166e-07, "epoch": 0.8207958994001183, "percentage": 82.09, "elapsed_time": "11:02:50", "remaining_time": "2:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3644, "total_steps": 4438, "loss": 0.1299, "learning_rate": 4.2495543372755854e-07, "epoch": 0.8210212070859267, "percentage": 82.11, "elapsed_time": "11:03:00", "remaining_time": "2:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3645, "total_steps": 4438, "loss": 0.1255, "learning_rate": 4.239170025507025e-07, "epoch": 0.8212465147717352, "percentage": 82.13, "elapsed_time": "11:03:10", "remaining_time": "2:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3646, "total_steps": 4438, "loss": 0.1305, "learning_rate": 4.2287972414535084e-07, "epoch": 0.8214718224575436, "percentage": 82.15, "elapsed_time": "11:03:22", "remaining_time": "2:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3647, "total_steps": 4438, "loss": 0.1207, "learning_rate": 4.218435990874664e-07, "epoch": 0.821697130143352, "percentage": 82.18, "elapsed_time": "11:03:31", "remaining_time": "2:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3648, "total_steps": 4438, "loss": 0.1272, "learning_rate": 4.208086279523699e-07, "epoch": 0.8219224378291604, "percentage": 82.2, "elapsed_time": "11:03:43", "remaining_time": "2:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3649, "total_steps": 4438, "loss": 0.1387, "learning_rate": 4.197748113147429e-07, "epoch": 0.8221477455149688, "percentage": 82.22, "elapsed_time": "11:03:55", "remaining_time": "2:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 4438, "loss": 0.1351, "learning_rate": 4.1874214974862436e-07, "epoch": 0.8223730532007774, "percentage": 82.24, "elapsed_time": "11:04:06", "remaining_time": "2:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3651, "total_steps": 4438, "loss": 0.1299, "learning_rate": 4.177106438274131e-07, "epoch": 0.8225983608865858, "percentage": 82.27, "elapsed_time": "11:04:17", "remaining_time": "2:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3652, "total_steps": 4438, "loss": 0.1215, "learning_rate": 4.1668029412386677e-07, "epoch": 0.8228236685723942, "percentage": 82.29, "elapsed_time": "11:04:29", "remaining_time": "2:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3653, "total_steps": 4438, "loss": 0.1391, "learning_rate": 4.1565110121009886e-07, "epoch": 0.8230489762582026, "percentage": 82.31, "elapsed_time": "11:04:41", "remaining_time": "2:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3654, "total_steps": 4438, "loss": 0.144, "learning_rate": 4.146230656575831e-07, "epoch": 0.823274283944011, "percentage": 82.33, "elapsed_time": "11:04:51", "remaining_time": "2:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3655, "total_steps": 4438, "loss": 0.1421, "learning_rate": 4.1359618803714805e-07, "epoch": 0.8234995916298194, "percentage": 82.36, "elapsed_time": "11:05:03", "remaining_time": "2:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3656, "total_steps": 4438, "loss": 0.1533, "learning_rate": 4.125704689189819e-07, "epoch": 0.8237248993156279, "percentage": 82.38, "elapsed_time": "11:05:13", "remaining_time": "2:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3657, "total_steps": 4438, "loss": 0.138, "learning_rate": 4.115459088726273e-07, "epoch": 0.8239502070014363, "percentage": 82.4, "elapsed_time": "11:05:24", "remaining_time": "2:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3658, "total_steps": 4438, "loss": 0.1398, "learning_rate": 4.105225084669839e-07, "epoch": 0.8241755146872448, "percentage": 82.42, "elapsed_time": "11:05:36", "remaining_time": "2:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3659, "total_steps": 4438, "loss": 0.1302, "learning_rate": 4.095002682703092e-07, "epoch": 0.8244008223730532, "percentage": 82.45, "elapsed_time": "11:05:47", "remaining_time": "2:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 4438, "loss": 0.1218, "learning_rate": 4.084791888502135e-07, "epoch": 0.8246261300588617, "percentage": 82.47, "elapsed_time": "11:05:57", "remaining_time": "2:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3661, "total_steps": 4438, "loss": 0.1238, "learning_rate": 4.0745927077366493e-07, "epoch": 0.8248514377446701, "percentage": 82.49, "elapsed_time": "11:06:07", "remaining_time": "2:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3662, "total_steps": 4438, "loss": 0.1314, "learning_rate": 4.0644051460698634e-07, "epoch": 0.8250767454304785, "percentage": 82.51, "elapsed_time": "11:06:19", "remaining_time": "2:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3663, "total_steps": 4438, "loss": 0.1196, "learning_rate": 4.0542292091585447e-07, "epoch": 0.8253020531162869, "percentage": 82.54, "elapsed_time": "11:06:29", "remaining_time": "2:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3664, "total_steps": 4438, "loss": 0.1248, "learning_rate": 4.0440649026530166e-07, "epoch": 0.8255273608020953, "percentage": 82.56, "elapsed_time": "11:06:40", "remaining_time": "2:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3665, "total_steps": 4438, "loss": 0.1325, "learning_rate": 4.033912232197132e-07, "epoch": 0.8257526684879037, "percentage": 82.58, "elapsed_time": "11:06:51", "remaining_time": "2:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3666, "total_steps": 4438, "loss": 0.1171, "learning_rate": 4.0237712034283004e-07, "epoch": 0.8259779761737123, "percentage": 82.6, "elapsed_time": "11:07:00", "remaining_time": "2:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3667, "total_steps": 4438, "loss": 0.1223, "learning_rate": 4.0136418219774457e-07, "epoch": 0.8262032838595207, "percentage": 82.63, "elapsed_time": "11:07:11", "remaining_time": "2:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3668, "total_steps": 4438, "loss": 0.1206, "learning_rate": 4.003524093469041e-07, "epoch": 0.8264285915453291, "percentage": 82.65, "elapsed_time": "11:07:22", "remaining_time": "2:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3669, "total_steps": 4438, "loss": 0.1332, "learning_rate": 3.993418023521092e-07, "epoch": 0.8266538992311375, "percentage": 82.67, "elapsed_time": "11:07:34", "remaining_time": "2:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 4438, "loss": 0.1232, "learning_rate": 3.983323617745111e-07, "epoch": 0.8268792069169459, "percentage": 82.69, "elapsed_time": "11:07:44", "remaining_time": "2:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3671, "total_steps": 4438, "loss": 0.1213, "learning_rate": 3.9732408817461544e-07, "epoch": 0.8271045146027544, "percentage": 82.72, "elapsed_time": "11:07:54", "remaining_time": "2:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3672, "total_steps": 4438, "loss": 0.1114, "learning_rate": 3.963169821122778e-07, "epoch": 0.8273298222885628, "percentage": 82.74, "elapsed_time": "11:08:04", "remaining_time": "2:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3673, "total_steps": 4438, "loss": 0.1131, "learning_rate": 3.953110441467073e-07, "epoch": 0.8275551299743712, "percentage": 82.76, "elapsed_time": "11:08:13", "remaining_time": "2:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3674, "total_steps": 4438, "loss": 0.1377, "learning_rate": 3.943062748364651e-07, "epoch": 0.8277804376601797, "percentage": 82.79, "elapsed_time": "11:08:24", "remaining_time": "2:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3675, "total_steps": 4438, "loss": 0.1167, "learning_rate": 3.9330267473945973e-07, "epoch": 0.8280057453459881, "percentage": 82.81, "elapsed_time": "11:08:35", "remaining_time": "2:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3676, "total_steps": 4438, "loss": 0.1322, "learning_rate": 3.9230024441295394e-07, "epoch": 0.8282310530317966, "percentage": 82.83, "elapsed_time": "11:08:46", "remaining_time": "2:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3677, "total_steps": 4438, "loss": 0.1253, "learning_rate": 3.9129898441356064e-07, "epoch": 0.828456360717605, "percentage": 82.85, "elapsed_time": "11:08:57", "remaining_time": "2:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3678, "total_steps": 4438, "loss": 0.1189, "learning_rate": 3.9029889529724113e-07, "epoch": 0.8286816684034134, "percentage": 82.88, "elapsed_time": "11:09:07", "remaining_time": "2:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3679, "total_steps": 4438, "loss": 0.1304, "learning_rate": 3.892999776193085e-07, "epoch": 0.8289069760892218, "percentage": 82.9, "elapsed_time": "11:09:18", "remaining_time": "2:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 4438, "loss": 0.1138, "learning_rate": 3.8830223193442345e-07, "epoch": 0.8291322837750302, "percentage": 82.92, "elapsed_time": "11:09:28", "remaining_time": "2:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3681, "total_steps": 4438, "loss": 0.1387, "learning_rate": 3.8730565879659845e-07, "epoch": 0.8293575914608388, "percentage": 82.94, "elapsed_time": "11:09:39", "remaining_time": "2:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3682, "total_steps": 4438, "loss": 0.1243, "learning_rate": 3.863102587591919e-07, "epoch": 0.8295828991466472, "percentage": 82.97, "elapsed_time": "11:09:50", "remaining_time": "2:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3683, "total_steps": 4438, "loss": 0.1579, "learning_rate": 3.853160323749128e-07, "epoch": 0.8298082068324556, "percentage": 82.99, "elapsed_time": "11:10:01", "remaining_time": "2:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3684, "total_steps": 4438, "loss": 0.1296, "learning_rate": 3.84322980195819e-07, "epoch": 0.830033514518264, "percentage": 83.01, "elapsed_time": "11:10:14", "remaining_time": "2:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3685, "total_steps": 4438, "loss": 0.1444, "learning_rate": 3.833311027733139e-07, "epoch": 0.8302588222040724, "percentage": 83.03, "elapsed_time": "11:10:24", "remaining_time": "2:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3686, "total_steps": 4438, "loss": 0.1248, "learning_rate": 3.823404006581513e-07, "epoch": 0.8304841298898809, "percentage": 83.06, "elapsed_time": "11:10:35", "remaining_time": "2:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3687, "total_steps": 4438, "loss": 0.1238, "learning_rate": 3.8135087440043017e-07, "epoch": 0.8307094375756893, "percentage": 83.08, "elapsed_time": "11:10:46", "remaining_time": "2:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3688, "total_steps": 4438, "loss": 0.1434, "learning_rate": 3.8036252454959844e-07, "epoch": 0.8309347452614977, "percentage": 83.1, "elapsed_time": "11:10:56", "remaining_time": "2:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3689, "total_steps": 4438, "loss": 0.1376, "learning_rate": 3.7937535165444875e-07, "epoch": 0.8311600529473062, "percentage": 83.12, "elapsed_time": "11:11:05", "remaining_time": "2:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 4438, "loss": 0.1124, "learning_rate": 3.7838935626312246e-07, "epoch": 0.8313853606331146, "percentage": 83.15, "elapsed_time": "11:11:15", "remaining_time": "2:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3691, "total_steps": 4438, "loss": 0.1313, "learning_rate": 3.7740453892310596e-07, "epoch": 0.831610668318923, "percentage": 83.17, "elapsed_time": "11:11:26", "remaining_time": "2:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3692, "total_steps": 4438, "loss": 0.1304, "learning_rate": 3.764209001812316e-07, "epoch": 0.8318359760047315, "percentage": 83.19, "elapsed_time": "11:11:36", "remaining_time": "2:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3693, "total_steps": 4438, "loss": 0.1321, "learning_rate": 3.754384405836767e-07, "epoch": 0.8320612836905399, "percentage": 83.21, "elapsed_time": "11:11:47", "remaining_time": "2:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3694, "total_steps": 4438, "loss": 0.1177, "learning_rate": 3.7445716067596506e-07, "epoch": 0.8322865913763483, "percentage": 83.24, "elapsed_time": "11:11:58", "remaining_time": "2:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3695, "total_steps": 4438, "loss": 0.1299, "learning_rate": 3.734770610029642e-07, "epoch": 0.8325118990621567, "percentage": 83.26, "elapsed_time": "11:12:08", "remaining_time": "2:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3696, "total_steps": 4438, "loss": 0.1308, "learning_rate": 3.72498142108888e-07, "epoch": 0.8327372067479651, "percentage": 83.28, "elapsed_time": "11:12:19", "remaining_time": "2:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3697, "total_steps": 4438, "loss": 0.1338, "learning_rate": 3.7152040453729223e-07, "epoch": 0.8329625144337737, "percentage": 83.3, "elapsed_time": "11:12:30", "remaining_time": "2:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3698, "total_steps": 4438, "loss": 0.1158, "learning_rate": 3.705438488310792e-07, "epoch": 0.8331878221195821, "percentage": 83.33, "elapsed_time": "11:12:40", "remaining_time": "2:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3699, "total_steps": 4438, "loss": 0.1189, "learning_rate": 3.695684755324938e-07, "epoch": 0.8334131298053905, "percentage": 83.35, "elapsed_time": "11:12:50", "remaining_time": "2:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 4438, "loss": 0.138, "learning_rate": 3.6859428518312394e-07, "epoch": 0.8336384374911989, "percentage": 83.37, "elapsed_time": "11:13:01", "remaining_time": "2:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3701, "total_steps": 4438, "loss": 0.1332, "learning_rate": 3.6762127832390194e-07, "epoch": 0.8338637451770073, "percentage": 83.39, "elapsed_time": "11:13:11", "remaining_time": "2:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3702, "total_steps": 4438, "loss": 0.1233, "learning_rate": 3.666494554951014e-07, "epoch": 0.8340890528628158, "percentage": 83.42, "elapsed_time": "11:13:21", "remaining_time": "2:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3703, "total_steps": 4438, "loss": 0.1144, "learning_rate": 3.656788172363401e-07, "epoch": 0.8343143605486242, "percentage": 83.44, "elapsed_time": "11:13:30", "remaining_time": "2:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3704, "total_steps": 4438, "loss": 0.1303, "learning_rate": 3.6470936408657647e-07, "epoch": 0.8345396682344326, "percentage": 83.46, "elapsed_time": "11:13:41", "remaining_time": "2:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3705, "total_steps": 4438, "loss": 0.134, "learning_rate": 3.6374109658411207e-07, "epoch": 0.8347649759202411, "percentage": 83.48, "elapsed_time": "11:13:52", "remaining_time": "2:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3706, "total_steps": 4438, "loss": 0.1228, "learning_rate": 3.6277401526659067e-07, "epoch": 0.8349902836060495, "percentage": 83.51, "elapsed_time": "11:14:03", "remaining_time": "2:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3707, "total_steps": 4438, "loss": 0.1294, "learning_rate": 3.6180812067099477e-07, "epoch": 0.835215591291858, "percentage": 83.53, "elapsed_time": "11:14:13", "remaining_time": "2:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3708, "total_steps": 4438, "loss": 0.1251, "learning_rate": 3.6084341333365135e-07, "epoch": 0.8354408989776664, "percentage": 83.55, "elapsed_time": "11:14:24", "remaining_time": "2:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3709, "total_steps": 4438, "loss": 0.1256, "learning_rate": 3.5987989379022536e-07, "epoch": 0.8356662066634748, "percentage": 83.57, "elapsed_time": "11:14:34", "remaining_time": "2:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 4438, "loss": 0.1134, "learning_rate": 3.58917562575723e-07, "epoch": 0.8358915143492832, "percentage": 83.6, "elapsed_time": "11:14:45", "remaining_time": "2:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3711, "total_steps": 4438, "loss": 0.129, "learning_rate": 3.57956420224492e-07, "epoch": 0.8361168220350916, "percentage": 83.62, "elapsed_time": "11:14:54", "remaining_time": "2:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3712, "total_steps": 4438, "loss": 0.1314, "learning_rate": 3.569964672702178e-07, "epoch": 0.8363421297209, "percentage": 83.64, "elapsed_time": "11:15:07", "remaining_time": "2:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3713, "total_steps": 4438, "loss": 0.1193, "learning_rate": 3.5603770424592785e-07, "epoch": 0.8365674374067086, "percentage": 83.66, "elapsed_time": "11:15:17", "remaining_time": "2:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3714, "total_steps": 4438, "loss": 0.1189, "learning_rate": 3.550801316839858e-07, "epoch": 0.836792745092517, "percentage": 83.69, "elapsed_time": "11:15:28", "remaining_time": "2:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3715, "total_steps": 4438, "loss": 0.1428, "learning_rate": 3.5412375011609714e-07, "epoch": 0.8370180527783254, "percentage": 83.71, "elapsed_time": "11:15:39", "remaining_time": "2:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3716, "total_steps": 4438, "loss": 0.1248, "learning_rate": 3.531685600733051e-07, "epoch": 0.8372433604641338, "percentage": 83.73, "elapsed_time": "11:15:51", "remaining_time": "2:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3717, "total_steps": 4438, "loss": 0.1224, "learning_rate": 3.5221456208598987e-07, "epoch": 0.8374686681499423, "percentage": 83.75, "elapsed_time": "11:16:00", "remaining_time": "2:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3718, "total_steps": 4438, "loss": 0.1257, "learning_rate": 3.5126175668387275e-07, "epoch": 0.8376939758357507, "percentage": 83.78, "elapsed_time": "11:16:11", "remaining_time": "2:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3719, "total_steps": 4438, "loss": 0.1262, "learning_rate": 3.503101443960094e-07, "epoch": 0.8379192835215591, "percentage": 83.8, "elapsed_time": "11:16:22", "remaining_time": "2:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 4438, "loss": 0.1302, "learning_rate": 3.4935972575079524e-07, "epoch": 0.8381445912073675, "percentage": 83.82, "elapsed_time": "11:16:33", "remaining_time": "2:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3721, "total_steps": 4438, "loss": 0.1213, "learning_rate": 3.484105012759631e-07, "epoch": 0.838369898893176, "percentage": 83.84, "elapsed_time": "11:16:43", "remaining_time": "2:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3722, "total_steps": 4438, "loss": 0.1315, "learning_rate": 3.474624714985805e-07, "epoch": 0.8385952065789845, "percentage": 83.87, "elapsed_time": "11:16:53", "remaining_time": "2:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3723, "total_steps": 4438, "loss": 0.1321, "learning_rate": 3.465156369450545e-07, "epoch": 0.8388205142647929, "percentage": 83.89, "elapsed_time": "11:17:04", "remaining_time": "2:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3724, "total_steps": 4438, "loss": 0.1257, "learning_rate": 3.455699981411259e-07, "epoch": 0.8390458219506013, "percentage": 83.91, "elapsed_time": "11:17:14", "remaining_time": "2:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3725, "total_steps": 4438, "loss": 0.1255, "learning_rate": 3.446255556118736e-07, "epoch": 0.8392711296364097, "percentage": 83.93, "elapsed_time": "11:17:24", "remaining_time": "2:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3726, "total_steps": 4438, "loss": 0.1223, "learning_rate": 3.436823098817102e-07, "epoch": 0.8394964373222181, "percentage": 83.96, "elapsed_time": "11:17:34", "remaining_time": "2:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3727, "total_steps": 4438, "loss": 0.1145, "learning_rate": 3.427402614743863e-07, "epoch": 0.8397217450080265, "percentage": 83.98, "elapsed_time": "11:17:45", "remaining_time": "2:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3728, "total_steps": 4438, "loss": 0.1265, "learning_rate": 3.417994109129852e-07, "epoch": 0.8399470526938351, "percentage": 84.0, "elapsed_time": "11:17:56", "remaining_time": "2:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3729, "total_steps": 4438, "loss": 0.1164, "learning_rate": 3.408597587199261e-07, "epoch": 0.8401723603796435, "percentage": 84.02, "elapsed_time": "11:18:07", "remaining_time": "2:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 4438, "loss": 0.1201, "learning_rate": 3.3992130541696336e-07, "epoch": 0.8403976680654519, "percentage": 84.05, "elapsed_time": "11:18:19", "remaining_time": "2:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3731, "total_steps": 4438, "loss": 0.1176, "learning_rate": 3.389840515251855e-07, "epoch": 0.8406229757512603, "percentage": 84.07, "elapsed_time": "11:18:30", "remaining_time": "2:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3732, "total_steps": 4438, "loss": 0.1234, "learning_rate": 3.3804799756501335e-07, "epoch": 0.8408482834370687, "percentage": 84.09, "elapsed_time": "11:18:40", "remaining_time": "2:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3733, "total_steps": 4438, "loss": 0.1167, "learning_rate": 3.371131440562042e-07, "epoch": 0.8410735911228772, "percentage": 84.11, "elapsed_time": "11:18:50", "remaining_time": "2:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3734, "total_steps": 4438, "loss": 0.1311, "learning_rate": 3.3617949151784623e-07, "epoch": 0.8412988988086856, "percentage": 84.14, "elapsed_time": "11:19:01", "remaining_time": "2:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3735, "total_steps": 4438, "loss": 0.1319, "learning_rate": 3.3524704046836305e-07, "epoch": 0.841524206494494, "percentage": 84.16, "elapsed_time": "11:19:11", "remaining_time": "2:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3736, "total_steps": 4438, "loss": 0.1193, "learning_rate": 3.343157914255085e-07, "epoch": 0.8417495141803025, "percentage": 84.18, "elapsed_time": "11:19:22", "remaining_time": "2:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3737, "total_steps": 4438, "loss": 0.1147, "learning_rate": 3.3338574490637154e-07, "epoch": 0.841974821866111, "percentage": 84.2, "elapsed_time": "11:19:33", "remaining_time": "2:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3738, "total_steps": 4438, "loss": 0.1132, "learning_rate": 3.3245690142737236e-07, "epoch": 0.8422001295519194, "percentage": 84.23, "elapsed_time": "11:19:43", "remaining_time": "2:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3739, "total_steps": 4438, "loss": 0.1201, "learning_rate": 3.3152926150426256e-07, "epoch": 0.8424254372377278, "percentage": 84.25, "elapsed_time": "11:19:54", "remaining_time": "2:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 4438, "loss": 0.1239, "learning_rate": 3.306028256521265e-07, "epoch": 0.8426507449235362, "percentage": 84.27, "elapsed_time": "11:20:04", "remaining_time": "2:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3741, "total_steps": 4438, "loss": 0.1355, "learning_rate": 3.296775943853789e-07, "epoch": 0.8428760526093446, "percentage": 84.29, "elapsed_time": "11:20:15", "remaining_time": "2:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3742, "total_steps": 4438, "loss": 0.1352, "learning_rate": 3.287535682177667e-07, "epoch": 0.843101360295153, "percentage": 84.32, "elapsed_time": "11:20:25", "remaining_time": "2:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3743, "total_steps": 4438, "loss": 0.1246, "learning_rate": 3.278307476623674e-07, "epoch": 0.8433266679809615, "percentage": 84.34, "elapsed_time": "11:20:36", "remaining_time": "2:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3744, "total_steps": 4438, "loss": 0.1323, "learning_rate": 3.2690913323158795e-07, "epoch": 0.84355197566677, "percentage": 84.36, "elapsed_time": "11:20:47", "remaining_time": "2:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3745, "total_steps": 4438, "loss": 0.1321, "learning_rate": 3.259887254371677e-07, "epoch": 0.8437772833525784, "percentage": 84.38, "elapsed_time": "11:20:59", "remaining_time": "2:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3746, "total_steps": 4438, "loss": 0.1329, "learning_rate": 3.2506952479017417e-07, "epoch": 0.8440025910383868, "percentage": 84.41, "elapsed_time": "11:21:11", "remaining_time": "2:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3747, "total_steps": 4438, "loss": 0.1334, "learning_rate": 3.241515318010044e-07, "epoch": 0.8442278987241952, "percentage": 84.43, "elapsed_time": "11:21:22", "remaining_time": "2:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3748, "total_steps": 4438, "loss": 0.1367, "learning_rate": 3.2323474697938727e-07, "epoch": 0.8444532064100037, "percentage": 84.45, "elapsed_time": "11:21:33", "remaining_time": "2:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3749, "total_steps": 4438, "loss": 0.1354, "learning_rate": 3.223191708343776e-07, "epoch": 0.8446785140958121, "percentage": 84.47, "elapsed_time": "11:21:43", "remaining_time": "2:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 4438, "loss": 0.1274, "learning_rate": 3.214048038743622e-07, "epoch": 0.8449038217816205, "percentage": 84.5, "elapsed_time": "11:21:54", "remaining_time": "2:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3751, "total_steps": 4438, "loss": 0.1228, "learning_rate": 3.204916466070537e-07, "epoch": 0.8451291294674289, "percentage": 84.52, "elapsed_time": "11:22:05", "remaining_time": "2:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3752, "total_steps": 4438, "loss": 0.1279, "learning_rate": 3.1957969953949506e-07, "epoch": 0.8453544371532374, "percentage": 84.54, "elapsed_time": "11:22:16", "remaining_time": "2:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3753, "total_steps": 4438, "loss": 0.1254, "learning_rate": 3.186689631780565e-07, "epoch": 0.8455797448390459, "percentage": 84.57, "elapsed_time": "11:22:27", "remaining_time": "2:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3754, "total_steps": 4438, "loss": 0.1514, "learning_rate": 3.1775943802843546e-07, "epoch": 0.8458050525248543, "percentage": 84.59, "elapsed_time": "11:22:38", "remaining_time": "2:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3755, "total_steps": 4438, "loss": 0.1288, "learning_rate": 3.168511245956582e-07, "epoch": 0.8460303602106627, "percentage": 84.61, "elapsed_time": "11:22:48", "remaining_time": "2:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3756, "total_steps": 4438, "loss": 0.1353, "learning_rate": 3.1594402338407633e-07, "epoch": 0.8462556678964711, "percentage": 84.63, "elapsed_time": "11:22:59", "remaining_time": "2:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3757, "total_steps": 4438, "loss": 0.121, "learning_rate": 3.1503813489736995e-07, "epoch": 0.8464809755822795, "percentage": 84.66, "elapsed_time": "11:23:09", "remaining_time": "2:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3758, "total_steps": 4438, "loss": 0.1233, "learning_rate": 3.141334596385448e-07, "epoch": 0.846706283268088, "percentage": 84.68, "elapsed_time": "11:23:21", "remaining_time": "2:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3759, "total_steps": 4438, "loss": 0.14, "learning_rate": 3.132299981099335e-07, "epoch": 0.8469315909538964, "percentage": 84.7, "elapsed_time": "11:23:32", "remaining_time": "2:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 4438, "loss": 0.1338, "learning_rate": 3.12327750813195e-07, "epoch": 0.8471568986397049, "percentage": 84.72, "elapsed_time": "11:23:41", "remaining_time": "2:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3761, "total_steps": 4438, "loss": 0.1224, "learning_rate": 3.1142671824931275e-07, "epoch": 0.8473822063255133, "percentage": 84.75, "elapsed_time": "11:23:52", "remaining_time": "2:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3762, "total_steps": 4438, "loss": 0.1367, "learning_rate": 3.105269009185974e-07, "epoch": 0.8476075140113217, "percentage": 84.77, "elapsed_time": "11:24:02", "remaining_time": "2:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3763, "total_steps": 4438, "loss": 0.1256, "learning_rate": 3.096282993206837e-07, "epoch": 0.8478328216971301, "percentage": 84.79, "elapsed_time": "11:24:12", "remaining_time": "2:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3764, "total_steps": 4438, "loss": 0.1234, "learning_rate": 3.087309139545311e-07, "epoch": 0.8480581293829386, "percentage": 84.81, "elapsed_time": "11:24:22", "remaining_time": "2:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3765, "total_steps": 4438, "loss": 0.1229, "learning_rate": 3.0783474531842497e-07, "epoch": 0.848283437068747, "percentage": 84.84, "elapsed_time": "11:24:33", "remaining_time": "2:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3766, "total_steps": 4438, "loss": 0.1148, "learning_rate": 3.0693979390997333e-07, "epoch": 0.8485087447545554, "percentage": 84.86, "elapsed_time": "11:24:43", "remaining_time": "2:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3767, "total_steps": 4438, "loss": 0.1309, "learning_rate": 3.0604606022611033e-07, "epoch": 0.8487340524403638, "percentage": 84.88, "elapsed_time": "11:24:53", "remaining_time": "2:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3768, "total_steps": 4438, "loss": 0.1212, "learning_rate": 3.0515354476309293e-07, "epoch": 0.8489593601261723, "percentage": 84.9, "elapsed_time": "11:25:02", "remaining_time": "2:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3769, "total_steps": 4438, "loss": 0.117, "learning_rate": 3.042622480165011e-07, "epoch": 0.8491846678119808, "percentage": 84.93, "elapsed_time": "11:25:13", "remaining_time": "2:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 4438, "loss": 0.1366, "learning_rate": 3.033721704812395e-07, "epoch": 0.8494099754977892, "percentage": 84.95, "elapsed_time": "11:25:24", "remaining_time": "2:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3771, "total_steps": 4438, "loss": 0.1258, "learning_rate": 3.024833126515339e-07, "epoch": 0.8496352831835976, "percentage": 84.97, "elapsed_time": "11:25:36", "remaining_time": "2:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3772, "total_steps": 4438, "loss": 0.1263, "learning_rate": 3.0159567502093535e-07, "epoch": 0.849860590869406, "percentage": 84.99, "elapsed_time": "11:25:45", "remaining_time": "2:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3773, "total_steps": 4438, "loss": 0.1193, "learning_rate": 3.0070925808231456e-07, "epoch": 0.8500858985552144, "percentage": 85.02, "elapsed_time": "11:25:55", "remaining_time": "2:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3774, "total_steps": 4438, "loss": 0.1168, "learning_rate": 2.9982406232786614e-07, "epoch": 0.8503112062410229, "percentage": 85.04, "elapsed_time": "11:26:07", "remaining_time": "2:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3775, "total_steps": 4438, "loss": 0.1097, "learning_rate": 2.9894008824910726e-07, "epoch": 0.8505365139268314, "percentage": 85.06, "elapsed_time": "11:26:17", "remaining_time": "2:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3776, "total_steps": 4438, "loss": 0.126, "learning_rate": 2.9805733633687467e-07, "epoch": 0.8507618216126398, "percentage": 85.08, "elapsed_time": "11:26:26", "remaining_time": "2:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3777, "total_steps": 4438, "loss": 0.1265, "learning_rate": 2.9717580708132856e-07, "epoch": 0.8509871292984482, "percentage": 85.11, "elapsed_time": "11:26:36", "remaining_time": "2:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3778, "total_steps": 4438, "loss": 0.1198, "learning_rate": 2.9629550097194787e-07, "epoch": 0.8512124369842566, "percentage": 85.13, "elapsed_time": "11:26:48", "remaining_time": "1:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3779, "total_steps": 4438, "loss": 0.1249, "learning_rate": 2.9541641849753557e-07, "epoch": 0.851437744670065, "percentage": 85.15, "elapsed_time": "11:26:58", "remaining_time": "1:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 4438, "loss": 0.1211, "learning_rate": 2.9453856014621224e-07, "epoch": 0.8516630523558735, "percentage": 85.17, "elapsed_time": "11:27:09", "remaining_time": "1:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3781, "total_steps": 4438, "loss": 0.1197, "learning_rate": 2.936619264054194e-07, "epoch": 0.8518883600416819, "percentage": 85.2, "elapsed_time": "11:27:22", "remaining_time": "1:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3782, "total_steps": 4438, "loss": 0.1201, "learning_rate": 2.9278651776192073e-07, "epoch": 0.8521136677274903, "percentage": 85.22, "elapsed_time": "11:27:33", "remaining_time": "1:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3783, "total_steps": 4438, "loss": 0.1287, "learning_rate": 2.919123347017963e-07, "epoch": 0.8523389754132988, "percentage": 85.24, "elapsed_time": "11:27:43", "remaining_time": "1:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3784, "total_steps": 4438, "loss": 0.1229, "learning_rate": 2.910393777104481e-07, "epoch": 0.8525642830991073, "percentage": 85.26, "elapsed_time": "11:27:53", "remaining_time": "1:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3785, "total_steps": 4438, "loss": 0.1209, "learning_rate": 2.901676472725973e-07, "epoch": 0.8527895907849157, "percentage": 85.29, "elapsed_time": "11:28:04", "remaining_time": "1:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3786, "total_steps": 4438, "loss": 0.1253, "learning_rate": 2.892971438722822e-07, "epoch": 0.8530148984707241, "percentage": 85.31, "elapsed_time": "11:28:14", "remaining_time": "1:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3787, "total_steps": 4438, "loss": 0.1315, "learning_rate": 2.8842786799286204e-07, "epoch": 0.8532402061565325, "percentage": 85.33, "elapsed_time": "11:28:26", "remaining_time": "1:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3788, "total_steps": 4438, "loss": 0.1249, "learning_rate": 2.8755982011701183e-07, "epoch": 0.8534655138423409, "percentage": 85.35, "elapsed_time": "11:28:36", "remaining_time": "1:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3789, "total_steps": 4438, "loss": 0.1218, "learning_rate": 2.866930007267274e-07, "epoch": 0.8536908215281493, "percentage": 85.38, "elapsed_time": "11:28:47", "remaining_time": "1:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 4438, "loss": 0.1272, "learning_rate": 2.8582741030332095e-07, "epoch": 0.8539161292139578, "percentage": 85.4, "elapsed_time": "11:28:57", "remaining_time": "1:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3791, "total_steps": 4438, "loss": 0.1172, "learning_rate": 2.8496304932742247e-07, "epoch": 0.8541414368997663, "percentage": 85.42, "elapsed_time": "11:29:09", "remaining_time": "1:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3792, "total_steps": 4438, "loss": 0.1277, "learning_rate": 2.840999182789797e-07, "epoch": 0.8543667445855747, "percentage": 85.44, "elapsed_time": "11:29:21", "remaining_time": "1:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3793, "total_steps": 4438, "loss": 0.1198, "learning_rate": 2.8323801763725623e-07, "epoch": 0.8545920522713831, "percentage": 85.47, "elapsed_time": "11:29:33", "remaining_time": "1:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3794, "total_steps": 4438, "loss": 0.1383, "learning_rate": 2.823773478808348e-07, "epoch": 0.8548173599571915, "percentage": 85.49, "elapsed_time": "11:29:45", "remaining_time": "1:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3795, "total_steps": 4438, "loss": 0.1253, "learning_rate": 2.8151790948761165e-07, "epoch": 0.855042667643, "percentage": 85.51, "elapsed_time": "11:29:55", "remaining_time": "1:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3796, "total_steps": 4438, "loss": 0.1355, "learning_rate": 2.806597029348018e-07, "epoch": 0.8552679753288084, "percentage": 85.53, "elapsed_time": "11:30:06", "remaining_time": "1:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3797, "total_steps": 4438, "loss": 0.1262, "learning_rate": 2.7980272869893633e-07, "epoch": 0.8554932830146168, "percentage": 85.56, "elapsed_time": "11:30:17", "remaining_time": "1:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3798, "total_steps": 4438, "loss": 0.1209, "learning_rate": 2.7894698725585866e-07, "epoch": 0.8557185907004252, "percentage": 85.58, "elapsed_time": "11:30:28", "remaining_time": "1:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3799, "total_steps": 4438, "loss": 0.1395, "learning_rate": 2.7809247908073184e-07, "epoch": 0.8559438983862337, "percentage": 85.6, "elapsed_time": "11:30:40", "remaining_time": "1:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 4438, "loss": 0.1241, "learning_rate": 2.772392046480324e-07, "epoch": 0.8561692060720422, "percentage": 85.62, "elapsed_time": "11:30:50", "remaining_time": "1:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3801, "total_steps": 4438, "loss": 0.1335, "learning_rate": 2.763871644315508e-07, "epoch": 0.8563945137578506, "percentage": 85.65, "elapsed_time": "11:31:00", "remaining_time": "1:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3802, "total_steps": 4438, "loss": 0.1256, "learning_rate": 2.755363589043944e-07, "epoch": 0.856619821443659, "percentage": 85.67, "elapsed_time": "11:31:11", "remaining_time": "1:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3803, "total_steps": 4438, "loss": 0.1344, "learning_rate": 2.746867885389828e-07, "epoch": 0.8568451291294674, "percentage": 85.69, "elapsed_time": "11:31:20", "remaining_time": "1:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3804, "total_steps": 4438, "loss": 0.1186, "learning_rate": 2.738384538070518e-07, "epoch": 0.8570704368152758, "percentage": 85.71, "elapsed_time": "11:31:31", "remaining_time": "1:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3805, "total_steps": 4438, "loss": 0.1354, "learning_rate": 2.7299135517964897e-07, "epoch": 0.8572957445010843, "percentage": 85.74, "elapsed_time": "11:31:42", "remaining_time": "1:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3806, "total_steps": 4438, "loss": 0.1184, "learning_rate": 2.7214549312713723e-07, "epoch": 0.8575210521868927, "percentage": 85.76, "elapsed_time": "11:31:52", "remaining_time": "1:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3807, "total_steps": 4438, "loss": 0.1295, "learning_rate": 2.713008681191923e-07, "epoch": 0.8577463598727012, "percentage": 85.78, "elapsed_time": "11:32:03", "remaining_time": "1:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3808, "total_steps": 4438, "loss": 0.1172, "learning_rate": 2.7045748062480254e-07, "epoch": 0.8579716675585096, "percentage": 85.8, "elapsed_time": "11:32:13", "remaining_time": "1:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3809, "total_steps": 4438, "loss": 0.1219, "learning_rate": 2.696153311122704e-07, "epoch": 0.858196975244318, "percentage": 85.83, "elapsed_time": "11:32:23", "remaining_time": "1:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 4438, "loss": 0.1275, "learning_rate": 2.6877442004920873e-07, "epoch": 0.8584222829301265, "percentage": 85.85, "elapsed_time": "11:32:33", "remaining_time": "1:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3811, "total_steps": 4438, "loss": 0.1289, "learning_rate": 2.6793474790254516e-07, "epoch": 0.8586475906159349, "percentage": 85.87, "elapsed_time": "11:32:44", "remaining_time": "1:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3812, "total_steps": 4438, "loss": 0.1282, "learning_rate": 2.6709631513851834e-07, "epoch": 0.8588728983017433, "percentage": 85.89, "elapsed_time": "11:32:55", "remaining_time": "1:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3813, "total_steps": 4438, "loss": 0.13, "learning_rate": 2.6625912222267844e-07, "epoch": 0.8590982059875517, "percentage": 85.92, "elapsed_time": "11:33:07", "remaining_time": "1:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3814, "total_steps": 4438, "loss": 0.1221, "learning_rate": 2.654231696198878e-07, "epoch": 0.8593235136733601, "percentage": 85.94, "elapsed_time": "11:33:19", "remaining_time": "1:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3815, "total_steps": 4438, "loss": 0.1146, "learning_rate": 2.645884577943192e-07, "epoch": 0.8595488213591687, "percentage": 85.96, "elapsed_time": "11:33:29", "remaining_time": "1:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3816, "total_steps": 4438, "loss": 0.1327, "learning_rate": 2.6375498720945717e-07, "epoch": 0.8597741290449771, "percentage": 85.98, "elapsed_time": "11:33:39", "remaining_time": "1:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3817, "total_steps": 4438, "loss": 0.1246, "learning_rate": 2.629227583280972e-07, "epoch": 0.8599994367307855, "percentage": 86.01, "elapsed_time": "11:33:48", "remaining_time": "1:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3818, "total_steps": 4438, "loss": 0.1467, "learning_rate": 2.620917716123444e-07, "epoch": 0.8602247444165939, "percentage": 86.03, "elapsed_time": "11:33:58", "remaining_time": "1:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3819, "total_steps": 4438, "loss": 0.1288, "learning_rate": 2.6126202752361554e-07, "epoch": 0.8604500521024023, "percentage": 86.05, "elapsed_time": "11:34:09", "remaining_time": "1:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 4438, "loss": 0.1242, "learning_rate": 2.604335265226354e-07, "epoch": 0.8606753597882107, "percentage": 86.07, "elapsed_time": "11:34:20", "remaining_time": "1:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3821, "total_steps": 4438, "loss": 0.1244, "learning_rate": 2.5960626906944066e-07, "epoch": 0.8609006674740192, "percentage": 86.1, "elapsed_time": "11:34:30", "remaining_time": "1:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3822, "total_steps": 4438, "loss": 0.1316, "learning_rate": 2.587802556233765e-07, "epoch": 0.8611259751598277, "percentage": 86.12, "elapsed_time": "11:34:41", "remaining_time": "1:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3823, "total_steps": 4438, "loss": 0.1173, "learning_rate": 2.5795548664309695e-07, "epoch": 0.8613512828456361, "percentage": 86.14, "elapsed_time": "11:34:51", "remaining_time": "1:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3824, "total_steps": 4438, "loss": 0.1216, "learning_rate": 2.571319625865662e-07, "epoch": 0.8615765905314445, "percentage": 86.16, "elapsed_time": "11:35:03", "remaining_time": "1:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3825, "total_steps": 4438, "loss": 0.1328, "learning_rate": 2.5630968391105515e-07, "epoch": 0.861801898217253, "percentage": 86.19, "elapsed_time": "11:35:12", "remaining_time": "1:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3826, "total_steps": 4438, "loss": 0.1175, "learning_rate": 2.5548865107314606e-07, "epoch": 0.8620272059030614, "percentage": 86.21, "elapsed_time": "11:35:23", "remaining_time": "1:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3827, "total_steps": 4438, "loss": 0.1161, "learning_rate": 2.546688645287268e-07, "epoch": 0.8622525135888698, "percentage": 86.23, "elapsed_time": "11:35:33", "remaining_time": "1:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3828, "total_steps": 4438, "loss": 0.1235, "learning_rate": 2.5385032473299433e-07, "epoch": 0.8624778212746782, "percentage": 86.26, "elapsed_time": "11:35:44", "remaining_time": "1:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3829, "total_steps": 4438, "loss": 0.1223, "learning_rate": 2.5303303214045423e-07, "epoch": 0.8627031289604866, "percentage": 86.28, "elapsed_time": "11:35:54", "remaining_time": "1:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 4438, "loss": 0.1409, "learning_rate": 2.522169872049174e-07, "epoch": 0.8629284366462951, "percentage": 86.3, "elapsed_time": "11:36:04", "remaining_time": "1:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3831, "total_steps": 4438, "loss": 0.1297, "learning_rate": 2.5140219037950416e-07, "epoch": 0.8631537443321036, "percentage": 86.32, "elapsed_time": "11:36:15", "remaining_time": "1:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3832, "total_steps": 4438, "loss": 0.1354, "learning_rate": 2.5058864211664064e-07, "epoch": 0.863379052017912, "percentage": 86.35, "elapsed_time": "11:36:26", "remaining_time": "1:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3833, "total_steps": 4438, "loss": 0.1498, "learning_rate": 2.4977634286805887e-07, "epoch": 0.8636043597037204, "percentage": 86.37, "elapsed_time": "11:36:37", "remaining_time": "1:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3834, "total_steps": 4438, "loss": 0.1214, "learning_rate": 2.4896529308479966e-07, "epoch": 0.8638296673895288, "percentage": 86.39, "elapsed_time": "11:36:50", "remaining_time": "1:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3835, "total_steps": 4438, "loss": 0.117, "learning_rate": 2.4815549321720755e-07, "epoch": 0.8640549750753372, "percentage": 86.41, "elapsed_time": "11:37:01", "remaining_time": "1:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 4438, "loss": 0.1154, "learning_rate": 2.4734694371493507e-07, "epoch": 0.8642802827611457, "percentage": 86.44, "elapsed_time": "11:37:12", "remaining_time": "1:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3837, "total_steps": 4438, "loss": 0.1198, "learning_rate": 2.4653964502693974e-07, "epoch": 0.8645055904469541, "percentage": 86.46, "elapsed_time": "11:37:23", "remaining_time": "1:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3838, "total_steps": 4438, "loss": 0.1278, "learning_rate": 2.4573359760148354e-07, "epoch": 0.8647308981327626, "percentage": 86.48, "elapsed_time": "11:37:35", "remaining_time": "1:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3839, "total_steps": 4438, "loss": 0.1289, "learning_rate": 2.449288018861354e-07, "epoch": 0.864956205818571, "percentage": 86.5, "elapsed_time": "11:37:45", "remaining_time": "1:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 4438, "loss": 0.1207, "learning_rate": 2.441252583277678e-07, "epoch": 0.8651815135043794, "percentage": 86.53, "elapsed_time": "11:37:56", "remaining_time": "1:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3841, "total_steps": 4438, "loss": 0.1121, "learning_rate": 2.433229673725593e-07, "epoch": 0.8654068211901879, "percentage": 86.55, "elapsed_time": "11:38:06", "remaining_time": "1:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3842, "total_steps": 4438, "loss": 0.1366, "learning_rate": 2.425219294659908e-07, "epoch": 0.8656321288759963, "percentage": 86.57, "elapsed_time": "11:38:15", "remaining_time": "1:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3843, "total_steps": 4438, "loss": 0.1345, "learning_rate": 2.4172214505285006e-07, "epoch": 0.8658574365618047, "percentage": 86.59, "elapsed_time": "11:38:27", "remaining_time": "1:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3844, "total_steps": 4438, "loss": 0.1241, "learning_rate": 2.409236145772276e-07, "epoch": 0.8660827442476131, "percentage": 86.62, "elapsed_time": "11:38:38", "remaining_time": "1:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3845, "total_steps": 4438, "loss": 0.1255, "learning_rate": 2.401263384825164e-07, "epoch": 0.8663080519334215, "percentage": 86.64, "elapsed_time": "11:38:49", "remaining_time": "1:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3846, "total_steps": 4438, "loss": 0.1175, "learning_rate": 2.393303172114159e-07, "epoch": 0.8665333596192301, "percentage": 86.66, "elapsed_time": "11:39:00", "remaining_time": "1:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3847, "total_steps": 4438, "loss": 0.1172, "learning_rate": 2.3853555120592506e-07, "epoch": 0.8667586673050385, "percentage": 86.68, "elapsed_time": "11:39:10", "remaining_time": "1:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3848, "total_steps": 4438, "loss": 0.118, "learning_rate": 2.377420409073497e-07, "epoch": 0.8669839749908469, "percentage": 86.71, "elapsed_time": "11:39:21", "remaining_time": "1:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3849, "total_steps": 4438, "loss": 0.1275, "learning_rate": 2.3694978675629476e-07, "epoch": 0.8672092826766553, "percentage": 86.73, "elapsed_time": "11:39:33", "remaining_time": "1:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 4438, "loss": 0.1403, "learning_rate": 2.3615878919267116e-07, "epoch": 0.8674345903624637, "percentage": 86.75, "elapsed_time": "11:39:43", "remaining_time": "1:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3851, "total_steps": 4438, "loss": 0.1325, "learning_rate": 2.3536904865568949e-07, "epoch": 0.8676598980482721, "percentage": 86.77, "elapsed_time": "11:39:54", "remaining_time": "1:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3852, "total_steps": 4438, "loss": 0.1275, "learning_rate": 2.345805655838626e-07, "epoch": 0.8678852057340806, "percentage": 86.8, "elapsed_time": "11:40:05", "remaining_time": "1:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3853, "total_steps": 4438, "loss": 0.1403, "learning_rate": 2.337933404150064e-07, "epoch": 0.868110513419889, "percentage": 86.82, "elapsed_time": "11:40:16", "remaining_time": "1:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3854, "total_steps": 4438, "loss": 0.133, "learning_rate": 2.3300737358623843e-07, "epoch": 0.8683358211056975, "percentage": 86.84, "elapsed_time": "11:40:27", "remaining_time": "1:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3855, "total_steps": 4438, "loss": 0.13, "learning_rate": 2.3222266553397542e-07, "epoch": 0.8685611287915059, "percentage": 86.86, "elapsed_time": "11:40:39", "remaining_time": "1:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3856, "total_steps": 4438, "loss": 0.1288, "learning_rate": 2.314392166939375e-07, "epoch": 0.8687864364773143, "percentage": 86.89, "elapsed_time": "11:40:49", "remaining_time": "1:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3857, "total_steps": 4438, "loss": 0.1138, "learning_rate": 2.3065702750114383e-07, "epoch": 0.8690117441631228, "percentage": 86.91, "elapsed_time": "11:40:59", "remaining_time": "1:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3858, "total_steps": 4438, "loss": 0.1252, "learning_rate": 2.2987609838991536e-07, "epoch": 0.8692370518489312, "percentage": 86.93, "elapsed_time": "11:41:09", "remaining_time": "1:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3859, "total_steps": 4438, "loss": 0.1242, "learning_rate": 2.2909642979387331e-07, "epoch": 0.8694623595347396, "percentage": 86.95, "elapsed_time": "11:41:19", "remaining_time": "1:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 4438, "loss": 0.1324, "learning_rate": 2.2831802214593774e-07, "epoch": 0.869687667220548, "percentage": 86.98, "elapsed_time": "11:41:31", "remaining_time": "1:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3861, "total_steps": 4438, "loss": 0.12, "learning_rate": 2.2754087587833014e-07, "epoch": 0.8699129749063564, "percentage": 87.0, "elapsed_time": "11:41:42", "remaining_time": "1:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3862, "total_steps": 4438, "loss": 0.1393, "learning_rate": 2.2676499142257002e-07, "epoch": 0.870138282592165, "percentage": 87.02, "elapsed_time": "11:41:52", "remaining_time": "1:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3863, "total_steps": 4438, "loss": 0.1242, "learning_rate": 2.2599036920947836e-07, "epoch": 0.8703635902779734, "percentage": 87.04, "elapsed_time": "11:42:02", "remaining_time": "1:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3864, "total_steps": 4438, "loss": 0.1223, "learning_rate": 2.2521700966917276e-07, "epoch": 0.8705888979637818, "percentage": 87.07, "elapsed_time": "11:42:13", "remaining_time": "1:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3865, "total_steps": 4438, "loss": 0.1216, "learning_rate": 2.2444491323107138e-07, "epoch": 0.8708142056495902, "percentage": 87.09, "elapsed_time": "11:42:23", "remaining_time": "1:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3866, "total_steps": 4438, "loss": 0.1269, "learning_rate": 2.23674080323891e-07, "epoch": 0.8710395133353986, "percentage": 87.11, "elapsed_time": "11:42:33", "remaining_time": "1:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3867, "total_steps": 4438, "loss": 0.1385, "learning_rate": 2.229045113756456e-07, "epoch": 0.8712648210212071, "percentage": 87.13, "elapsed_time": "11:42:44", "remaining_time": "1:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3868, "total_steps": 4438, "loss": 0.1352, "learning_rate": 2.221362068136493e-07, "epoch": 0.8714901287070155, "percentage": 87.16, "elapsed_time": "11:42:55", "remaining_time": "1:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3869, "total_steps": 4438, "loss": 0.1239, "learning_rate": 2.2136916706451212e-07, "epoch": 0.8717154363928239, "percentage": 87.18, "elapsed_time": "11:43:05", "remaining_time": "1:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 4438, "loss": 0.1252, "learning_rate": 2.2060339255414232e-07, "epoch": 0.8719407440786324, "percentage": 87.2, "elapsed_time": "11:43:15", "remaining_time": "1:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3871, "total_steps": 4438, "loss": 0.1172, "learning_rate": 2.198388837077467e-07, "epoch": 0.8721660517644408, "percentage": 87.22, "elapsed_time": "11:43:26", "remaining_time": "1:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3872, "total_steps": 4438, "loss": 0.1297, "learning_rate": 2.190756409498282e-07, "epoch": 0.8723913594502493, "percentage": 87.25, "elapsed_time": "11:43:37", "remaining_time": "1:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3873, "total_steps": 4438, "loss": 0.1405, "learning_rate": 2.1831366470418725e-07, "epoch": 0.8726166671360577, "percentage": 87.27, "elapsed_time": "11:43:49", "remaining_time": "1:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3874, "total_steps": 4438, "loss": 0.1218, "learning_rate": 2.175529553939204e-07, "epoch": 0.8728419748218661, "percentage": 87.29, "elapsed_time": "11:43:59", "remaining_time": "1:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3875, "total_steps": 4438, "loss": 0.1145, "learning_rate": 2.1679351344142146e-07, "epoch": 0.8730672825076745, "percentage": 87.31, "elapsed_time": "11:44:11", "remaining_time": "1:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3876, "total_steps": 4438, "loss": 0.1345, "learning_rate": 2.1603533926838088e-07, "epoch": 0.8732925901934829, "percentage": 87.34, "elapsed_time": "11:44:21", "remaining_time": "1:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3877, "total_steps": 4438, "loss": 0.1243, "learning_rate": 2.1527843329578328e-07, "epoch": 0.8735178978792915, "percentage": 87.36, "elapsed_time": "11:44:33", "remaining_time": "1:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3878, "total_steps": 4438, "loss": 0.1369, "learning_rate": 2.1452279594391167e-07, "epoch": 0.8737432055650999, "percentage": 87.38, "elapsed_time": "11:44:45", "remaining_time": "1:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3879, "total_steps": 4438, "loss": 0.1187, "learning_rate": 2.1376842763234178e-07, "epoch": 0.8739685132509083, "percentage": 87.4, "elapsed_time": "11:44:55", "remaining_time": "1:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 4438, "loss": 0.1179, "learning_rate": 2.1301532877994747e-07, "epoch": 0.8741938209367167, "percentage": 87.43, "elapsed_time": "11:45:06", "remaining_time": "1:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3881, "total_steps": 4438, "loss": 0.1363, "learning_rate": 2.1226349980489614e-07, "epoch": 0.8744191286225251, "percentage": 87.45, "elapsed_time": "11:45:17", "remaining_time": "1:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3882, "total_steps": 4438, "loss": 0.1244, "learning_rate": 2.1151294112464997e-07, "epoch": 0.8746444363083336, "percentage": 87.47, "elapsed_time": "11:45:28", "remaining_time": "1:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3883, "total_steps": 4438, "loss": 0.1335, "learning_rate": 2.1076365315596704e-07, "epoch": 0.874869743994142, "percentage": 87.49, "elapsed_time": "11:45:39", "remaining_time": "1:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3884, "total_steps": 4438, "loss": 0.1264, "learning_rate": 2.1001563631489807e-07, "epoch": 0.8750950516799504, "percentage": 87.52, "elapsed_time": "11:45:50", "remaining_time": "1:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3885, "total_steps": 4438, "loss": 0.124, "learning_rate": 2.0926889101679004e-07, "epoch": 0.8753203593657589, "percentage": 87.54, "elapsed_time": "11:46:02", "remaining_time": "1:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3886, "total_steps": 4438, "loss": 0.1327, "learning_rate": 2.0852341767628182e-07, "epoch": 0.8755456670515673, "percentage": 87.56, "elapsed_time": "11:46:14", "remaining_time": "1:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3887, "total_steps": 4438, "loss": 0.1346, "learning_rate": 2.07779216707307e-07, "epoch": 0.8757709747373758, "percentage": 87.58, "elapsed_time": "11:46:25", "remaining_time": "1:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3888, "total_steps": 4438, "loss": 0.1242, "learning_rate": 2.0703628852309336e-07, "epoch": 0.8759962824231842, "percentage": 87.61, "elapsed_time": "11:46:37", "remaining_time": "1:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3889, "total_steps": 4438, "loss": 0.1241, "learning_rate": 2.0629463353616013e-07, "epoch": 0.8762215901089926, "percentage": 87.63, "elapsed_time": "11:46:49", "remaining_time": "1:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 4438, "loss": 0.1191, "learning_rate": 2.0555425215832176e-07, "epoch": 0.876446897794801, "percentage": 87.65, "elapsed_time": "11:47:00", "remaining_time": "1:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3891, "total_steps": 4438, "loss": 0.136, "learning_rate": 2.048151448006841e-07, "epoch": 0.8766722054806094, "percentage": 87.67, "elapsed_time": "11:47:12", "remaining_time": "1:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3892, "total_steps": 4438, "loss": 0.1287, "learning_rate": 2.0407731187364556e-07, "epoch": 0.8768975131664178, "percentage": 87.7, "elapsed_time": "11:47:23", "remaining_time": "1:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3893, "total_steps": 4438, "loss": 0.136, "learning_rate": 2.0334075378689781e-07, "epoch": 0.8771228208522264, "percentage": 87.72, "elapsed_time": "11:47:34", "remaining_time": "1:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3894, "total_steps": 4438, "loss": 0.1309, "learning_rate": 2.026054709494235e-07, "epoch": 0.8773481285380348, "percentage": 87.74, "elapsed_time": "11:47:45", "remaining_time": "1:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3895, "total_steps": 4438, "loss": 0.1213, "learning_rate": 2.0187146376949852e-07, "epoch": 0.8775734362238432, "percentage": 87.76, "elapsed_time": "11:47:55", "remaining_time": "1:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3896, "total_steps": 4438, "loss": 0.1302, "learning_rate": 2.0113873265468875e-07, "epoch": 0.8777987439096516, "percentage": 87.79, "elapsed_time": "11:48:05", "remaining_time": "1:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3897, "total_steps": 4438, "loss": 0.1263, "learning_rate": 2.0040727801185323e-07, "epoch": 0.87802405159546, "percentage": 87.81, "elapsed_time": "11:48:15", "remaining_time": "1:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3898, "total_steps": 4438, "loss": 0.1152, "learning_rate": 1.996771002471415e-07, "epoch": 0.8782493592812685, "percentage": 87.83, "elapsed_time": "11:48:26", "remaining_time": "1:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3899, "total_steps": 4438, "loss": 0.1247, "learning_rate": 1.9894819976599338e-07, "epoch": 0.8784746669670769, "percentage": 87.85, "elapsed_time": "11:48:37", "remaining_time": "1:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 4438, "loss": 0.1145, "learning_rate": 1.9822057697314102e-07, "epoch": 0.8786999746528853, "percentage": 87.88, "elapsed_time": "11:48:49", "remaining_time": "1:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3901, "total_steps": 4438, "loss": 0.1134, "learning_rate": 1.9749423227260533e-07, "epoch": 0.8789252823386938, "percentage": 87.9, "elapsed_time": "11:48:59", "remaining_time": "1:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3902, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.9676916606769874e-07, "epoch": 0.8791505900245022, "percentage": 87.92, "elapsed_time": "11:49:09", "remaining_time": "1:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3903, "total_steps": 4438, "loss": 0.1256, "learning_rate": 1.9604537876102448e-07, "epoch": 0.8793758977103107, "percentage": 87.95, "elapsed_time": "11:49:20", "remaining_time": "1:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3904, "total_steps": 4438, "loss": 0.1188, "learning_rate": 1.9532287075447325e-07, "epoch": 0.8796012053961191, "percentage": 87.97, "elapsed_time": "11:49:31", "remaining_time": "1:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3905, "total_steps": 4438, "loss": 0.1263, "learning_rate": 1.9460164244922698e-07, "epoch": 0.8798265130819275, "percentage": 87.99, "elapsed_time": "11:49:43", "remaining_time": "1:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3906, "total_steps": 4438, "loss": 0.1248, "learning_rate": 1.9388169424575802e-07, "epoch": 0.8800518207677359, "percentage": 88.01, "elapsed_time": "11:49:54", "remaining_time": "1:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3907, "total_steps": 4438, "loss": 0.1163, "learning_rate": 1.9316302654382528e-07, "epoch": 0.8802771284535443, "percentage": 88.04, "elapsed_time": "11:50:04", "remaining_time": "1:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3908, "total_steps": 4438, "loss": 0.1301, "learning_rate": 1.9244563974247953e-07, "epoch": 0.8805024361393528, "percentage": 88.06, "elapsed_time": "11:50:14", "remaining_time": "1:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3909, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.917295342400577e-07, "epoch": 0.8807277438251613, "percentage": 88.08, "elapsed_time": "11:50:25", "remaining_time": "1:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 4438, "loss": 0.1139, "learning_rate": 1.910147104341875e-07, "epoch": 0.8809530515109697, "percentage": 88.1, "elapsed_time": "11:50:37", "remaining_time": "1:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3911, "total_steps": 4438, "loss": 0.1354, "learning_rate": 1.9030116872178317e-07, "epoch": 0.8811783591967781, "percentage": 88.13, "elapsed_time": "11:50:47", "remaining_time": "1:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3912, "total_steps": 4438, "loss": 0.139, "learning_rate": 1.8958890949904802e-07, "epoch": 0.8814036668825865, "percentage": 88.15, "elapsed_time": "11:50:57", "remaining_time": "1:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3913, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.8887793316147373e-07, "epoch": 0.881628974568395, "percentage": 88.17, "elapsed_time": "11:51:10", "remaining_time": "1:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3914, "total_steps": 4438, "loss": 0.1187, "learning_rate": 1.881682401038379e-07, "epoch": 0.8818542822542034, "percentage": 88.19, "elapsed_time": "11:51:21", "remaining_time": "1:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3915, "total_steps": 4438, "loss": 0.1129, "learning_rate": 1.8745983072020774e-07, "epoch": 0.8820795899400118, "percentage": 88.22, "elapsed_time": "11:51:31", "remaining_time": "1:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3916, "total_steps": 4438, "loss": 0.1305, "learning_rate": 1.8675270540393532e-07, "epoch": 0.8823048976258202, "percentage": 88.24, "elapsed_time": "11:51:42", "remaining_time": "1:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3917, "total_steps": 4438, "loss": 0.132, "learning_rate": 1.8604686454766208e-07, "epoch": 0.8825302053116287, "percentage": 88.26, "elapsed_time": "11:51:53", "remaining_time": "1:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3918, "total_steps": 4438, "loss": 0.1323, "learning_rate": 1.8534230854331454e-07, "epoch": 0.8827555129974372, "percentage": 88.28, "elapsed_time": "11:52:03", "remaining_time": "1:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3919, "total_steps": 4438, "loss": 0.1328, "learning_rate": 1.8463903778210612e-07, "epoch": 0.8829808206832456, "percentage": 88.31, "elapsed_time": "11:52:15", "remaining_time": "1:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.8393705265453838e-07, "epoch": 0.883206128369054, "percentage": 88.33, "elapsed_time": "11:52:24", "remaining_time": "1:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3921, "total_steps": 4438, "loss": 0.127, "learning_rate": 1.832363535503956e-07, "epoch": 0.8834314360548624, "percentage": 88.35, "elapsed_time": "11:52:35", "remaining_time": "1:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3922, "total_steps": 4438, "loss": 0.1158, "learning_rate": 1.8253694085875047e-07, "epoch": 0.8836567437406708, "percentage": 88.37, "elapsed_time": "11:52:46", "remaining_time": "1:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3923, "total_steps": 4438, "loss": 0.1312, "learning_rate": 1.8183881496796146e-07, "epoch": 0.8838820514264792, "percentage": 88.4, "elapsed_time": "11:52:56", "remaining_time": "1:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3924, "total_steps": 4438, "loss": 0.1374, "learning_rate": 1.8114197626567105e-07, "epoch": 0.8841073591122878, "percentage": 88.42, "elapsed_time": "11:53:06", "remaining_time": "1:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3925, "total_steps": 4438, "loss": 0.142, "learning_rate": 1.8044642513880827e-07, "epoch": 0.8843326667980962, "percentage": 88.44, "elapsed_time": "11:53:16", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3926, "total_steps": 4438, "loss": 0.1296, "learning_rate": 1.7975216197358648e-07, "epoch": 0.8845579744839046, "percentage": 88.46, "elapsed_time": "11:53:26", "remaining_time": "1:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3927, "total_steps": 4438, "loss": 0.1281, "learning_rate": 1.790591871555039e-07, "epoch": 0.884783282169713, "percentage": 88.49, "elapsed_time": "11:53:37", "remaining_time": "1:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3928, "total_steps": 4438, "loss": 0.118, "learning_rate": 1.7836750106934475e-07, "epoch": 0.8850085898555214, "percentage": 88.51, "elapsed_time": "11:53:48", "remaining_time": "1:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3929, "total_steps": 4438, "loss": 0.1224, "learning_rate": 1.776771040991751e-07, "epoch": 0.8852338975413299, "percentage": 88.53, "elapsed_time": "11:54:00", "remaining_time": "1:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 4438, "loss": 0.1281, "learning_rate": 1.7698799662834776e-07, "epoch": 0.8854592052271383, "percentage": 88.55, "elapsed_time": "11:54:10", "remaining_time": "1:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3931, "total_steps": 4438, "loss": 0.1258, "learning_rate": 1.7630017903949775e-07, "epoch": 0.8856845129129467, "percentage": 88.58, "elapsed_time": "11:54:21", "remaining_time": "1:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3932, "total_steps": 4438, "loss": 0.1345, "learning_rate": 1.7561365171454488e-07, "epoch": 0.8859098205987552, "percentage": 88.6, "elapsed_time": "11:54:32", "remaining_time": "1:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3933, "total_steps": 4438, "loss": 0.1251, "learning_rate": 1.7492841503469165e-07, "epoch": 0.8861351282845636, "percentage": 88.62, "elapsed_time": "11:54:43", "remaining_time": "1:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3934, "total_steps": 4438, "loss": 0.1253, "learning_rate": 1.7424446938042517e-07, "epoch": 0.8863604359703721, "percentage": 88.64, "elapsed_time": "11:54:53", "remaining_time": "1:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3935, "total_steps": 4438, "loss": 0.1184, "learning_rate": 1.7356181513151464e-07, "epoch": 0.8865857436561805, "percentage": 88.67, "elapsed_time": "11:55:03", "remaining_time": "1:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3936, "total_steps": 4438, "loss": 0.1109, "learning_rate": 1.7288045266701247e-07, "epoch": 0.8868110513419889, "percentage": 88.69, "elapsed_time": "11:55:15", "remaining_time": "1:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3937, "total_steps": 4438, "loss": 0.1252, "learning_rate": 1.7220038236525406e-07, "epoch": 0.8870363590277973, "percentage": 88.71, "elapsed_time": "11:55:26", "remaining_time": "1:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3938, "total_steps": 4438, "loss": 0.1195, "learning_rate": 1.7152160460385703e-07, "epoch": 0.8872616667136057, "percentage": 88.73, "elapsed_time": "11:55:35", "remaining_time": "1:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3939, "total_steps": 4438, "loss": 0.1338, "learning_rate": 1.7084411975972076e-07, "epoch": 0.8874869743994142, "percentage": 88.76, "elapsed_time": "11:55:46", "remaining_time": "1:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 4438, "loss": 0.1314, "learning_rate": 1.701679282090285e-07, "epoch": 0.8877122820852227, "percentage": 88.78, "elapsed_time": "11:55:57", "remaining_time": "1:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3941, "total_steps": 4438, "loss": 0.1192, "learning_rate": 1.6949303032724297e-07, "epoch": 0.8879375897710311, "percentage": 88.8, "elapsed_time": "11:56:08", "remaining_time": "1:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3942, "total_steps": 4438, "loss": 0.118, "learning_rate": 1.6881942648911077e-07, "epoch": 0.8881628974568395, "percentage": 88.82, "elapsed_time": "11:56:19", "remaining_time": "1:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3943, "total_steps": 4438, "loss": 0.134, "learning_rate": 1.6814711706865827e-07, "epoch": 0.8883882051426479, "percentage": 88.85, "elapsed_time": "11:56:30", "remaining_time": "1:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3944, "total_steps": 4438, "loss": 0.1218, "learning_rate": 1.6747610243919437e-07, "epoch": 0.8886135128284564, "percentage": 88.87, "elapsed_time": "11:56:41", "remaining_time": "1:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3945, "total_steps": 4438, "loss": 0.1296, "learning_rate": 1.6680638297330854e-07, "epoch": 0.8888388205142648, "percentage": 88.89, "elapsed_time": "11:56:51", "remaining_time": "1:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3946, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.661379590428705e-07, "epoch": 0.8890641282000732, "percentage": 88.91, "elapsed_time": "11:57:03", "remaining_time": "1:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3947, "total_steps": 4438, "loss": 0.1252, "learning_rate": 1.6547083101903173e-07, "epoch": 0.8892894358858816, "percentage": 88.94, "elapsed_time": "11:57:14", "remaining_time": "1:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3948, "total_steps": 4438, "loss": 0.1349, "learning_rate": 1.6480499927222283e-07, "epoch": 0.8895147435716901, "percentage": 88.96, "elapsed_time": "11:57:26", "remaining_time": "1:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3949, "total_steps": 4438, "loss": 0.1156, "learning_rate": 1.641404641721561e-07, "epoch": 0.8897400512574986, "percentage": 88.98, "elapsed_time": "11:57:38", "remaining_time": "1:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 4438, "loss": 0.131, "learning_rate": 1.6347722608782284e-07, "epoch": 0.889965358943307, "percentage": 89.0, "elapsed_time": "11:57:49", "remaining_time": "1:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3951, "total_steps": 4438, "loss": 0.1168, "learning_rate": 1.6281528538749425e-07, "epoch": 0.8901906666291154, "percentage": 89.03, "elapsed_time": "11:58:00", "remaining_time": "1:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3952, "total_steps": 4438, "loss": 0.1203, "learning_rate": 1.6215464243872186e-07, "epoch": 0.8904159743149238, "percentage": 89.05, "elapsed_time": "11:58:12", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3953, "total_steps": 4438, "loss": 0.1321, "learning_rate": 1.6149529760833504e-07, "epoch": 0.8906412820007322, "percentage": 89.07, "elapsed_time": "11:58:23", "remaining_time": "1:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3954, "total_steps": 4438, "loss": 0.1125, "learning_rate": 1.608372512624448e-07, "epoch": 0.8908665896865406, "percentage": 89.09, "elapsed_time": "11:58:34", "remaining_time": "1:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3955, "total_steps": 4438, "loss": 0.1146, "learning_rate": 1.6018050376643863e-07, "epoch": 0.8910918973723491, "percentage": 89.12, "elapsed_time": "11:58:47", "remaining_time": "1:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3956, "total_steps": 4438, "loss": 0.1275, "learning_rate": 1.595250554849842e-07, "epoch": 0.8913172050581576, "percentage": 89.14, "elapsed_time": "11:58:57", "remaining_time": "1:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3957, "total_steps": 4438, "loss": 0.1216, "learning_rate": 1.5887090678202793e-07, "epoch": 0.891542512743966, "percentage": 89.16, "elapsed_time": "11:59:09", "remaining_time": "1:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3958, "total_steps": 4438, "loss": 0.1203, "learning_rate": 1.5821805802079343e-07, "epoch": 0.8917678204297744, "percentage": 89.18, "elapsed_time": "11:59:20", "remaining_time": "1:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3959, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.5756650956378377e-07, "epoch": 0.8919931281155828, "percentage": 89.21, "elapsed_time": "11:59:31", "remaining_time": "1:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 4438, "loss": 0.1279, "learning_rate": 1.5691626177277986e-07, "epoch": 0.8922184358013913, "percentage": 89.23, "elapsed_time": "11:59:43", "remaining_time": "1:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3961, "total_steps": 4438, "loss": 0.1231, "learning_rate": 1.5626731500883951e-07, "epoch": 0.8924437434871997, "percentage": 89.25, "elapsed_time": "11:59:54", "remaining_time": "1:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3962, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.5561966963229925e-07, "epoch": 0.8926690511730081, "percentage": 89.27, "elapsed_time": "12:00:04", "remaining_time": "1:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3963, "total_steps": 4438, "loss": 0.1252, "learning_rate": 1.5497332600277137e-07, "epoch": 0.8928943588588165, "percentage": 89.3, "elapsed_time": "12:00:15", "remaining_time": "1:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3964, "total_steps": 4438, "loss": 0.1265, "learning_rate": 1.5432828447914743e-07, "epoch": 0.893119666544625, "percentage": 89.32, "elapsed_time": "12:00:25", "remaining_time": "1:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3965, "total_steps": 4438, "loss": 0.1183, "learning_rate": 1.5368454541959453e-07, "epoch": 0.8933449742304335, "percentage": 89.34, "elapsed_time": "12:00:35", "remaining_time": "1:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3966, "total_steps": 4438, "loss": 0.1351, "learning_rate": 1.5304210918155677e-07, "epoch": 0.8935702819162419, "percentage": 89.36, "elapsed_time": "12:00:47", "remaining_time": "1:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3967, "total_steps": 4438, "loss": 0.1219, "learning_rate": 1.524009761217557e-07, "epoch": 0.8937955896020503, "percentage": 89.39, "elapsed_time": "12:00:57", "remaining_time": "1:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3968, "total_steps": 4438, "loss": 0.1222, "learning_rate": 1.5176114659618796e-07, "epoch": 0.8940208972878587, "percentage": 89.41, "elapsed_time": "12:01:09", "remaining_time": "1:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3969, "total_steps": 4438, "loss": 0.1237, "learning_rate": 1.5112262096012743e-07, "epoch": 0.8942462049736671, "percentage": 89.43, "elapsed_time": "12:01:18", "remaining_time": "1:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 4438, "loss": 0.1207, "learning_rate": 1.5048539956812324e-07, "epoch": 0.8944715126594756, "percentage": 89.45, "elapsed_time": "12:01:29", "remaining_time": "1:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3971, "total_steps": 4438, "loss": 0.1313, "learning_rate": 1.4984948277400074e-07, "epoch": 0.8946968203452841, "percentage": 89.48, "elapsed_time": "12:01:40", "remaining_time": "1:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3972, "total_steps": 4438, "loss": 0.1322, "learning_rate": 1.4921487093086134e-07, "epoch": 0.8949221280310925, "percentage": 89.5, "elapsed_time": "12:01:52", "remaining_time": "1:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3973, "total_steps": 4438, "loss": 0.1141, "learning_rate": 1.4858156439108097e-07, "epoch": 0.8951474357169009, "percentage": 89.52, "elapsed_time": "12:02:02", "remaining_time": "1:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3974, "total_steps": 4438, "loss": 0.1358, "learning_rate": 1.4794956350631106e-07, "epoch": 0.8953727434027093, "percentage": 89.54, "elapsed_time": "12:02:12", "remaining_time": "1:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3975, "total_steps": 4438, "loss": 0.1262, "learning_rate": 1.473188686274782e-07, "epoch": 0.8955980510885178, "percentage": 89.57, "elapsed_time": "12:02:22", "remaining_time": "1:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3976, "total_steps": 4438, "loss": 0.1305, "learning_rate": 1.4668948010478358e-07, "epoch": 0.8958233587743262, "percentage": 89.59, "elapsed_time": "12:02:33", "remaining_time": "1:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3977, "total_steps": 4438, "loss": 0.1291, "learning_rate": 1.4606139828770378e-07, "epoch": 0.8960486664601346, "percentage": 89.61, "elapsed_time": "12:02:43", "remaining_time": "1:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3978, "total_steps": 4438, "loss": 0.1213, "learning_rate": 1.4543462352498844e-07, "epoch": 0.896273974145943, "percentage": 89.63, "elapsed_time": "12:02:53", "remaining_time": "1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3979, "total_steps": 4438, "loss": 0.1254, "learning_rate": 1.448091561646628e-07, "epoch": 0.8964992818317515, "percentage": 89.66, "elapsed_time": "12:03:05", "remaining_time": "1:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 4438, "loss": 0.1193, "learning_rate": 1.4418499655402512e-07, "epoch": 0.89672458951756, "percentage": 89.68, "elapsed_time": "12:03:15", "remaining_time": "1:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3981, "total_steps": 4438, "loss": 0.1258, "learning_rate": 1.435621450396485e-07, "epoch": 0.8969498972033684, "percentage": 89.7, "elapsed_time": "12:03:26", "remaining_time": "1:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3982, "total_steps": 4438, "loss": 0.1223, "learning_rate": 1.4294060196737874e-07, "epoch": 0.8971752048891768, "percentage": 89.73, "elapsed_time": "12:03:35", "remaining_time": "1:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3983, "total_steps": 4438, "loss": 0.1309, "learning_rate": 1.4232036768233565e-07, "epoch": 0.8974005125749852, "percentage": 89.75, "elapsed_time": "12:03:45", "remaining_time": "1:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3984, "total_steps": 4438, "loss": 0.1215, "learning_rate": 1.417014425289126e-07, "epoch": 0.8976258202607936, "percentage": 89.77, "elapsed_time": "12:03:55", "remaining_time": "1:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3985, "total_steps": 4438, "loss": 0.1234, "learning_rate": 1.4108382685077498e-07, "epoch": 0.897851127946602, "percentage": 89.79, "elapsed_time": "12:04:05", "remaining_time": "1:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3986, "total_steps": 4438, "loss": 0.1282, "learning_rate": 1.4046752099086236e-07, "epoch": 0.8980764356324105, "percentage": 89.82, "elapsed_time": "12:04:17", "remaining_time": "1:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3987, "total_steps": 4438, "loss": 0.1288, "learning_rate": 1.398525252913857e-07, "epoch": 0.898301743318219, "percentage": 89.84, "elapsed_time": "12:04:28", "remaining_time": "1:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3988, "total_steps": 4438, "loss": 0.1231, "learning_rate": 1.3923884009382994e-07, "epoch": 0.8985270510040274, "percentage": 89.86, "elapsed_time": "12:04:38", "remaining_time": "1:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3989, "total_steps": 4438, "loss": 0.1335, "learning_rate": 1.3862646573895134e-07, "epoch": 0.8987523586898358, "percentage": 89.88, "elapsed_time": "12:04:47", "remaining_time": "1:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 4438, "loss": 0.1234, "learning_rate": 1.380154025667782e-07, "epoch": 0.8989776663756442, "percentage": 89.91, "elapsed_time": "12:04:58", "remaining_time": "1:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3991, "total_steps": 4438, "loss": 0.1289, "learning_rate": 1.374056509166119e-07, "epoch": 0.8992029740614527, "percentage": 89.93, "elapsed_time": "12:05:08", "remaining_time": "1:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3992, "total_steps": 4438, "loss": 0.1137, "learning_rate": 1.367972111270241e-07, "epoch": 0.8994282817472611, "percentage": 89.95, "elapsed_time": "12:05:19", "remaining_time": "1:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3993, "total_steps": 4438, "loss": 0.1272, "learning_rate": 1.3619008353585873e-07, "epoch": 0.8996535894330695, "percentage": 89.97, "elapsed_time": "12:05:30", "remaining_time": "1:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3994, "total_steps": 4438, "loss": 0.1289, "learning_rate": 1.3558426848023165e-07, "epoch": 0.8998788971188779, "percentage": 90.0, "elapsed_time": "12:05:42", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3995, "total_steps": 4438, "loss": 0.1205, "learning_rate": 1.3497976629652882e-07, "epoch": 0.9001042048046864, "percentage": 90.02, "elapsed_time": "12:05:52", "remaining_time": "1:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3996, "total_steps": 4438, "loss": 0.1227, "learning_rate": 1.3437657732040783e-07, "epoch": 0.9003295124904949, "percentage": 90.04, "elapsed_time": "12:06:02", "remaining_time": "1:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3997, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.337747018867977e-07, "epoch": 0.9005548201763033, "percentage": 90.06, "elapsed_time": "12:06:14", "remaining_time": "1:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3998, "total_steps": 4438, "loss": 0.125, "learning_rate": 1.3317414032989668e-07, "epoch": 0.9007801278621117, "percentage": 90.09, "elapsed_time": "12:06:24", "remaining_time": "1:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3999, "total_steps": 4438, "loss": 0.1234, "learning_rate": 1.3257489298317466e-07, "epoch": 0.9010054355479201, "percentage": 90.11, "elapsed_time": "12:06:36", "remaining_time": "1:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 4438, "loss": 0.1128, "learning_rate": 1.3197696017937106e-07, "epoch": 0.9012307432337285, "percentage": 90.13, "elapsed_time": "12:06:46", "remaining_time": "1:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 4438, "eval_loss": 0.12675930559635162, "epoch": 0.9012307432337285, "percentage": 90.13, "elapsed_time": "12:08:49", "remaining_time": "1:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4001, "total_steps": 4438, "loss": 0.1213, "learning_rate": 1.3138034225049583e-07, "epoch": 0.901456050919537, "percentage": 90.15, "elapsed_time": "12:08:59", "remaining_time": "1:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4002, "total_steps": 4438, "loss": 0.1317, "learning_rate": 1.3078503952782845e-07, "epoch": 0.9016813586053454, "percentage": 90.18, "elapsed_time": "12:09:11", "remaining_time": "1:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4003, "total_steps": 4438, "loss": 0.1301, "learning_rate": 1.3019105234191865e-07, "epoch": 0.9019066662911539, "percentage": 90.2, "elapsed_time": "12:09:21", "remaining_time": "1:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4004, "total_steps": 4438, "loss": 0.1258, "learning_rate": 1.2959838102258537e-07, "epoch": 0.9021319739769623, "percentage": 90.22, "elapsed_time": "12:09:32", "remaining_time": "1:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4005, "total_steps": 4438, "loss": 0.1258, "learning_rate": 1.2900702589891652e-07, "epoch": 0.9023572816627707, "percentage": 90.24, "elapsed_time": "12:09:42", "remaining_time": "1:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4006, "total_steps": 4438, "loss": 0.1343, "learning_rate": 1.2841698729927022e-07, "epoch": 0.9025825893485792, "percentage": 90.27, "elapsed_time": "12:09:52", "remaining_time": "1:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4007, "total_steps": 4438, "loss": 0.1263, "learning_rate": 1.278282655512722e-07, "epoch": 0.9028078970343876, "percentage": 90.29, "elapsed_time": "12:10:02", "remaining_time": "1:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4008, "total_steps": 4438, "loss": 0.1213, "learning_rate": 1.272408609818182e-07, "epoch": 0.903033204720196, "percentage": 90.31, "elapsed_time": "12:10:13", "remaining_time": "1:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4009, "total_steps": 4438, "loss": 0.112, "learning_rate": 1.2665477391707203e-07, "epoch": 0.9032585124060044, "percentage": 90.33, "elapsed_time": "12:10:23", "remaining_time": "1:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 4438, "loss": 0.1207, "learning_rate": 1.2607000468246533e-07, "epoch": 0.9034838200918128, "percentage": 90.36, "elapsed_time": "12:10:34", "remaining_time": "1:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4011, "total_steps": 4438, "loss": 0.127, "learning_rate": 1.2548655360269974e-07, "epoch": 0.9037091277776214, "percentage": 90.38, "elapsed_time": "12:10:45", "remaining_time": "1:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4012, "total_steps": 4438, "loss": 0.1273, "learning_rate": 1.2490442100174278e-07, "epoch": 0.9039344354634298, "percentage": 90.4, "elapsed_time": "12:10:56", "remaining_time": "1:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4013, "total_steps": 4438, "loss": 0.125, "learning_rate": 1.243236072028317e-07, "epoch": 0.9041597431492382, "percentage": 90.42, "elapsed_time": "12:11:08", "remaining_time": "1:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4014, "total_steps": 4438, "loss": 0.123, "learning_rate": 1.237441125284708e-07, "epoch": 0.9043850508350466, "percentage": 90.45, "elapsed_time": "12:11:19", "remaining_time": "1:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4015, "total_steps": 4438, "loss": 0.1291, "learning_rate": 1.2316593730043154e-07, "epoch": 0.904610358520855, "percentage": 90.47, "elapsed_time": "12:11:31", "remaining_time": "1:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4016, "total_steps": 4438, "loss": 0.1204, "learning_rate": 1.2258908183975322e-07, "epoch": 0.9048356662066634, "percentage": 90.49, "elapsed_time": "12:11:43", "remaining_time": "1:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4017, "total_steps": 4438, "loss": 0.1211, "learning_rate": 1.2201354646674212e-07, "epoch": 0.9050609738924719, "percentage": 90.51, "elapsed_time": "12:11:54", "remaining_time": "1:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4018, "total_steps": 4438, "loss": 0.1305, "learning_rate": 1.2143933150097154e-07, "epoch": 0.9052862815782804, "percentage": 90.54, "elapsed_time": "12:12:06", "remaining_time": "1:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4019, "total_steps": 4438, "loss": 0.1198, "learning_rate": 1.2086643726128194e-07, "epoch": 0.9055115892640888, "percentage": 90.56, "elapsed_time": "12:12:15", "remaining_time": "1:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 4438, "loss": 0.122, "learning_rate": 1.2029486406577972e-07, "epoch": 0.9057368969498972, "percentage": 90.58, "elapsed_time": "12:12:27", "remaining_time": "1:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4021, "total_steps": 4438, "loss": 0.1217, "learning_rate": 1.1972461223183878e-07, "epoch": 0.9059622046357056, "percentage": 90.6, "elapsed_time": "12:12:36", "remaining_time": "1:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4022, "total_steps": 4438, "loss": 0.132, "learning_rate": 1.191556820760978e-07, "epoch": 0.9061875123215141, "percentage": 90.63, "elapsed_time": "12:12:46", "remaining_time": "1:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4023, "total_steps": 4438, "loss": 0.1229, "learning_rate": 1.1858807391446319e-07, "epoch": 0.9064128200073225, "percentage": 90.65, "elapsed_time": "12:12:56", "remaining_time": "1:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4024, "total_steps": 4438, "loss": 0.1301, "learning_rate": 1.1802178806210624e-07, "epoch": 0.9066381276931309, "percentage": 90.67, "elapsed_time": "12:13:07", "remaining_time": "1:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4025, "total_steps": 4438, "loss": 0.13, "learning_rate": 1.1745682483346454e-07, "epoch": 0.9068634353789393, "percentage": 90.69, "elapsed_time": "12:13:19", "remaining_time": "1:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4026, "total_steps": 4438, "loss": 0.1144, "learning_rate": 1.1689318454224191e-07, "epoch": 0.9070887430647478, "percentage": 90.72, "elapsed_time": "12:13:29", "remaining_time": "1:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4027, "total_steps": 4438, "loss": 0.1086, "learning_rate": 1.1633086750140521e-07, "epoch": 0.9073140507505563, "percentage": 90.74, "elapsed_time": "12:13:40", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4028, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.1576987402318884e-07, "epoch": 0.9075393584363647, "percentage": 90.76, "elapsed_time": "12:13:50", "remaining_time": "1:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4029, "total_steps": 4438, "loss": 0.1184, "learning_rate": 1.1521020441909226e-07, "epoch": 0.9077646661221731, "percentage": 90.78, "elapsed_time": "12:14:02", "remaining_time": "1:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 4438, "loss": 0.1304, "learning_rate": 1.1465185899987797e-07, "epoch": 0.9079899738079815, "percentage": 90.81, "elapsed_time": "12:14:13", "remaining_time": "1:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4031, "total_steps": 4438, "loss": 0.1308, "learning_rate": 1.140948380755752e-07, "epoch": 0.9082152814937899, "percentage": 90.83, "elapsed_time": "12:14:24", "remaining_time": "1:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4032, "total_steps": 4438, "loss": 0.1275, "learning_rate": 1.1353914195547655e-07, "epoch": 0.9084405891795984, "percentage": 90.85, "elapsed_time": "12:14:34", "remaining_time": "1:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4033, "total_steps": 4438, "loss": 0.1149, "learning_rate": 1.1298477094813965e-07, "epoch": 0.9086658968654068, "percentage": 90.87, "elapsed_time": "12:14:44", "remaining_time": "1:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4034, "total_steps": 4438, "loss": 0.1355, "learning_rate": 1.1243172536138547e-07, "epoch": 0.9088912045512153, "percentage": 90.9, "elapsed_time": "12:14:56", "remaining_time": "1:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4035, "total_steps": 4438, "loss": 0.1257, "learning_rate": 1.1188000550230005e-07, "epoch": 0.9091165122370237, "percentage": 90.92, "elapsed_time": "12:15:07", "remaining_time": "1:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4036, "total_steps": 4438, "loss": 0.1347, "learning_rate": 1.1132961167723305e-07, "epoch": 0.9093418199228321, "percentage": 90.94, "elapsed_time": "12:15:17", "remaining_time": "1:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4037, "total_steps": 4438, "loss": 0.1314, "learning_rate": 1.1078054419179724e-07, "epoch": 0.9095671276086406, "percentage": 90.96, "elapsed_time": "12:15:28", "remaining_time": "1:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4038, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.1023280335086956e-07, "epoch": 0.909792435294449, "percentage": 90.99, "elapsed_time": "12:15:39", "remaining_time": "1:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4039, "total_steps": 4438, "loss": 0.1274, "learning_rate": 1.0968638945858978e-07, "epoch": 0.9100177429802574, "percentage": 91.01, "elapsed_time": "12:15:50", "remaining_time": "1:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 4438, "loss": 0.1395, "learning_rate": 1.091413028183616e-07, "epoch": 0.9102430506660658, "percentage": 91.03, "elapsed_time": "12:16:01", "remaining_time": "1:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4041, "total_steps": 4438, "loss": 0.1361, "learning_rate": 1.0859754373285125e-07, "epoch": 0.9104683583518742, "percentage": 91.05, "elapsed_time": "12:16:11", "remaining_time": "1:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4042, "total_steps": 4438, "loss": 0.121, "learning_rate": 1.0805511250398748e-07, "epoch": 0.9106936660376828, "percentage": 91.08, "elapsed_time": "12:16:22", "remaining_time": "1:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4043, "total_steps": 4438, "loss": 0.1241, "learning_rate": 1.0751400943296269e-07, "epoch": 0.9109189737234912, "percentage": 91.1, "elapsed_time": "12:16:31", "remaining_time": "1:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4044, "total_steps": 4438, "loss": 0.1142, "learning_rate": 1.06974234820231e-07, "epoch": 0.9111442814092996, "percentage": 91.12, "elapsed_time": "12:16:43", "remaining_time": "1:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4045, "total_steps": 4438, "loss": 0.1231, "learning_rate": 1.0643578896550877e-07, "epoch": 0.911369589095108, "percentage": 91.14, "elapsed_time": "12:16:53", "remaining_time": "1:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4046, "total_steps": 4438, "loss": 0.1319, "learning_rate": 1.0589867216777544e-07, "epoch": 0.9115948967809164, "percentage": 91.17, "elapsed_time": "12:17:04", "remaining_time": "1:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4047, "total_steps": 4438, "loss": 0.1218, "learning_rate": 1.0536288472527162e-07, "epoch": 0.9118202044667248, "percentage": 91.19, "elapsed_time": "12:17:13", "remaining_time": "1:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4048, "total_steps": 4438, "loss": 0.1222, "learning_rate": 1.0482842693550044e-07, "epoch": 0.9120455121525333, "percentage": 91.21, "elapsed_time": "12:17:24", "remaining_time": "1:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4049, "total_steps": 4438, "loss": 0.1203, "learning_rate": 1.042952990952259e-07, "epoch": 0.9122708198383417, "percentage": 91.23, "elapsed_time": "12:17:35", "remaining_time": "1:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.0376350150047427e-07, "epoch": 0.9124961275241502, "percentage": 91.26, "elapsed_time": "12:17:46", "remaining_time": "1:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4051, "total_steps": 4438, "loss": 0.1167, "learning_rate": 1.032330344465332e-07, "epoch": 0.9127214352099586, "percentage": 91.28, "elapsed_time": "12:17:56", "remaining_time": "1:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4052, "total_steps": 4438, "loss": 0.12, "learning_rate": 1.0270389822795073e-07, "epoch": 0.912946742895767, "percentage": 91.3, "elapsed_time": "12:18:07", "remaining_time": "1:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4053, "total_steps": 4438, "loss": 0.1233, "learning_rate": 1.0217609313853738e-07, "epoch": 0.9131720505815755, "percentage": 91.32, "elapsed_time": "12:18:17", "remaining_time": "1:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4054, "total_steps": 4438, "loss": 0.1281, "learning_rate": 1.0164961947136232e-07, "epoch": 0.9133973582673839, "percentage": 91.35, "elapsed_time": "12:18:28", "remaining_time": "1:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4055, "total_steps": 4438, "loss": 0.127, "learning_rate": 1.0112447751875809e-07, "epoch": 0.9136226659531923, "percentage": 91.37, "elapsed_time": "12:18:38", "remaining_time": "1:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4056, "total_steps": 4438, "loss": 0.1211, "learning_rate": 1.0060066757231535e-07, "epoch": 0.9138479736390007, "percentage": 91.39, "elapsed_time": "12:18:50", "remaining_time": "1:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4057, "total_steps": 4438, "loss": 0.1122, "learning_rate": 1.0007818992288671e-07, "epoch": 0.9140732813248091, "percentage": 91.42, "elapsed_time": "12:19:01", "remaining_time": "1:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4058, "total_steps": 4438, "loss": 0.1242, "learning_rate": 9.955704486058482e-08, "epoch": 0.9142985890106177, "percentage": 91.44, "elapsed_time": "12:19:10", "remaining_time": "1:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4059, "total_steps": 4438, "loss": 0.1142, "learning_rate": 9.903723267478154e-08, "epoch": 0.9145238966964261, "percentage": 91.46, "elapsed_time": "12:19:21", "remaining_time": "1:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 4438, "loss": 0.1148, "learning_rate": 9.85187536541099e-08, "epoch": 0.9147492043822345, "percentage": 91.48, "elapsed_time": "12:19:31", "remaining_time": "1:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4061, "total_steps": 4438, "loss": 0.1231, "learning_rate": 9.800160808646154e-08, "epoch": 0.9149745120680429, "percentage": 91.51, "elapsed_time": "12:19:43", "remaining_time": "1:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4062, "total_steps": 4438, "loss": 0.1196, "learning_rate": 9.748579625898758e-08, "epoch": 0.9151998197538513, "percentage": 91.53, "elapsed_time": "12:19:54", "remaining_time": "1:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4063, "total_steps": 4438, "loss": 0.1306, "learning_rate": 9.697131845810032e-08, "epoch": 0.9154251274396598, "percentage": 91.55, "elapsed_time": "12:20:05", "remaining_time": "1:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4064, "total_steps": 4438, "loss": 0.1228, "learning_rate": 9.645817496946902e-08, "epoch": 0.9156504351254682, "percentage": 91.57, "elapsed_time": "12:20:16", "remaining_time": "1:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4065, "total_steps": 4438, "loss": 0.1352, "learning_rate": 9.594636607802355e-08, "epoch": 0.9158757428112767, "percentage": 91.6, "elapsed_time": "12:20:28", "remaining_time": "1:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4066, "total_steps": 4438, "loss": 0.1287, "learning_rate": 9.54358920679524e-08, "epoch": 0.9161010504970851, "percentage": 91.62, "elapsed_time": "12:20:40", "remaining_time": "1:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4067, "total_steps": 4438, "loss": 0.1171, "learning_rate": 9.492675322270273e-08, "epoch": 0.9163263581828935, "percentage": 91.64, "elapsed_time": "12:20:51", "remaining_time": "1:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4068, "total_steps": 4438, "loss": 0.1076, "learning_rate": 9.441894982498035e-08, "epoch": 0.916551665868702, "percentage": 91.66, "elapsed_time": "12:21:01", "remaining_time": "1:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4069, "total_steps": 4438, "loss": 0.1428, "learning_rate": 9.391248215674942e-08, "epoch": 0.9167769735545104, "percentage": 91.69, "elapsed_time": "12:21:13", "remaining_time": "1:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 4438, "loss": 0.1272, "learning_rate": 9.340735049923277e-08, "epoch": 0.9170022812403188, "percentage": 91.71, "elapsed_time": "12:21:24", "remaining_time": "1:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4071, "total_steps": 4438, "loss": 0.1031, "learning_rate": 9.290355513291105e-08, "epoch": 0.9172275889261272, "percentage": 91.73, "elapsed_time": "12:21:36", "remaining_time": "1:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4072, "total_steps": 4438, "loss": 0.1193, "learning_rate": 9.24010963375227e-08, "epoch": 0.9174528966119356, "percentage": 91.75, "elapsed_time": "12:21:47", "remaining_time": "1:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4073, "total_steps": 4438, "loss": 0.143, "learning_rate": 9.189997439206538e-08, "epoch": 0.9176782042977442, "percentage": 91.78, "elapsed_time": "12:21:58", "remaining_time": "1:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4074, "total_steps": 4438, "loss": 0.1146, "learning_rate": 9.140018957479236e-08, "epoch": 0.9179035119835526, "percentage": 91.8, "elapsed_time": "12:22:06", "remaining_time": "1:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4075, "total_steps": 4438, "loss": 0.1211, "learning_rate": 9.090174216321607e-08, "epoch": 0.918128819669361, "percentage": 91.82, "elapsed_time": "12:22:18", "remaining_time": "1:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4076, "total_steps": 4438, "loss": 0.1424, "learning_rate": 9.040463243410541e-08, "epoch": 0.9183541273551694, "percentage": 91.84, "elapsed_time": "12:22:29", "remaining_time": "1:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4077, "total_steps": 4438, "loss": 0.1158, "learning_rate": 8.990886066348764e-08, "epoch": 0.9185794350409778, "percentage": 91.87, "elapsed_time": "12:22:40", "remaining_time": "1:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4078, "total_steps": 4438, "loss": 0.1322, "learning_rate": 8.941442712664561e-08, "epoch": 0.9188047427267862, "percentage": 91.89, "elapsed_time": "12:22:52", "remaining_time": "1:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4079, "total_steps": 4438, "loss": 0.127, "learning_rate": 8.892133209811971e-08, "epoch": 0.9190300504125947, "percentage": 91.91, "elapsed_time": "12:23:03", "remaining_time": "1:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 4438, "loss": 0.1244, "learning_rate": 8.842957585170814e-08, "epoch": 0.9192553580984031, "percentage": 91.93, "elapsed_time": "12:23:14", "remaining_time": "1:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4081, "total_steps": 4438, "loss": 0.1211, "learning_rate": 8.79391586604636e-08, "epoch": 0.9194806657842116, "percentage": 91.96, "elapsed_time": "12:23:24", "remaining_time": "1:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4082, "total_steps": 4438, "loss": 0.1363, "learning_rate": 8.745008079669742e-08, "epoch": 0.91970597347002, "percentage": 91.98, "elapsed_time": "12:23:34", "remaining_time": "1:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4083, "total_steps": 4438, "loss": 0.1353, "learning_rate": 8.696234253197599e-08, "epoch": 0.9199312811558285, "percentage": 92.0, "elapsed_time": "12:23:44", "remaining_time": "1:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4084, "total_steps": 4438, "loss": 0.1333, "learning_rate": 8.647594413712212e-08, "epoch": 0.9201565888416369, "percentage": 92.02, "elapsed_time": "12:23:55", "remaining_time": "1:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4085, "total_steps": 4438, "loss": 0.1183, "learning_rate": 8.599088588221504e-08, "epoch": 0.9203818965274453, "percentage": 92.05, "elapsed_time": "12:24:06", "remaining_time": "1:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4086, "total_steps": 4438, "loss": 0.1311, "learning_rate": 8.550716803658904e-08, "epoch": 0.9206072042132537, "percentage": 92.07, "elapsed_time": "12:24:16", "remaining_time": "1:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4087, "total_steps": 4438, "loss": 0.1386, "learning_rate": 8.502479086883481e-08, "epoch": 0.9208325118990621, "percentage": 92.09, "elapsed_time": "12:24:28", "remaining_time": "1:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4088, "total_steps": 4438, "loss": 0.1351, "learning_rate": 8.454375464679865e-08, "epoch": 0.9210578195848705, "percentage": 92.11, "elapsed_time": "12:24:37", "remaining_time": "1:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4089, "total_steps": 4438, "loss": 0.1335, "learning_rate": 8.406405963758162e-08, "epoch": 0.9212831272706791, "percentage": 92.14, "elapsed_time": "12:24:48", "remaining_time": "1:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 4438, "loss": 0.1274, "learning_rate": 8.358570610754097e-08, "epoch": 0.9215084349564875, "percentage": 92.16, "elapsed_time": "12:25:00", "remaining_time": "1:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4091, "total_steps": 4438, "loss": 0.13, "learning_rate": 8.310869432228808e-08, "epoch": 0.9217337426422959, "percentage": 92.18, "elapsed_time": "12:25:10", "remaining_time": "1:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4092, "total_steps": 4438, "loss": 0.1203, "learning_rate": 8.263302454669025e-08, "epoch": 0.9219590503281043, "percentage": 92.2, "elapsed_time": "12:25:22", "remaining_time": "1:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4093, "total_steps": 4438, "loss": 0.1354, "learning_rate": 8.215869704486873e-08, "epoch": 0.9221843580139127, "percentage": 92.23, "elapsed_time": "12:25:34", "remaining_time": "1:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4094, "total_steps": 4438, "loss": 0.1184, "learning_rate": 8.168571208020032e-08, "epoch": 0.9224096656997212, "percentage": 92.25, "elapsed_time": "12:25:45", "remaining_time": "1:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4095, "total_steps": 4438, "loss": 0.1266, "learning_rate": 8.121406991531577e-08, "epoch": 0.9226349733855296, "percentage": 92.27, "elapsed_time": "12:25:56", "remaining_time": "1:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4096, "total_steps": 4438, "loss": 0.1174, "learning_rate": 8.074377081210033e-08, "epoch": 0.922860281071338, "percentage": 92.29, "elapsed_time": "12:26:07", "remaining_time": "1:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4097, "total_steps": 4438, "loss": 0.1254, "learning_rate": 8.027481503169371e-08, "epoch": 0.9230855887571465, "percentage": 92.32, "elapsed_time": "12:26:18", "remaining_time": "1:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4098, "total_steps": 4438, "loss": 0.1166, "learning_rate": 7.980720283448957e-08, "epoch": 0.9233108964429549, "percentage": 92.34, "elapsed_time": "12:26:29", "remaining_time": "1:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4099, "total_steps": 4438, "loss": 0.1343, "learning_rate": 7.934093448013492e-08, "epoch": 0.9235362041287634, "percentage": 92.36, "elapsed_time": "12:26:39", "remaining_time": "1:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 4438, "loss": 0.118, "learning_rate": 7.887601022753238e-08, "epoch": 0.9237615118145718, "percentage": 92.38, "elapsed_time": "12:26:49", "remaining_time": "1:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4101, "total_steps": 4438, "loss": 0.1114, "learning_rate": 7.841243033483575e-08, "epoch": 0.9239868195003802, "percentage": 92.41, "elapsed_time": "12:27:00", "remaining_time": "1:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4102, "total_steps": 4438, "loss": 0.1205, "learning_rate": 7.795019505945495e-08, "epoch": 0.9242121271861886, "percentage": 92.43, "elapsed_time": "12:27:10", "remaining_time": "1:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4103, "total_steps": 4438, "loss": 0.1254, "learning_rate": 7.748930465805105e-08, "epoch": 0.924437434871997, "percentage": 92.45, "elapsed_time": "12:27:22", "remaining_time": "1:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4104, "total_steps": 4438, "loss": 0.1264, "learning_rate": 7.702975938653934e-08, "epoch": 0.9246627425578055, "percentage": 92.47, "elapsed_time": "12:27:33", "remaining_time": "1:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4105, "total_steps": 4438, "loss": 0.1227, "learning_rate": 7.657155950008904e-08, "epoch": 0.924888050243614, "percentage": 92.5, "elapsed_time": "12:27:43", "remaining_time": "1:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4106, "total_steps": 4438, "loss": 0.1244, "learning_rate": 7.611470525312054e-08, "epoch": 0.9251133579294224, "percentage": 92.52, "elapsed_time": "12:27:53", "remaining_time": "1:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4107, "total_steps": 4438, "loss": 0.1252, "learning_rate": 7.565919689930839e-08, "epoch": 0.9253386656152308, "percentage": 92.54, "elapsed_time": "12:28:04", "remaining_time": "1:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4108, "total_steps": 4438, "loss": 0.1183, "learning_rate": 7.520503469157947e-08, "epoch": 0.9255639733010392, "percentage": 92.56, "elapsed_time": "12:28:14", "remaining_time": "1:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4109, "total_steps": 4438, "loss": 0.1227, "learning_rate": 7.47522188821126e-08, "epoch": 0.9257892809868477, "percentage": 92.59, "elapsed_time": "12:28:25", "remaining_time": "0:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 4438, "loss": 0.1205, "learning_rate": 7.430074972234053e-08, "epoch": 0.9260145886726561, "percentage": 92.61, "elapsed_time": "12:28:37", "remaining_time": "0:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4111, "total_steps": 4438, "loss": 0.1219, "learning_rate": 7.385062746294608e-08, "epoch": 0.9262398963584645, "percentage": 92.63, "elapsed_time": "12:28:48", "remaining_time": "0:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4112, "total_steps": 4438, "loss": 0.1142, "learning_rate": 7.340185235386627e-08, "epoch": 0.9264652040442729, "percentage": 92.65, "elapsed_time": "12:28:57", "remaining_time": "0:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4113, "total_steps": 4438, "loss": 0.1322, "learning_rate": 7.29544246442887e-08, "epoch": 0.9266905117300814, "percentage": 92.68, "elapsed_time": "12:29:07", "remaining_time": "0:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4114, "total_steps": 4438, "loss": 0.12, "learning_rate": 7.250834458265355e-08, "epoch": 0.9269158194158899, "percentage": 92.7, "elapsed_time": "12:29:18", "remaining_time": "0:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4115, "total_steps": 4438, "loss": 0.1247, "learning_rate": 7.206361241665266e-08, "epoch": 0.9271411271016983, "percentage": 92.72, "elapsed_time": "12:29:28", "remaining_time": "0:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4116, "total_steps": 4438, "loss": 0.1182, "learning_rate": 7.162022839322824e-08, "epoch": 0.9273664347875067, "percentage": 92.74, "elapsed_time": "12:29:38", "remaining_time": "0:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4117, "total_steps": 4438, "loss": 0.1213, "learning_rate": 7.117819275857613e-08, "epoch": 0.9275917424733151, "percentage": 92.77, "elapsed_time": "12:29:49", "remaining_time": "0:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4118, "total_steps": 4438, "loss": 0.1285, "learning_rate": 7.073750575814136e-08, "epoch": 0.9278170501591235, "percentage": 92.79, "elapsed_time": "12:29:59", "remaining_time": "0:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4119, "total_steps": 4438, "loss": 0.12, "learning_rate": 7.029816763662129e-08, "epoch": 0.9280423578449319, "percentage": 92.81, "elapsed_time": "12:30:09", "remaining_time": "0:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 4438, "loss": 0.1171, "learning_rate": 6.986017863796435e-08, "epoch": 0.9282676655307405, "percentage": 92.83, "elapsed_time": "12:30:19", "remaining_time": "0:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4121, "total_steps": 4438, "loss": 0.1204, "learning_rate": 6.94235390053688e-08, "epoch": 0.9284929732165489, "percentage": 92.86, "elapsed_time": "12:30:30", "remaining_time": "0:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4122, "total_steps": 4438, "loss": 0.1248, "learning_rate": 6.898824898128515e-08, "epoch": 0.9287182809023573, "percentage": 92.88, "elapsed_time": "12:30:39", "remaining_time": "0:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4123, "total_steps": 4438, "loss": 0.1222, "learning_rate": 6.85543088074131e-08, "epoch": 0.9289435885881657, "percentage": 92.9, "elapsed_time": "12:30:49", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4124, "total_steps": 4438, "loss": 0.1252, "learning_rate": 6.81217187247038e-08, "epoch": 0.9291688962739741, "percentage": 92.92, "elapsed_time": "12:31:00", "remaining_time": "0:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4125, "total_steps": 4438, "loss": 0.135, "learning_rate": 6.769047897335818e-08, "epoch": 0.9293942039597826, "percentage": 92.95, "elapsed_time": "12:31:11", "remaining_time": "0:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4126, "total_steps": 4438, "loss": 0.1128, "learning_rate": 6.726058979282774e-08, "epoch": 0.929619511645591, "percentage": 92.97, "elapsed_time": "12:31:21", "remaining_time": "0:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4127, "total_steps": 4438, "loss": 0.118, "learning_rate": 6.683205142181404e-08, "epoch": 0.9298448193313994, "percentage": 92.99, "elapsed_time": "12:31:32", "remaining_time": "0:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4128, "total_steps": 4438, "loss": 0.1285, "learning_rate": 6.640486409826785e-08, "epoch": 0.9300701270172079, "percentage": 93.01, "elapsed_time": "12:31:43", "remaining_time": "0:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4129, "total_steps": 4438, "loss": 0.1206, "learning_rate": 6.597902805939138e-08, "epoch": 0.9302954347030163, "percentage": 93.04, "elapsed_time": "12:31:55", "remaining_time": "0:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 4438, "loss": 0.1307, "learning_rate": 6.555454354163437e-08, "epoch": 0.9305207423888248, "percentage": 93.06, "elapsed_time": "12:32:05", "remaining_time": "0:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4131, "total_steps": 4438, "loss": 0.1124, "learning_rate": 6.513141078069828e-08, "epoch": 0.9307460500746332, "percentage": 93.08, "elapsed_time": "12:32:17", "remaining_time": "0:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4132, "total_steps": 4438, "loss": 0.1365, "learning_rate": 6.470963001153268e-08, "epoch": 0.9309713577604416, "percentage": 93.11, "elapsed_time": "12:32:27", "remaining_time": "0:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4133, "total_steps": 4438, "loss": 0.1277, "learning_rate": 6.428920146833606e-08, "epoch": 0.93119666544625, "percentage": 93.13, "elapsed_time": "12:32:38", "remaining_time": "0:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4134, "total_steps": 4438, "loss": 0.1353, "learning_rate": 6.387012538455723e-08, "epoch": 0.9314219731320584, "percentage": 93.15, "elapsed_time": "12:32:49", "remaining_time": "0:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4135, "total_steps": 4438, "loss": 0.1274, "learning_rate": 6.345240199289365e-08, "epoch": 0.9316472808178669, "percentage": 93.17, "elapsed_time": "12:33:00", "remaining_time": "0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4136, "total_steps": 4438, "loss": 0.1249, "learning_rate": 6.303603152529119e-08, "epoch": 0.9318725885036754, "percentage": 93.2, "elapsed_time": "12:33:10", "remaining_time": "0:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4137, "total_steps": 4438, "loss": 0.1205, "learning_rate": 6.262101421294547e-08, "epoch": 0.9320978961894838, "percentage": 93.22, "elapsed_time": "12:33:20", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4138, "total_steps": 4438, "loss": 0.1206, "learning_rate": 6.220735028629937e-08, "epoch": 0.9323232038752922, "percentage": 93.24, "elapsed_time": "12:33:31", "remaining_time": "0:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4139, "total_steps": 4438, "loss": 0.1222, "learning_rate": 6.179503997504554e-08, "epoch": 0.9325485115611006, "percentage": 93.26, "elapsed_time": "12:33:42", "remaining_time": "0:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 4438, "loss": 0.1229, "learning_rate": 6.13840835081242e-08, "epoch": 0.932773819246909, "percentage": 93.29, "elapsed_time": "12:33:53", "remaining_time": "0:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4141, "total_steps": 4438, "loss": 0.1364, "learning_rate": 6.097448111372446e-08, "epoch": 0.9329991269327175, "percentage": 93.31, "elapsed_time": "12:34:03", "remaining_time": "0:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4142, "total_steps": 4438, "loss": 0.1344, "learning_rate": 6.056623301928327e-08, "epoch": 0.9332244346185259, "percentage": 93.33, "elapsed_time": "12:34:15", "remaining_time": "0:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4143, "total_steps": 4438, "loss": 0.114, "learning_rate": 6.015933945148517e-08, "epoch": 0.9334497423043343, "percentage": 93.35, "elapsed_time": "12:34:25", "remaining_time": "0:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4144, "total_steps": 4438, "loss": 0.1243, "learning_rate": 5.975380063626356e-08, "epoch": 0.9336750499901428, "percentage": 93.38, "elapsed_time": "12:34:35", "remaining_time": "0:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4145, "total_steps": 4438, "loss": 0.1236, "learning_rate": 5.934961679879836e-08, "epoch": 0.9339003576759513, "percentage": 93.4, "elapsed_time": "12:34:46", "remaining_time": "0:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4146, "total_steps": 4438, "loss": 0.1165, "learning_rate": 5.894678816351862e-08, "epoch": 0.9341256653617597, "percentage": 93.42, "elapsed_time": "12:34:56", "remaining_time": "0:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4147, "total_steps": 4438, "loss": 0.1226, "learning_rate": 5.854531495409932e-08, "epoch": 0.9343509730475681, "percentage": 93.44, "elapsed_time": "12:35:07", "remaining_time": "0:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4148, "total_steps": 4438, "loss": 0.1276, "learning_rate": 5.8145197393463806e-08, "epoch": 0.9345762807333765, "percentage": 93.47, "elapsed_time": "12:35:17", "remaining_time": "0:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4149, "total_steps": 4438, "loss": 0.1176, "learning_rate": 5.774643570378296e-08, "epoch": 0.9348015884191849, "percentage": 93.49, "elapsed_time": "12:35:27", "remaining_time": "0:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 4438, "loss": 0.1206, "learning_rate": 5.73490301064733e-08, "epoch": 0.9350268961049933, "percentage": 93.51, "elapsed_time": "12:35:37", "remaining_time": "0:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4151, "total_steps": 4438, "loss": 0.135, "learning_rate": 5.695298082219997e-08, "epoch": 0.9352522037908018, "percentage": 93.53, "elapsed_time": "12:35:47", "remaining_time": "0:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4152, "total_steps": 4438, "loss": 0.1191, "learning_rate": 5.6558288070874544e-08, "epoch": 0.9354775114766103, "percentage": 93.56, "elapsed_time": "12:35:58", "remaining_time": "0:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4153, "total_steps": 4438, "loss": 0.1358, "learning_rate": 5.616495207165451e-08, "epoch": 0.9357028191624187, "percentage": 93.58, "elapsed_time": "12:36:08", "remaining_time": "0:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4154, "total_steps": 4438, "loss": 0.1255, "learning_rate": 5.577297304294543e-08, "epoch": 0.9359281268482271, "percentage": 93.6, "elapsed_time": "12:36:18", "remaining_time": "0:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4155, "total_steps": 4438, "loss": 0.1214, "learning_rate": 5.538235120239821e-08, "epoch": 0.9361534345340355, "percentage": 93.62, "elapsed_time": "12:36:28", "remaining_time": "0:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4156, "total_steps": 4438, "loss": 0.1217, "learning_rate": 5.4993086766910733e-08, "epoch": 0.936378742219844, "percentage": 93.65, "elapsed_time": "12:36:41", "remaining_time": "0:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4157, "total_steps": 4438, "loss": 0.1281, "learning_rate": 5.460517995262704e-08, "epoch": 0.9366040499056524, "percentage": 93.67, "elapsed_time": "12:36:51", "remaining_time": "0:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4158, "total_steps": 4438, "loss": 0.1233, "learning_rate": 5.421863097493707e-08, "epoch": 0.9368293575914608, "percentage": 93.69, "elapsed_time": "12:37:01", "remaining_time": "0:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4159, "total_steps": 4438, "loss": 0.1293, "learning_rate": 5.383344004847774e-08, "epoch": 0.9370546652772692, "percentage": 93.71, "elapsed_time": "12:37:12", "remaining_time": "0:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 4438, "loss": 0.112, "learning_rate": 5.344960738713018e-08, "epoch": 0.9372799729630777, "percentage": 93.74, "elapsed_time": "12:37:21", "remaining_time": "0:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4161, "total_steps": 4438, "loss": 0.1356, "learning_rate": 5.3067133204023344e-08, "epoch": 0.9375052806488862, "percentage": 93.76, "elapsed_time": "12:37:31", "remaining_time": "0:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4162, "total_steps": 4438, "loss": 0.1194, "learning_rate": 5.268601771153042e-08, "epoch": 0.9377305883346946, "percentage": 93.78, "elapsed_time": "12:37:42", "remaining_time": "0:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4163, "total_steps": 4438, "loss": 0.1227, "learning_rate": 5.230626112127046e-08, "epoch": 0.937955896020503, "percentage": 93.8, "elapsed_time": "12:37:52", "remaining_time": "0:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4164, "total_steps": 4438, "loss": 0.1247, "learning_rate": 5.192786364410868e-08, "epoch": 0.9381812037063114, "percentage": 93.83, "elapsed_time": "12:38:03", "remaining_time": "0:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4165, "total_steps": 4438, "loss": 0.117, "learning_rate": 5.15508254901545e-08, "epoch": 0.9384065113921198, "percentage": 93.85, "elapsed_time": "12:38:13", "remaining_time": "0:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4166, "total_steps": 4438, "loss": 0.1221, "learning_rate": 5.117514686876379e-08, "epoch": 0.9386318190779283, "percentage": 93.87, "elapsed_time": "12:38:23", "remaining_time": "0:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4167, "total_steps": 4438, "loss": 0.1215, "learning_rate": 5.080082798853664e-08, "epoch": 0.9388571267637368, "percentage": 93.89, "elapsed_time": "12:38:33", "remaining_time": "0:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4168, "total_steps": 4438, "loss": 0.1268, "learning_rate": 5.0427869057317894e-08, "epoch": 0.9390824344495452, "percentage": 93.92, "elapsed_time": "12:38:42", "remaining_time": "0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4169, "total_steps": 4438, "loss": 0.1246, "learning_rate": 5.0056270282198286e-08, "epoch": 0.9393077421353536, "percentage": 93.94, "elapsed_time": "12:38:53", "remaining_time": "0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 4438, "loss": 0.1219, "learning_rate": 4.9686031869512486e-08, "epoch": 0.939533049821162, "percentage": 93.96, "elapsed_time": "12:39:05", "remaining_time": "0:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4171, "total_steps": 4438, "loss": 0.1175, "learning_rate": 4.93171540248405e-08, "epoch": 0.9397583575069705, "percentage": 93.98, "elapsed_time": "12:39:16", "remaining_time": "0:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4172, "total_steps": 4438, "loss": 0.1354, "learning_rate": 4.89496369530057e-08, "epoch": 0.9399836651927789, "percentage": 94.01, "elapsed_time": "12:39:26", "remaining_time": "0:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4173, "total_steps": 4438, "loss": 0.1232, "learning_rate": 4.858348085807735e-08, "epoch": 0.9402089728785873, "percentage": 94.03, "elapsed_time": "12:39:37", "remaining_time": "0:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4174, "total_steps": 4438, "loss": 0.128, "learning_rate": 4.8218685943368094e-08, "epoch": 0.9404342805643957, "percentage": 94.05, "elapsed_time": "12:39:48", "remaining_time": "0:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4175, "total_steps": 4438, "loss": 0.1357, "learning_rate": 4.7855252411434516e-08, "epoch": 0.9406595882502042, "percentage": 94.07, "elapsed_time": "12:39:59", "remaining_time": "0:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4176, "total_steps": 4438, "loss": 0.1243, "learning_rate": 4.7493180464078246e-08, "epoch": 0.9408848959360127, "percentage": 94.1, "elapsed_time": "12:40:10", "remaining_time": "0:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4177, "total_steps": 4438, "loss": 0.1281, "learning_rate": 4.713247030234402e-08, "epoch": 0.9411102036218211, "percentage": 94.12, "elapsed_time": "12:40:21", "remaining_time": "0:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4178, "total_steps": 4438, "loss": 0.1193, "learning_rate": 4.677312212652108e-08, "epoch": 0.9413355113076295, "percentage": 94.14, "elapsed_time": "12:40:31", "remaining_time": "0:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4179, "total_steps": 4438, "loss": 0.1262, "learning_rate": 4.641513613614174e-08, "epoch": 0.9415608189934379, "percentage": 94.16, "elapsed_time": "12:40:42", "remaining_time": "0:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 4438, "loss": 0.1277, "learning_rate": 4.605851252998256e-08, "epoch": 0.9417861266792463, "percentage": 94.19, "elapsed_time": "12:40:53", "remaining_time": "0:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4181, "total_steps": 4438, "loss": 0.1208, "learning_rate": 4.570325150606292e-08, "epoch": 0.9420114343650547, "percentage": 94.21, "elapsed_time": "12:41:04", "remaining_time": "0:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4182, "total_steps": 4438, "loss": 0.1225, "learning_rate": 4.5349353261646414e-08, "epoch": 0.9422367420508632, "percentage": 94.23, "elapsed_time": "12:41:14", "remaining_time": "0:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4183, "total_steps": 4438, "loss": 0.1089, "learning_rate": 4.4996817993239464e-08, "epoch": 0.9424620497366717, "percentage": 94.25, "elapsed_time": "12:41:24", "remaining_time": "0:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4184, "total_steps": 4438, "loss": 0.1309, "learning_rate": 4.464564589659187e-08, "epoch": 0.9426873574224801, "percentage": 94.28, "elapsed_time": "12:41:36", "remaining_time": "0:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4185, "total_steps": 4438, "loss": 0.121, "learning_rate": 4.4295837166696e-08, "epoch": 0.9429126651082885, "percentage": 94.3, "elapsed_time": "12:41:45", "remaining_time": "0:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4186, "total_steps": 4438, "loss": 0.1362, "learning_rate": 4.3947391997787857e-08, "epoch": 0.943137972794097, "percentage": 94.32, "elapsed_time": "12:41:55", "remaining_time": "0:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4187, "total_steps": 4438, "loss": 0.1368, "learning_rate": 4.360031058334602e-08, "epoch": 0.9433632804799054, "percentage": 94.34, "elapsed_time": "12:42:05", "remaining_time": "0:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4188, "total_steps": 4438, "loss": 0.1249, "learning_rate": 4.325459311609187e-08, "epoch": 0.9435885881657138, "percentage": 94.37, "elapsed_time": "12:42:15", "remaining_time": "0:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4189, "total_steps": 4438, "loss": 0.1317, "learning_rate": 4.291023978798964e-08, "epoch": 0.9438138958515222, "percentage": 94.39, "elapsed_time": "12:42:26", "remaining_time": "0:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 4438, "loss": 0.1367, "learning_rate": 4.256725079024554e-08, "epoch": 0.9440392035373306, "percentage": 94.41, "elapsed_time": "12:42:36", "remaining_time": "0:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4191, "total_steps": 4438, "loss": 0.1238, "learning_rate": 4.22256263133089e-08, "epoch": 0.9442645112231391, "percentage": 94.43, "elapsed_time": "12:42:46", "remaining_time": "0:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4192, "total_steps": 4438, "loss": 0.1282, "learning_rate": 4.1885366546870754e-08, "epoch": 0.9444898189089476, "percentage": 94.46, "elapsed_time": "12:42:58", "remaining_time": "0:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4193, "total_steps": 4438, "loss": 0.1287, "learning_rate": 4.1546471679864975e-08, "epoch": 0.944715126594756, "percentage": 94.48, "elapsed_time": "12:43:09", "remaining_time": "0:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4194, "total_steps": 4438, "loss": 0.1139, "learning_rate": 4.120894190046687e-08, "epoch": 0.9449404342805644, "percentage": 94.5, "elapsed_time": "12:43:18", "remaining_time": "0:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4195, "total_steps": 4438, "loss": 0.116, "learning_rate": 4.087277739609458e-08, "epoch": 0.9451657419663728, "percentage": 94.52, "elapsed_time": "12:43:29", "remaining_time": "0:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4196, "total_steps": 4438, "loss": 0.1249, "learning_rate": 4.053797835340739e-08, "epoch": 0.9453910496521812, "percentage": 94.55, "elapsed_time": "12:43:39", "remaining_time": "0:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4197, "total_steps": 4438, "loss": 0.1114, "learning_rate": 4.020454495830689e-08, "epoch": 0.9456163573379897, "percentage": 94.57, "elapsed_time": "12:43:50", "remaining_time": "0:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4198, "total_steps": 4438, "loss": 0.1289, "learning_rate": 3.987247739593636e-08, "epoch": 0.9458416650237981, "percentage": 94.59, "elapsed_time": "12:44:02", "remaining_time": "0:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4199, "total_steps": 4438, "loss": 0.1206, "learning_rate": 3.9541775850679975e-08, "epoch": 0.9460669727096066, "percentage": 94.61, "elapsed_time": "12:44:12", "remaining_time": "0:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 4438, "loss": 0.12, "learning_rate": 3.9212440506164465e-08, "epoch": 0.946292280395415, "percentage": 94.64, "elapsed_time": "12:44:22", "remaining_time": "0:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4201, "total_steps": 4438, "loss": 0.1262, "learning_rate": 3.888447154525771e-08, "epoch": 0.9465175880812234, "percentage": 94.66, "elapsed_time": "12:44:33", "remaining_time": "0:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4202, "total_steps": 4438, "loss": 0.1178, "learning_rate": 3.855786915006793e-08, "epoch": 0.9467428957670319, "percentage": 94.68, "elapsed_time": "12:44:45", "remaining_time": "0:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4203, "total_steps": 4438, "loss": 0.1092, "learning_rate": 3.8232633501945896e-08, "epoch": 0.9469682034528403, "percentage": 94.7, "elapsed_time": "12:44:54", "remaining_time": "0:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4204, "total_steps": 4438, "loss": 0.1278, "learning_rate": 3.790876478148242e-08, "epoch": 0.9471935111386487, "percentage": 94.73, "elapsed_time": "12:45:05", "remaining_time": "0:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4205, "total_steps": 4438, "loss": 0.1302, "learning_rate": 3.758626316850977e-08, "epoch": 0.9474188188244571, "percentage": 94.75, "elapsed_time": "12:45:16", "remaining_time": "0:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4206, "total_steps": 4438, "loss": 0.1349, "learning_rate": 3.726512884210165e-08, "epoch": 0.9476441265102655, "percentage": 94.77, "elapsed_time": "12:45:28", "remaining_time": "0:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4207, "total_steps": 4438, "loss": 0.1168, "learning_rate": 3.694536198057097e-08, "epoch": 0.9478694341960741, "percentage": 94.79, "elapsed_time": "12:45:39", "remaining_time": "0:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4208, "total_steps": 4438, "loss": 0.125, "learning_rate": 3.6626962761473205e-08, "epoch": 0.9480947418818825, "percentage": 94.82, "elapsed_time": "12:45:50", "remaining_time": "0:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4209, "total_steps": 4438, "loss": 0.1112, "learning_rate": 3.630993136160332e-08, "epoch": 0.9483200495676909, "percentage": 94.84, "elapsed_time": "12:46:00", "remaining_time": "0:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 4438, "loss": 0.1287, "learning_rate": 3.599426795699662e-08, "epoch": 0.9485453572534993, "percentage": 94.86, "elapsed_time": "12:46:11", "remaining_time": "0:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4211, "total_steps": 4438, "loss": 0.1323, "learning_rate": 3.567997272293011e-08, "epoch": 0.9487706649393077, "percentage": 94.89, "elapsed_time": "12:46:22", "remaining_time": "0:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4212, "total_steps": 4438, "loss": 0.1245, "learning_rate": 3.53670458339192e-08, "epoch": 0.9489959726251161, "percentage": 94.91, "elapsed_time": "12:46:32", "remaining_time": "0:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4213, "total_steps": 4438, "loss": 0.1192, "learning_rate": 3.505548746372128e-08, "epoch": 0.9492212803109246, "percentage": 94.93, "elapsed_time": "12:46:43", "remaining_time": "0:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4214, "total_steps": 4438, "loss": 0.1256, "learning_rate": 3.474529778533298e-08, "epoch": 0.9494465879967331, "percentage": 94.95, "elapsed_time": "12:46:54", "remaining_time": "0:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4215, "total_steps": 4438, "loss": 0.1182, "learning_rate": 3.443647697099067e-08, "epoch": 0.9496718956825415, "percentage": 94.98, "elapsed_time": "12:47:04", "remaining_time": "0:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4216, "total_steps": 4438, "loss": 0.1249, "learning_rate": 3.412902519217137e-08, "epoch": 0.9498972033683499, "percentage": 95.0, "elapsed_time": "12:47:15", "remaining_time": "0:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4217, "total_steps": 4438, "loss": 0.1209, "learning_rate": 3.382294261959157e-08, "epoch": 0.9501225110541583, "percentage": 95.02, "elapsed_time": "12:47:25", "remaining_time": "0:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4218, "total_steps": 4438, "loss": 0.1322, "learning_rate": 3.351822942320754e-08, "epoch": 0.9503478187399668, "percentage": 95.04, "elapsed_time": "12:47:36", "remaining_time": "0:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4219, "total_steps": 4438, "loss": 0.1295, "learning_rate": 3.3214885772215046e-08, "epoch": 0.9505731264257752, "percentage": 95.07, "elapsed_time": "12:47:46", "remaining_time": "0:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 4438, "loss": 0.1217, "learning_rate": 3.2912911835049634e-08, "epoch": 0.9507984341115836, "percentage": 95.09, "elapsed_time": "12:47:58", "remaining_time": "0:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4221, "total_steps": 4438, "loss": 0.1346, "learning_rate": 3.261230777938607e-08, "epoch": 0.951023741797392, "percentage": 95.11, "elapsed_time": "12:48:10", "remaining_time": "0:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4222, "total_steps": 4438, "loss": 0.1348, "learning_rate": 3.231307377213833e-08, "epoch": 0.9512490494832005, "percentage": 95.13, "elapsed_time": "12:48:21", "remaining_time": "0:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4223, "total_steps": 4438, "loss": 0.1369, "learning_rate": 3.201520997946045e-08, "epoch": 0.951474357169009, "percentage": 95.16, "elapsed_time": "12:48:32", "remaining_time": "0:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4224, "total_steps": 4438, "loss": 0.1127, "learning_rate": 3.171871656674458e-08, "epoch": 0.9516996648548174, "percentage": 95.18, "elapsed_time": "12:48:43", "remaining_time": "0:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4225, "total_steps": 4438, "loss": 0.1191, "learning_rate": 3.142359369862291e-08, "epoch": 0.9519249725406258, "percentage": 95.2, "elapsed_time": "12:48:52", "remaining_time": "0:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4226, "total_steps": 4438, "loss": 0.144, "learning_rate": 3.112984153896603e-08, "epoch": 0.9521502802264342, "percentage": 95.22, "elapsed_time": "12:49:03", "remaining_time": "0:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4227, "total_steps": 4438, "loss": 0.1281, "learning_rate": 3.0837460250883186e-08, "epoch": 0.9523755879122426, "percentage": 95.25, "elapsed_time": "12:49:13", "remaining_time": "0:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4228, "total_steps": 4438, "loss": 0.1258, "learning_rate": 3.0546449996723404e-08, "epoch": 0.9526008955980511, "percentage": 95.27, "elapsed_time": "12:49:23", "remaining_time": "0:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4229, "total_steps": 4438, "loss": 0.118, "learning_rate": 3.0256810938073534e-08, "epoch": 0.9528262032838595, "percentage": 95.29, "elapsed_time": "12:49:32", "remaining_time": "0:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 4438, "loss": 0.133, "learning_rate": 2.996854323575937e-08, "epoch": 0.953051510969668, "percentage": 95.31, "elapsed_time": "12:49:42", "remaining_time": "0:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4231, "total_steps": 4438, "loss": 0.125, "learning_rate": 2.968164704984483e-08, "epoch": 0.9532768186554764, "percentage": 95.34, "elapsed_time": "12:49:52", "remaining_time": "0:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4232, "total_steps": 4438, "loss": 0.1303, "learning_rate": 2.939612253963331e-08, "epoch": 0.9535021263412848, "percentage": 95.36, "elapsed_time": "12:50:03", "remaining_time": "0:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4233, "total_steps": 4438, "loss": 0.1382, "learning_rate": 2.911196986366577e-08, "epoch": 0.9537274340270933, "percentage": 95.38, "elapsed_time": "12:50:13", "remaining_time": "0:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4234, "total_steps": 4438, "loss": 0.1275, "learning_rate": 2.8829189179721552e-08, "epoch": 0.9539527417129017, "percentage": 95.4, "elapsed_time": "12:50:24", "remaining_time": "0:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4235, "total_steps": 4438, "loss": 0.1262, "learning_rate": 2.8547780644818113e-08, "epoch": 0.9541780493987101, "percentage": 95.43, "elapsed_time": "12:50:35", "remaining_time": "0:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4236, "total_steps": 4438, "loss": 0.1186, "learning_rate": 2.8267744415211296e-08, "epoch": 0.9544033570845185, "percentage": 95.45, "elapsed_time": "12:50:44", "remaining_time": "0:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4237, "total_steps": 4438, "loss": 0.1464, "learning_rate": 2.7989080646394217e-08, "epoch": 0.9546286647703269, "percentage": 95.47, "elapsed_time": "12:50:55", "remaining_time": "0:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4238, "total_steps": 4438, "loss": 0.116, "learning_rate": 2.7711789493099495e-08, "epoch": 0.9548539724561355, "percentage": 95.49, "elapsed_time": "12:51:08", "remaining_time": "0:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4239, "total_steps": 4438, "loss": 0.116, "learning_rate": 2.743587110929563e-08, "epoch": 0.9550792801419439, "percentage": 95.52, "elapsed_time": "12:51:18", "remaining_time": "0:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 4438, "loss": 0.1334, "learning_rate": 2.716132564819035e-08, "epoch": 0.9553045878277523, "percentage": 95.54, "elapsed_time": "12:51:28", "remaining_time": "0:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4241, "total_steps": 4438, "loss": 0.126, "learning_rate": 2.688815326222838e-08, "epoch": 0.9555298955135607, "percentage": 95.56, "elapsed_time": "12:51:38", "remaining_time": "0:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4242, "total_steps": 4438, "loss": 0.1262, "learning_rate": 2.661635410309199e-08, "epoch": 0.9557552031993691, "percentage": 95.58, "elapsed_time": "12:51:48", "remaining_time": "0:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4243, "total_steps": 4438, "loss": 0.1273, "learning_rate": 2.6345928321701575e-08, "epoch": 0.9559805108851775, "percentage": 95.61, "elapsed_time": "12:52:00", "remaining_time": "0:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4244, "total_steps": 4438, "loss": 0.1127, "learning_rate": 2.6076876068213965e-08, "epoch": 0.956205818570986, "percentage": 95.63, "elapsed_time": "12:52:10", "remaining_time": "0:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4245, "total_steps": 4438, "loss": 0.1335, "learning_rate": 2.5809197492024372e-08, "epoch": 0.9564311262567944, "percentage": 95.65, "elapsed_time": "12:52:21", "remaining_time": "0:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4246, "total_steps": 4438, "loss": 0.1221, "learning_rate": 2.554289274176419e-08, "epoch": 0.9566564339426029, "percentage": 95.67, "elapsed_time": "12:52:32", "remaining_time": "0:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4247, "total_steps": 4438, "loss": 0.1275, "learning_rate": 2.5277961965302633e-08, "epoch": 0.9568817416284113, "percentage": 95.7, "elapsed_time": "12:52:45", "remaining_time": "0:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4248, "total_steps": 4438, "loss": 0.1195, "learning_rate": 2.5014405309746193e-08, "epoch": 0.9571070493142197, "percentage": 95.72, "elapsed_time": "12:52:55", "remaining_time": "0:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4249, "total_steps": 4438, "loss": 0.1229, "learning_rate": 2.4752222921437807e-08, "epoch": 0.9573323570000282, "percentage": 95.74, "elapsed_time": "12:53:05", "remaining_time": "0:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 4438, "loss": 0.1315, "learning_rate": 2.449141494595797e-08, "epoch": 0.9575576646858366, "percentage": 95.76, "elapsed_time": "12:53:16", "remaining_time": "0:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4251, "total_steps": 4438, "loss": 0.118, "learning_rate": 2.423198152812306e-08, "epoch": 0.957782972371645, "percentage": 95.79, "elapsed_time": "12:53:26", "remaining_time": "0:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4252, "total_steps": 4438, "loss": 0.1304, "learning_rate": 2.3973922811987295e-08, "epoch": 0.9580082800574534, "percentage": 95.81, "elapsed_time": "12:53:37", "remaining_time": "0:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4253, "total_steps": 4438, "loss": 0.1214, "learning_rate": 2.3717238940840493e-08, "epoch": 0.9582335877432618, "percentage": 95.83, "elapsed_time": "12:53:47", "remaining_time": "0:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4254, "total_steps": 4438, "loss": 0.1235, "learning_rate": 2.3461930057210037e-08, "epoch": 0.9584588954290704, "percentage": 95.85, "elapsed_time": "12:53:58", "remaining_time": "0:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4255, "total_steps": 4438, "loss": 0.1151, "learning_rate": 2.320799630285947e-08, "epoch": 0.9586842031148788, "percentage": 95.88, "elapsed_time": "12:54:09", "remaining_time": "0:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4256, "total_steps": 4438, "loss": 0.1373, "learning_rate": 2.2955437818788508e-08, "epoch": 0.9589095108006872, "percentage": 95.9, "elapsed_time": "12:54:20", "remaining_time": "0:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4257, "total_steps": 4438, "loss": 0.1185, "learning_rate": 2.2704254745233577e-08, "epoch": 0.9591348184864956, "percentage": 95.92, "elapsed_time": "12:54:30", "remaining_time": "0:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4258, "total_steps": 4438, "loss": 0.1263, "learning_rate": 2.2454447221667563e-08, "epoch": 0.959360126172304, "percentage": 95.94, "elapsed_time": "12:54:40", "remaining_time": "0:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4259, "total_steps": 4438, "loss": 0.1261, "learning_rate": 2.2206015386798673e-08, "epoch": 0.9595854338581125, "percentage": 95.97, "elapsed_time": "12:54:52", "remaining_time": "0:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 4438, "loss": 0.1174, "learning_rate": 2.1958959378572398e-08, "epoch": 0.9598107415439209, "percentage": 95.99, "elapsed_time": "12:55:02", "remaining_time": "0:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4261, "total_steps": 4438, "loss": 0.1272, "learning_rate": 2.1713279334169278e-08, "epoch": 0.9600360492297294, "percentage": 96.01, "elapsed_time": "12:55:13", "remaining_time": "0:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4262, "total_steps": 4438, "loss": 0.1182, "learning_rate": 2.1468975390006587e-08, "epoch": 0.9602613569155378, "percentage": 96.03, "elapsed_time": "12:55:22", "remaining_time": "0:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4263, "total_steps": 4438, "loss": 0.119, "learning_rate": 2.1226047681737193e-08, "epoch": 0.9604866646013462, "percentage": 96.06, "elapsed_time": "12:55:34", "remaining_time": "0:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4264, "total_steps": 4438, "loss": 0.1243, "learning_rate": 2.0984496344249596e-08, "epoch": 0.9607119722871547, "percentage": 96.08, "elapsed_time": "12:55:44", "remaining_time": "0:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4265, "total_steps": 4438, "loss": 0.1146, "learning_rate": 2.074432151166844e-08, "epoch": 0.9609372799729631, "percentage": 96.1, "elapsed_time": "12:55:54", "remaining_time": "0:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4266, "total_steps": 4438, "loss": 0.1382, "learning_rate": 2.0505523317353727e-08, "epoch": 0.9611625876587715, "percentage": 96.12, "elapsed_time": "12:56:04", "remaining_time": "0:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4267, "total_steps": 4438, "loss": 0.1229, "learning_rate": 2.0268101893901327e-08, "epoch": 0.9613878953445799, "percentage": 96.15, "elapsed_time": "12:56:14", "remaining_time": "0:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4268, "total_steps": 4438, "loss": 0.128, "learning_rate": 2.0032057373142453e-08, "epoch": 0.9616132030303883, "percentage": 96.17, "elapsed_time": "12:56:27", "remaining_time": "0:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4269, "total_steps": 4438, "loss": 0.1321, "learning_rate": 1.9797389886143658e-08, "epoch": 0.9618385107161969, "percentage": 96.19, "elapsed_time": "12:56:37", "remaining_time": "0:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 4438, "loss": 0.1195, "learning_rate": 1.956409956320737e-08, "epoch": 0.9620638184020053, "percentage": 96.21, "elapsed_time": "12:56:49", "remaining_time": "0:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4271, "total_steps": 4438, "loss": 0.1362, "learning_rate": 1.933218653387081e-08, "epoch": 0.9622891260878137, "percentage": 96.24, "elapsed_time": "12:56:59", "remaining_time": "0:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4272, "total_steps": 4438, "loss": 0.1312, "learning_rate": 1.91016509269068e-08, "epoch": 0.9625144337736221, "percentage": 96.26, "elapsed_time": "12:57:09", "remaining_time": "0:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4273, "total_steps": 4438, "loss": 0.1339, "learning_rate": 1.8872492870322945e-08, "epoch": 0.9627397414594305, "percentage": 96.28, "elapsed_time": "12:57:20", "remaining_time": "0:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4274, "total_steps": 4438, "loss": 0.1228, "learning_rate": 1.864471249136218e-08, "epoch": 0.962965049145239, "percentage": 96.3, "elapsed_time": "12:57:30", "remaining_time": "0:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4275, "total_steps": 4438, "loss": 0.1276, "learning_rate": 1.8418309916502787e-08, "epoch": 0.9631903568310474, "percentage": 96.33, "elapsed_time": "12:57:41", "remaining_time": "0:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4276, "total_steps": 4438, "loss": 0.1079, "learning_rate": 1.819328527145725e-08, "epoch": 0.9634156645168558, "percentage": 96.35, "elapsed_time": "12:57:52", "remaining_time": "0:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4277, "total_steps": 4438, "loss": 0.117, "learning_rate": 1.7969638681173684e-08, "epoch": 0.9636409722026643, "percentage": 96.37, "elapsed_time": "12:58:02", "remaining_time": "0:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4278, "total_steps": 4438, "loss": 0.122, "learning_rate": 1.774737026983414e-08, "epoch": 0.9638662798884727, "percentage": 96.39, "elapsed_time": "12:58:14", "remaining_time": "0:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4279, "total_steps": 4438, "loss": 0.1337, "learning_rate": 1.752648016085684e-08, "epoch": 0.9640915875742812, "percentage": 96.42, "elapsed_time": "12:58:26", "remaining_time": "0:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.7306968476893393e-08, "epoch": 0.9643168952600896, "percentage": 96.44, "elapsed_time": "12:58:37", "remaining_time": "0:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4281, "total_steps": 4438, "loss": 0.133, "learning_rate": 1.708883533983019e-08, "epoch": 0.964542202945898, "percentage": 96.46, "elapsed_time": "12:58:47", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4282, "total_steps": 4438, "loss": 0.1308, "learning_rate": 1.6872080870788955e-08, "epoch": 0.9647675106317064, "percentage": 96.48, "elapsed_time": "12:58:58", "remaining_time": "0:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4283, "total_steps": 4438, "loss": 0.1131, "learning_rate": 1.6656705190125078e-08, "epoch": 0.9649928183175148, "percentage": 96.51, "elapsed_time": "12:59:08", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4284, "total_steps": 4438, "loss": 0.1202, "learning_rate": 1.6442708417428732e-08, "epoch": 0.9652181260033232, "percentage": 96.53, "elapsed_time": "12:59:19", "remaining_time": "0:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4285, "total_steps": 4438, "loss": 0.1262, "learning_rate": 1.6230090671524312e-08, "epoch": 0.9654434336891318, "percentage": 96.55, "elapsed_time": "12:59:30", "remaining_time": "0:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4286, "total_steps": 4438, "loss": 0.122, "learning_rate": 1.6018852070470437e-08, "epoch": 0.9656687413749402, "percentage": 96.58, "elapsed_time": "12:59:40", "remaining_time": "0:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4287, "total_steps": 4438, "loss": 0.1293, "learning_rate": 1.5808992731560225e-08, "epoch": 0.9658940490607486, "percentage": 96.6, "elapsed_time": "12:59:51", "remaining_time": "0:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4288, "total_steps": 4438, "loss": 0.1191, "learning_rate": 1.5600512771320462e-08, "epoch": 0.966119356746557, "percentage": 96.62, "elapsed_time": "13:00:01", "remaining_time": "0:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4289, "total_steps": 4438, "loss": 0.1227, "learning_rate": 1.5393412305512446e-08, "epoch": 0.9663446644323654, "percentage": 96.64, "elapsed_time": "13:00:11", "remaining_time": "0:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 4438, "loss": 0.1178, "learning_rate": 1.518769144913168e-08, "epoch": 0.9665699721181739, "percentage": 96.67, "elapsed_time": "13:00:20", "remaining_time": "0:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4291, "total_steps": 4438, "loss": 0.1206, "learning_rate": 1.4983350316406797e-08, "epoch": 0.9667952798039823, "percentage": 96.69, "elapsed_time": "13:00:31", "remaining_time": "0:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4292, "total_steps": 4438, "loss": 0.1177, "learning_rate": 1.4780389020800923e-08, "epoch": 0.9670205874897907, "percentage": 96.71, "elapsed_time": "13:00:42", "remaining_time": "0:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4293, "total_steps": 4438, "loss": 0.1173, "learning_rate": 1.4578807675011131e-08, "epoch": 0.9672458951755992, "percentage": 96.73, "elapsed_time": "13:00:52", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4294, "total_steps": 4438, "loss": 0.1269, "learning_rate": 1.4378606390967609e-08, "epoch": 0.9674712028614076, "percentage": 96.76, "elapsed_time": "13:01:03", "remaining_time": "0:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4295, "total_steps": 4438, "loss": 0.1272, "learning_rate": 1.4179785279835045e-08, "epoch": 0.9676965105472161, "percentage": 96.78, "elapsed_time": "13:01:13", "remaining_time": "0:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4296, "total_steps": 4438, "loss": 0.1198, "learning_rate": 1.3982344452011242e-08, "epoch": 0.9679218182330245, "percentage": 96.8, "elapsed_time": "13:01:23", "remaining_time": "0:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4297, "total_steps": 4438, "loss": 0.128, "learning_rate": 1.3786284017127949e-08, "epoch": 0.9681471259188329, "percentage": 96.82, "elapsed_time": "13:01:35", "remaining_time": "0:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4298, "total_steps": 4438, "loss": 0.1253, "learning_rate": 1.3591604084049747e-08, "epoch": 0.9683724336046413, "percentage": 96.85, "elapsed_time": "13:01:47", "remaining_time": "0:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4299, "total_steps": 4438, "loss": 0.1294, "learning_rate": 1.3398304760875725e-08, "epoch": 0.9685977412904497, "percentage": 96.87, "elapsed_time": "13:01:57", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 4438, "loss": 0.1279, "learning_rate": 1.3206386154937245e-08, "epoch": 0.9688230489762581, "percentage": 96.89, "elapsed_time": "13:02:09", "remaining_time": "0:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4301, "total_steps": 4438, "loss": 0.1372, "learning_rate": 1.30158483727999e-08, "epoch": 0.9690483566620667, "percentage": 96.91, "elapsed_time": "13:02:20", "remaining_time": "0:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4302, "total_steps": 4438, "loss": 0.1188, "learning_rate": 1.2826691520262114e-08, "epoch": 0.9692736643478751, "percentage": 96.94, "elapsed_time": "13:02:30", "remaining_time": "0:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4303, "total_steps": 4438, "loss": 0.1134, "learning_rate": 1.2638915702355702e-08, "epoch": 0.9694989720336835, "percentage": 96.96, "elapsed_time": "13:02:40", "remaining_time": "0:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4304, "total_steps": 4438, "loss": 0.1182, "learning_rate": 1.2452521023345598e-08, "epoch": 0.9697242797194919, "percentage": 96.98, "elapsed_time": "13:02:50", "remaining_time": "0:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4305, "total_steps": 4438, "loss": 0.1287, "learning_rate": 1.2267507586729566e-08, "epoch": 0.9699495874053004, "percentage": 97.0, "elapsed_time": "13:03:01", "remaining_time": "0:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4306, "total_steps": 4438, "loss": 0.1073, "learning_rate": 1.2083875495238761e-08, "epoch": 0.9701748950911088, "percentage": 97.03, "elapsed_time": "13:03:12", "remaining_time": "0:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4307, "total_steps": 4438, "loss": 0.1252, "learning_rate": 1.1901624850837734e-08, "epoch": 0.9704002027769172, "percentage": 97.05, "elapsed_time": "13:03:22", "remaining_time": "0:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4308, "total_steps": 4438, "loss": 0.1287, "learning_rate": 1.1720755754722757e-08, "epoch": 0.9706255104627256, "percentage": 97.07, "elapsed_time": "13:03:32", "remaining_time": "0:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4309, "total_steps": 4438, "loss": 0.1267, "learning_rate": 1.1541268307324049e-08, "epoch": 0.9708508181485341, "percentage": 97.09, "elapsed_time": "13:03:43", "remaining_time": "0:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 4438, "loss": 0.126, "learning_rate": 1.1363162608304112e-08, "epoch": 0.9710761258343426, "percentage": 97.12, "elapsed_time": "13:03:54", "remaining_time": "0:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4311, "total_steps": 4438, "loss": 0.1341, "learning_rate": 1.1186438756558838e-08, "epoch": 0.971301433520151, "percentage": 97.14, "elapsed_time": "13:04:04", "remaining_time": "0:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4312, "total_steps": 4438, "loss": 0.1297, "learning_rate": 1.1011096850215842e-08, "epoch": 0.9715267412059594, "percentage": 97.16, "elapsed_time": "13:04:14", "remaining_time": "0:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4313, "total_steps": 4438, "loss": 0.1246, "learning_rate": 1.083713698663641e-08, "epoch": 0.9717520488917678, "percentage": 97.18, "elapsed_time": "13:04:25", "remaining_time": "0:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4314, "total_steps": 4438, "loss": 0.1133, "learning_rate": 1.0664559262413831e-08, "epoch": 0.9719773565775762, "percentage": 97.21, "elapsed_time": "13:04:36", "remaining_time": "0:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4315, "total_steps": 4438, "loss": 0.1379, "learning_rate": 1.0493363773373677e-08, "epoch": 0.9722026642633846, "percentage": 97.23, "elapsed_time": "13:04:47", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4316, "total_steps": 4438, "loss": 0.1356, "learning_rate": 1.0323550614574907e-08, "epoch": 0.9724279719491932, "percentage": 97.25, "elapsed_time": "13:04:57", "remaining_time": "0:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4317, "total_steps": 4438, "loss": 0.118, "learning_rate": 1.0155119880308483e-08, "epoch": 0.9726532796350016, "percentage": 97.27, "elapsed_time": "13:05:07", "remaining_time": "0:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4318, "total_steps": 4438, "loss": 0.1198, "learning_rate": 9.988071664097376e-09, "epoch": 0.97287858732081, "percentage": 97.3, "elapsed_time": "13:05:17", "remaining_time": "0:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4319, "total_steps": 4438, "loss": 0.1275, "learning_rate": 9.822406058697665e-09, "epoch": 0.9731038950066184, "percentage": 97.32, "elapsed_time": "13:05:28", "remaining_time": "0:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 4438, "loss": 0.1261, "learning_rate": 9.658123156096599e-09, "epoch": 0.9733292026924268, "percentage": 97.34, "elapsed_time": "13:05:39", "remaining_time": "0:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4321, "total_steps": 4438, "loss": 0.128, "learning_rate": 9.4952230475151e-09, "epoch": 0.9735545103782353, "percentage": 97.36, "elapsed_time": "13:05:48", "remaining_time": "0:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4322, "total_steps": 4438, "loss": 0.1235, "learning_rate": 9.333705823404981e-09, "epoch": 0.9737798180640437, "percentage": 97.39, "elapsed_time": "13:05:59", "remaining_time": "0:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4323, "total_steps": 4438, "loss": 0.1303, "learning_rate": 9.17357157345089e-09, "epoch": 0.9740051257498521, "percentage": 97.41, "elapsed_time": "13:06:10", "remaining_time": "0:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4324, "total_steps": 4438, "loss": 0.1341, "learning_rate": 9.014820386569756e-09, "epoch": 0.9742304334356606, "percentage": 97.43, "elapsed_time": "13:06:21", "remaining_time": "0:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4325, "total_steps": 4438, "loss": 0.1199, "learning_rate": 8.85745235090968e-09, "epoch": 0.974455741121469, "percentage": 97.45, "elapsed_time": "13:06:32", "remaining_time": "0:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4326, "total_steps": 4438, "loss": 0.129, "learning_rate": 8.701467553851317e-09, "epoch": 0.9746810488072775, "percentage": 97.48, "elapsed_time": "13:06:42", "remaining_time": "0:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4327, "total_steps": 4438, "loss": 0.1244, "learning_rate": 8.54686608200761e-09, "epoch": 0.9749063564930859, "percentage": 97.5, "elapsed_time": "13:06:55", "remaining_time": "0:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4328, "total_steps": 4438, "loss": 0.1141, "learning_rate": 8.393648021222666e-09, "epoch": 0.9751316641788943, "percentage": 97.52, "elapsed_time": "13:07:05", "remaining_time": "0:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4329, "total_steps": 4438, "loss": 0.1147, "learning_rate": 8.241813456573156e-09, "epoch": 0.9753569718647027, "percentage": 97.54, "elapsed_time": "13:07:15", "remaining_time": "0:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 4438, "loss": 0.1253, "learning_rate": 8.09136247236636e-09, "epoch": 0.9755822795505111, "percentage": 97.57, "elapsed_time": "13:07:25", "remaining_time": "0:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4331, "total_steps": 4438, "loss": 0.1378, "learning_rate": 7.942295152142954e-09, "epoch": 0.9758075872363196, "percentage": 97.59, "elapsed_time": "13:07:37", "remaining_time": "0:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4332, "total_steps": 4438, "loss": 0.143, "learning_rate": 7.79461157867395e-09, "epoch": 0.9760328949221281, "percentage": 97.61, "elapsed_time": "13:07:50", "remaining_time": "0:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4333, "total_steps": 4438, "loss": 0.1181, "learning_rate": 7.64831183396264e-09, "epoch": 0.9762582026079365, "percentage": 97.63, "elapsed_time": "13:08:00", "remaining_time": "0:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4334, "total_steps": 4438, "loss": 0.1127, "learning_rate": 7.503395999244045e-09, "epoch": 0.9764835102937449, "percentage": 97.66, "elapsed_time": "13:08:11", "remaining_time": "0:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4335, "total_steps": 4438, "loss": 0.1123, "learning_rate": 7.359864154984353e-09, "epoch": 0.9767088179795533, "percentage": 97.68, "elapsed_time": "13:08:21", "remaining_time": "0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4336, "total_steps": 4438, "loss": 0.1273, "learning_rate": 7.217716380881479e-09, "epoch": 0.9769341256653618, "percentage": 97.7, "elapsed_time": "13:08:31", "remaining_time": "0:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4337, "total_steps": 4438, "loss": 0.1249, "learning_rate": 7.076952755864508e-09, "epoch": 0.9771594333511702, "percentage": 97.72, "elapsed_time": "13:08:42", "remaining_time": "0:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4338, "total_steps": 4438, "loss": 0.116, "learning_rate": 6.937573358094529e-09, "epoch": 0.9773847410369786, "percentage": 97.75, "elapsed_time": "13:08:51", "remaining_time": "0:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4339, "total_steps": 4438, "loss": 0.12, "learning_rate": 6.799578264963802e-09, "epoch": 0.977610048722787, "percentage": 97.77, "elapsed_time": "13:09:02", "remaining_time": "0:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 4438, "loss": 0.127, "learning_rate": 6.662967553095756e-09, "epoch": 0.9778353564085955, "percentage": 97.79, "elapsed_time": "13:09:12", "remaining_time": "0:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4341, "total_steps": 4438, "loss": 0.1168, "learning_rate": 6.527741298345269e-09, "epoch": 0.978060664094404, "percentage": 97.81, "elapsed_time": "13:09:23", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4342, "total_steps": 4438, "loss": 0.1213, "learning_rate": 6.3938995757981125e-09, "epoch": 0.9782859717802124, "percentage": 97.84, "elapsed_time": "13:09:35", "remaining_time": "0:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4343, "total_steps": 4438, "loss": 0.1163, "learning_rate": 6.2614424597720605e-09, "epoch": 0.9785112794660208, "percentage": 97.86, "elapsed_time": "13:09:45", "remaining_time": "0:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4344, "total_steps": 4438, "loss": 0.1096, "learning_rate": 6.1303700238152245e-09, "epoch": 0.9787365871518292, "percentage": 97.88, "elapsed_time": "13:09:54", "remaining_time": "0:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4345, "total_steps": 4438, "loss": 0.1191, "learning_rate": 6.00068234070772e-09, "epoch": 0.9789618948376376, "percentage": 97.9, "elapsed_time": "13:10:06", "remaining_time": "0:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4346, "total_steps": 4438, "loss": 0.1316, "learning_rate": 5.8723794824597226e-09, "epoch": 0.979187202523446, "percentage": 97.93, "elapsed_time": "13:10:16", "remaining_time": "0:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4347, "total_steps": 4438, "loss": 0.1289, "learning_rate": 5.745461520313411e-09, "epoch": 0.9794125102092545, "percentage": 97.95, "elapsed_time": "13:10:28", "remaining_time": "0:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4348, "total_steps": 4438, "loss": 0.1192, "learning_rate": 5.6199285247415805e-09, "epoch": 0.979637817895063, "percentage": 97.97, "elapsed_time": "13:10:38", "remaining_time": "0:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4349, "total_steps": 4438, "loss": 0.1176, "learning_rate": 5.495780565447917e-09, "epoch": 0.9798631255808714, "percentage": 97.99, "elapsed_time": "13:10:49", "remaining_time": "0:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 4438, "loss": 0.1291, "learning_rate": 5.373017711367001e-09, "epoch": 0.9800884332666798, "percentage": 98.02, "elapsed_time": "13:11:01", "remaining_time": "0:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4351, "total_steps": 4438, "loss": 0.1283, "learning_rate": 5.2516400306648615e-09, "epoch": 0.9803137409524882, "percentage": 98.04, "elapsed_time": "13:11:10", "remaining_time": "0:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4352, "total_steps": 4438, "loss": 0.1132, "learning_rate": 5.131647590737587e-09, "epoch": 0.9805390486382967, "percentage": 98.06, "elapsed_time": "13:11:20", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4353, "total_steps": 4438, "loss": 0.1225, "learning_rate": 5.0130404582127144e-09, "epoch": 0.9807643563241051, "percentage": 98.08, "elapsed_time": "13:11:30", "remaining_time": "0:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4354, "total_steps": 4438, "loss": 0.1251, "learning_rate": 4.895818698948396e-09, "epoch": 0.9809896640099135, "percentage": 98.11, "elapsed_time": "13:11:41", "remaining_time": "0:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4355, "total_steps": 4438, "loss": 0.1231, "learning_rate": 4.779982378033676e-09, "epoch": 0.9812149716957219, "percentage": 98.13, "elapsed_time": "13:11:53", "remaining_time": "0:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4356, "total_steps": 4438, "loss": 0.1235, "learning_rate": 4.6655315597876615e-09, "epoch": 0.9814402793815304, "percentage": 98.15, "elapsed_time": "13:12:03", "remaining_time": "0:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4357, "total_steps": 4438, "loss": 0.1131, "learning_rate": 4.552466307760905e-09, "epoch": 0.9816655870673389, "percentage": 98.17, "elapsed_time": "13:12:15", "remaining_time": "0:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4358, "total_steps": 4438, "loss": 0.1227, "learning_rate": 4.440786684734577e-09, "epoch": 0.9818908947531473, "percentage": 98.2, "elapsed_time": "13:12:26", "remaining_time": "0:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4359, "total_steps": 4438, "loss": 0.136, "learning_rate": 4.330492752719628e-09, "epoch": 0.9821162024389557, "percentage": 98.22, "elapsed_time": "13:12:37", "remaining_time": "0:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 4438, "loss": 0.1232, "learning_rate": 4.221584572958737e-09, "epoch": 0.9823415101247641, "percentage": 98.24, "elapsed_time": "13:12:47", "remaining_time": "0:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4361, "total_steps": 4438, "loss": 0.1126, "learning_rate": 4.114062205924085e-09, "epoch": 0.9825668178105725, "percentage": 98.26, "elapsed_time": "13:12:59", "remaining_time": "0:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4362, "total_steps": 4438, "loss": 0.1287, "learning_rate": 4.0079257113190275e-09, "epoch": 0.982792125496381, "percentage": 98.29, "elapsed_time": "13:13:08", "remaining_time": "0:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4363, "total_steps": 4438, "loss": 0.1131, "learning_rate": 3.903175148077531e-09, "epoch": 0.9830174331821895, "percentage": 98.31, "elapsed_time": "13:13:18", "remaining_time": "0:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4364, "total_steps": 4438, "loss": 0.1174, "learning_rate": 3.799810574363072e-09, "epoch": 0.9832427408679979, "percentage": 98.33, "elapsed_time": "13:13:29", "remaining_time": "0:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4365, "total_steps": 4438, "loss": 0.134, "learning_rate": 3.697832047570571e-09, "epoch": 0.9834680485538063, "percentage": 98.36, "elapsed_time": "13:13:41", "remaining_time": "0:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4366, "total_steps": 4438, "loss": 0.1262, "learning_rate": 3.597239624325011e-09, "epoch": 0.9836933562396147, "percentage": 98.38, "elapsed_time": "13:13:52", "remaining_time": "0:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4367, "total_steps": 4438, "loss": 0.1331, "learning_rate": 3.4980333604811567e-09, "epoch": 0.9839186639254232, "percentage": 98.4, "elapsed_time": "13:14:02", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4368, "total_steps": 4438, "loss": 0.1249, "learning_rate": 3.4002133111246673e-09, "epoch": 0.9841439716112316, "percentage": 98.42, "elapsed_time": "13:14:13", "remaining_time": "0:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4369, "total_steps": 4438, "loss": 0.1383, "learning_rate": 3.303779530571538e-09, "epoch": 0.98436927929704, "percentage": 98.45, "elapsed_time": "13:14:24", "remaining_time": "0:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 4438, "loss": 0.1213, "learning_rate": 3.208732072368104e-09, "epoch": 0.9845945869828484, "percentage": 98.47, "elapsed_time": "13:14:35", "remaining_time": "0:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4371, "total_steps": 4438, "loss": 0.1299, "learning_rate": 3.1150709892899256e-09, "epoch": 0.9848198946686569, "percentage": 98.49, "elapsed_time": "13:14:46", "remaining_time": "0:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4372, "total_steps": 4438, "loss": 0.122, "learning_rate": 3.022796333344291e-09, "epoch": 0.9850452023544654, "percentage": 98.51, "elapsed_time": "13:14:56", "remaining_time": "0:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4373, "total_steps": 4438, "loss": 0.1305, "learning_rate": 2.9319081557674377e-09, "epoch": 0.9852705100402738, "percentage": 98.54, "elapsed_time": "13:15:06", "remaining_time": "0:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4374, "total_steps": 4438, "loss": 0.1305, "learning_rate": 2.8424065070262186e-09, "epoch": 0.9854958177260822, "percentage": 98.56, "elapsed_time": "13:15:16", "remaining_time": "0:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4375, "total_steps": 4438, "loss": 0.1351, "learning_rate": 2.754291436817824e-09, "epoch": 0.9857211254118906, "percentage": 98.58, "elapsed_time": "13:15:27", "remaining_time": "0:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4376, "total_steps": 4438, "loss": 0.122, "learning_rate": 2.6675629940689508e-09, "epoch": 0.985946433097699, "percentage": 98.6, "elapsed_time": "13:15:39", "remaining_time": "0:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4377, "total_steps": 4438, "loss": 0.1188, "learning_rate": 2.582221226936632e-09, "epoch": 0.9861717407835074, "percentage": 98.63, "elapsed_time": "13:15:49", "remaining_time": "0:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4378, "total_steps": 4438, "loss": 0.1195, "learning_rate": 2.4982661828085175e-09, "epoch": 0.9863970484693159, "percentage": 98.65, "elapsed_time": "13:15:59", "remaining_time": "0:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4379, "total_steps": 4438, "loss": 0.1182, "learning_rate": 2.415697908300929e-09, "epoch": 0.9866223561551244, "percentage": 98.67, "elapsed_time": "13:16:10", "remaining_time": "0:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 4438, "loss": 0.1243, "learning_rate": 2.3345164492616367e-09, "epoch": 0.9868476638409328, "percentage": 98.69, "elapsed_time": "13:16:20", "remaining_time": "0:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4381, "total_steps": 4438, "loss": 0.1131, "learning_rate": 2.2547218507673606e-09, "epoch": 0.9870729715267412, "percentage": 98.72, "elapsed_time": "13:16:32", "remaining_time": "0:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4382, "total_steps": 4438, "loss": 0.1351, "learning_rate": 2.1763141571248813e-09, "epoch": 0.9872982792125496, "percentage": 98.74, "elapsed_time": "13:16:43", "remaining_time": "0:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4383, "total_steps": 4438, "loss": 0.1264, "learning_rate": 2.0992934118715948e-09, "epoch": 0.9875235868983581, "percentage": 98.76, "elapsed_time": "13:16:53", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4384, "total_steps": 4438, "loss": 0.1272, "learning_rate": 2.0236596577738466e-09, "epoch": 0.9877488945841665, "percentage": 98.78, "elapsed_time": "13:17:04", "remaining_time": "0:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4385, "total_steps": 4438, "loss": 0.1094, "learning_rate": 1.9494129368280432e-09, "epoch": 0.9879742022699749, "percentage": 98.81, "elapsed_time": "13:17:14", "remaining_time": "0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4386, "total_steps": 4438, "loss": 0.1153, "learning_rate": 1.876553290261207e-09, "epoch": 0.9881995099557833, "percentage": 98.83, "elapsed_time": "13:17:25", "remaining_time": "0:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4387, "total_steps": 4438, "loss": 0.115, "learning_rate": 1.8050807585293095e-09, "epoch": 0.9884248176415918, "percentage": 98.85, "elapsed_time": "13:17:37", "remaining_time": "0:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4388, "total_steps": 4438, "loss": 0.1285, "learning_rate": 1.7349953813183828e-09, "epoch": 0.9886501253274003, "percentage": 98.87, "elapsed_time": "13:17:49", "remaining_time": "0:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4389, "total_steps": 4438, "loss": 0.1106, "learning_rate": 1.6662971975439645e-09, "epoch": 0.9888754330132087, "percentage": 98.9, "elapsed_time": "13:17:59", "remaining_time": "0:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 4438, "loss": 0.1268, "learning_rate": 1.5989862453522075e-09, "epoch": 0.9891007406990171, "percentage": 98.92, "elapsed_time": "13:18:11", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4391, "total_steps": 4438, "loss": 0.1241, "learning_rate": 1.5330625621176598e-09, "epoch": 0.9893260483848255, "percentage": 98.94, "elapsed_time": "13:18:21", "remaining_time": "0:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4392, "total_steps": 4438, "loss": 0.1174, "learning_rate": 1.468526184445762e-09, "epoch": 0.9895513560706339, "percentage": 98.96, "elapsed_time": "13:18:33", "remaining_time": "0:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4393, "total_steps": 4438, "loss": 0.131, "learning_rate": 1.4053771481711832e-09, "epoch": 0.9897766637564424, "percentage": 98.99, "elapsed_time": "13:18:44", "remaining_time": "0:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4394, "total_steps": 4438, "loss": 0.1299, "learning_rate": 1.343615488357819e-09, "epoch": 0.9900019714422508, "percentage": 99.01, "elapsed_time": "13:18:55", "remaining_time": "0:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4395, "total_steps": 4438, "loss": 0.1177, "learning_rate": 1.2832412393001814e-09, "epoch": 0.9902272791280593, "percentage": 99.03, "elapsed_time": "13:19:05", "remaining_time": "0:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4396, "total_steps": 4438, "loss": 0.1126, "learning_rate": 1.2242544345211772e-09, "epoch": 0.9904525868138677, "percentage": 99.05, "elapsed_time": "13:19:15", "remaining_time": "0:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4397, "total_steps": 4438, "loss": 0.129, "learning_rate": 1.1666551067746058e-09, "epoch": 0.9906778944996761, "percentage": 99.08, "elapsed_time": "13:19:26", "remaining_time": "0:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4398, "total_steps": 4438, "loss": 0.1242, "learning_rate": 1.1104432880429394e-09, "epoch": 0.9909032021854846, "percentage": 99.1, "elapsed_time": "13:19:36", "remaining_time": "0:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4399, "total_steps": 4438, "loss": 0.1182, "learning_rate": 1.0556190095384333e-09, "epoch": 0.991128509871293, "percentage": 99.12, "elapsed_time": "13:19:47", "remaining_time": "0:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 4438, "loss": 0.126, "learning_rate": 1.0021823017028475e-09, "epoch": 0.9913538175571014, "percentage": 99.14, "elapsed_time": "13:19:57", "remaining_time": "0:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4401, "total_steps": 4438, "loss": 0.138, "learning_rate": 9.501331942080029e-10, "epoch": 0.9915791252429098, "percentage": 99.17, "elapsed_time": "13:20:07", "remaining_time": "0:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4402, "total_steps": 4438, "loss": 0.1298, "learning_rate": 8.994717159546695e-10, "epoch": 0.9918044329287182, "percentage": 99.19, "elapsed_time": "13:20:18", "remaining_time": "0:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4403, "total_steps": 4438, "loss": 0.1176, "learning_rate": 8.501978950734014e-10, "epoch": 0.9920297406145268, "percentage": 99.21, "elapsed_time": "13:20:28", "remaining_time": "0:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4404, "total_steps": 4438, "loss": 0.1194, "learning_rate": 8.023117589237017e-10, "epoch": 0.9922550483003352, "percentage": 99.23, "elapsed_time": "13:20:39", "remaining_time": "0:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4405, "total_steps": 4438, "loss": 0.1322, "learning_rate": 7.558133340954121e-10, "epoch": 0.9924803559861436, "percentage": 99.26, "elapsed_time": "13:20:49", "remaining_time": "0:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4406, "total_steps": 4438, "loss": 0.1196, "learning_rate": 7.10702646406769e-10, "epoch": 0.992705663671952, "percentage": 99.28, "elapsed_time": "13:21:01", "remaining_time": "0:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4407, "total_steps": 4438, "loss": 0.1269, "learning_rate": 6.669797209069018e-10, "epoch": 0.9929309713577604, "percentage": 99.3, "elapsed_time": "13:21:12", "remaining_time": "0:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4408, "total_steps": 4438, "loss": 0.1145, "learning_rate": 6.246445818727798e-10, "epoch": 0.9931562790435688, "percentage": 99.32, "elapsed_time": "13:21:22", "remaining_time": "0:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4409, "total_steps": 4438, "loss": 0.1295, "learning_rate": 5.836972528119878e-10, "epoch": 0.9933815867293773, "percentage": 99.35, "elapsed_time": "13:21:32", "remaining_time": "0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 4438, "loss": 0.1168, "learning_rate": 5.44137756460783e-10, "epoch": 0.9936068944151858, "percentage": 99.37, "elapsed_time": "13:21:41", "remaining_time": "0:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4411, "total_steps": 4438, "loss": 0.1196, "learning_rate": 5.059661147852057e-10, "epoch": 0.9938322021009942, "percentage": 99.39, "elapsed_time": "13:21:51", "remaining_time": "0:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4412, "total_steps": 4438, "loss": 0.1235, "learning_rate": 4.691823489805236e-10, "epoch": 0.9940575097868026, "percentage": 99.41, "elapsed_time": "13:22:03", "remaining_time": "0:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4413, "total_steps": 4438, "loss": 0.1256, "learning_rate": 4.3378647947150965e-10, "epoch": 0.994282817472611, "percentage": 99.44, "elapsed_time": "13:22:14", "remaining_time": "0:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4414, "total_steps": 4438, "loss": 0.1282, "learning_rate": 3.9977852591188694e-10, "epoch": 0.9945081251584195, "percentage": 99.46, "elapsed_time": "13:22:25", "remaining_time": "0:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4415, "total_steps": 4438, "loss": 0.1234, "learning_rate": 3.671585071854389e-10, "epoch": 0.9947334328442279, "percentage": 99.48, "elapsed_time": "13:22:36", "remaining_time": "0:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4416, "total_steps": 4438, "loss": 0.1274, "learning_rate": 3.3592644140434393e-10, "epoch": 0.9949587405300363, "percentage": 99.5, "elapsed_time": "13:22:46", "remaining_time": "0:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4417, "total_steps": 4438, "loss": 0.1245, "learning_rate": 3.0608234591084083e-10, "epoch": 0.9951840482158447, "percentage": 99.53, "elapsed_time": "13:22:57", "remaining_time": "0:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4418, "total_steps": 4438, "loss": 0.1331, "learning_rate": 2.776262372761185e-10, "epoch": 0.9954093559016532, "percentage": 99.55, "elapsed_time": "13:23:10", "remaining_time": "0:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4419, "total_steps": 4438, "loss": 0.1245, "learning_rate": 2.505581313011485e-10, "epoch": 0.9956346635874617, "percentage": 99.57, "elapsed_time": "13:23:21", "remaining_time": "0:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 4438, "loss": 0.1333, "learning_rate": 2.2487804301557503e-10, "epoch": 0.9958599712732701, "percentage": 99.59, "elapsed_time": "13:23:32", "remaining_time": "0:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4421, "total_steps": 4438, "loss": 0.1195, "learning_rate": 2.0058598667854755e-10, "epoch": 0.9960852789590785, "percentage": 99.62, "elapsed_time": "13:23:43", "remaining_time": "0:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4422, "total_steps": 4438, "loss": 0.1156, "learning_rate": 1.776819757787207e-10, "epoch": 0.9963105866448869, "percentage": 99.64, "elapsed_time": "13:23:52", "remaining_time": "0:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4423, "total_steps": 4438, "loss": 0.1284, "learning_rate": 1.561660230336992e-10, "epoch": 0.9965358943306953, "percentage": 99.66, "elapsed_time": "13:24:01", "remaining_time": "0:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4424, "total_steps": 4438, "loss": 0.1233, "learning_rate": 1.3603814039031547e-10, "epoch": 0.9967612020165038, "percentage": 99.68, "elapsed_time": "13:24:13", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4425, "total_steps": 4438, "loss": 0.1048, "learning_rate": 1.1729833902518473e-10, "epoch": 0.9969865097023122, "percentage": 99.71, "elapsed_time": "13:24:24", "remaining_time": "0:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4426, "total_steps": 4438, "loss": 0.1301, "learning_rate": 9.994662934387223e-11, "epoch": 0.9972118173881207, "percentage": 99.73, "elapsed_time": "13:24:35", "remaining_time": "0:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4427, "total_steps": 4438, "loss": 0.1247, "learning_rate": 8.398302098061583e-11, "epoch": 0.9974371250739291, "percentage": 99.75, "elapsed_time": "13:24:46", "remaining_time": "0:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4428, "total_steps": 4438, "loss": 0.1202, "learning_rate": 6.94075227999913e-11, "epoch": 0.9976624327597375, "percentage": 99.77, "elapsed_time": "13:24:57", "remaining_time": "0:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4429, "total_steps": 4438, "loss": 0.1231, "learning_rate": 5.62201428946918e-11, "epoch": 0.997887740445546, "percentage": 99.8, "elapsed_time": "13:25:07", "remaining_time": "0:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 4438, "loss": 0.1166, "learning_rate": 4.44208885877484e-11, "epoch": 0.9981130481313544, "percentage": 99.82, "elapsed_time": "13:25:18", "remaining_time": "0:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4431, "total_steps": 4438, "loss": 0.1232, "learning_rate": 3.400976643030962e-11, "epoch": 0.9983383558171628, "percentage": 99.84, "elapsed_time": "13:25:28", "remaining_time": "0:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4432, "total_steps": 4438, "loss": 0.1304, "learning_rate": 2.498678220386186e-11, "epoch": 0.9985636635029712, "percentage": 99.86, "elapsed_time": "13:25:39", "remaining_time": "0:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4433, "total_steps": 4438, "loss": 0.1302, "learning_rate": 1.735194091800896e-11, "epoch": 0.9987889711887796, "percentage": 99.89, "elapsed_time": "13:25:50", "remaining_time": "0:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4434, "total_steps": 4438, "loss": 0.128, "learning_rate": 1.1105246812137538e-11, "epoch": 0.9990142788745882, "percentage": 99.91, "elapsed_time": "13:26:00", "remaining_time": "0:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4435, "total_steps": 4438, "loss": 0.1272, "learning_rate": 6.246703355139438e-12, "epoch": 0.9992395865603966, "percentage": 99.93, "elapsed_time": "13:26:11", "remaining_time": "0:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4436, "total_steps": 4438, "loss": 0.1159, "learning_rate": 2.7763132445790543e-12, "epoch": 0.999464894246205, "percentage": 99.95, "elapsed_time": "13:26:21", "remaining_time": "0:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4437, "total_steps": 4438, "loss": 0.1275, "learning_rate": 6.940784075259999e-13, "epoch": 0.9996902019320134, "percentage": 99.98, "elapsed_time": "13:26:31", "remaining_time": "0:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4438, "total_steps": 4438, "loss": 0.1104, "learning_rate": 0.0, "epoch": 0.9999155096178218, "percentage": 100.0, "elapsed_time": "13:26:42", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4438, "total_steps": 4438, "epoch": 0.9999155096178218, "percentage": 100.0, "elapsed_time": "13:26:42", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}