sedrickkeh's picture
Training in progress, epoch 2
ac398d4 verified
{"current_steps": 10, "total_steps": 1617, "loss": 0.9092, "lr": 5e-06, "epoch": 0.018548574078367727, "percentage": 0.62, "elapsed_time": "0:09:37", "remaining_time": "1 day, 1:46:52"}
{"current_steps": 20, "total_steps": 1617, "loss": 0.8033, "lr": 5e-06, "epoch": 0.037097148156735454, "percentage": 1.24, "elapsed_time": "0:19:11", "remaining_time": "1 day, 1:31:50"}
{"current_steps": 30, "total_steps": 1617, "loss": 0.7597, "lr": 5e-06, "epoch": 0.055645722235103175, "percentage": 1.86, "elapsed_time": "0:28:43", "remaining_time": "1 day, 1:19:54"}
{"current_steps": 40, "total_steps": 1617, "loss": 0.7382, "lr": 5e-06, "epoch": 0.07419429631347091, "percentage": 2.47, "elapsed_time": "0:38:17", "remaining_time": "1 day, 1:09:25"}
{"current_steps": 50, "total_steps": 1617, "loss": 0.7179, "lr": 5e-06, "epoch": 0.09274287039183862, "percentage": 3.09, "elapsed_time": "0:47:50", "remaining_time": "1 day, 0:59:24"}
{"current_steps": 60, "total_steps": 1617, "loss": 0.6967, "lr": 5e-06, "epoch": 0.11129144447020635, "percentage": 3.71, "elapsed_time": "0:57:24", "remaining_time": "1 day, 0:49:35"}
{"current_steps": 70, "total_steps": 1617, "loss": 0.6892, "lr": 5e-06, "epoch": 0.12984001854857408, "percentage": 4.33, "elapsed_time": "1:06:57", "remaining_time": "1 day, 0:39:50"}
{"current_steps": 80, "total_steps": 1617, "loss": 0.6645, "lr": 5e-06, "epoch": 0.14838859262694182, "percentage": 4.95, "elapsed_time": "1:16:31", "remaining_time": "1 day, 0:30:11"}
{"current_steps": 90, "total_steps": 1617, "loss": 0.6739, "lr": 5e-06, "epoch": 0.16693716670530953, "percentage": 5.57, "elapsed_time": "1:26:05", "remaining_time": "1 day, 0:20:36"}
{"current_steps": 100, "total_steps": 1617, "loss": 0.6596, "lr": 5e-06, "epoch": 0.18548574078367724, "percentage": 6.18, "elapsed_time": "1:35:38", "remaining_time": "1 day, 0:10:55"}
{"current_steps": 110, "total_steps": 1617, "loss": 0.6419, "lr": 5e-06, "epoch": 0.20403431486204499, "percentage": 6.8, "elapsed_time": "1:45:12", "remaining_time": "1 day, 0:01:15"}
{"current_steps": 120, "total_steps": 1617, "loss": 0.6475, "lr": 5e-06, "epoch": 0.2225828889404127, "percentage": 7.42, "elapsed_time": "1:54:45", "remaining_time": "23:51:37"}
{"current_steps": 130, "total_steps": 1617, "loss": 0.6394, "lr": 5e-06, "epoch": 0.24113146301878044, "percentage": 8.04, "elapsed_time": "2:04:19", "remaining_time": "23:42:02"}
{"current_steps": 140, "total_steps": 1617, "loss": 0.6349, "lr": 5e-06, "epoch": 0.25968003709714815, "percentage": 8.66, "elapsed_time": "2:13:52", "remaining_time": "23:32:25"}
{"current_steps": 150, "total_steps": 1617, "loss": 0.6307, "lr": 5e-06, "epoch": 0.2782286111755159, "percentage": 9.28, "elapsed_time": "2:23:25", "remaining_time": "23:22:46"}
{"current_steps": 160, "total_steps": 1617, "loss": 0.6221, "lr": 5e-06, "epoch": 0.29677718525388364, "percentage": 9.89, "elapsed_time": "2:32:59", "remaining_time": "23:13:07"}
{"current_steps": 170, "total_steps": 1617, "loss": 0.6321, "lr": 5e-06, "epoch": 0.3153257593322513, "percentage": 10.51, "elapsed_time": "2:42:32", "remaining_time": "23:03:27"}
{"current_steps": 180, "total_steps": 1617, "loss": 0.6306, "lr": 5e-06, "epoch": 0.33387433341061906, "percentage": 11.13, "elapsed_time": "2:52:05", "remaining_time": "22:53:51"}
{"current_steps": 190, "total_steps": 1617, "loss": 0.632, "lr": 5e-06, "epoch": 0.3524229074889868, "percentage": 11.75, "elapsed_time": "3:01:38", "remaining_time": "22:44:14"}
{"current_steps": 200, "total_steps": 1617, "loss": 0.633, "lr": 5e-06, "epoch": 0.3709714815673545, "percentage": 12.37, "elapsed_time": "3:11:11", "remaining_time": "22:34:36"}
{"current_steps": 210, "total_steps": 1617, "loss": 0.6406, "lr": 5e-06, "epoch": 0.38952005564572223, "percentage": 12.99, "elapsed_time": "3:20:44", "remaining_time": "22:24:58"}
{"current_steps": 220, "total_steps": 1617, "loss": 0.6246, "lr": 5e-06, "epoch": 0.40806862972408997, "percentage": 13.61, "elapsed_time": "3:30:17", "remaining_time": "22:15:18"}
{"current_steps": 230, "total_steps": 1617, "loss": 0.607, "lr": 5e-06, "epoch": 0.4266172038024577, "percentage": 14.22, "elapsed_time": "3:39:49", "remaining_time": "22:05:39"}
{"current_steps": 240, "total_steps": 1617, "loss": 0.6243, "lr": 5e-06, "epoch": 0.4451657778808254, "percentage": 14.84, "elapsed_time": "3:49:22", "remaining_time": "21:55:59"}
{"current_steps": 250, "total_steps": 1617, "loss": 0.6171, "lr": 5e-06, "epoch": 0.46371435195919314, "percentage": 15.46, "elapsed_time": "3:58:54", "remaining_time": "21:46:21"}
{"current_steps": 260, "total_steps": 1617, "loss": 0.606, "lr": 5e-06, "epoch": 0.4822629260375609, "percentage": 16.08, "elapsed_time": "4:08:27", "remaining_time": "21:36:43"}
{"current_steps": 270, "total_steps": 1617, "loss": 0.6102, "lr": 5e-06, "epoch": 0.5008115001159286, "percentage": 16.7, "elapsed_time": "4:17:59", "remaining_time": "21:27:06"}
{"current_steps": 280, "total_steps": 1617, "loss": 0.616, "lr": 5e-06, "epoch": 0.5193600741942963, "percentage": 17.32, "elapsed_time": "4:27:32", "remaining_time": "21:17:30"}
{"current_steps": 290, "total_steps": 1617, "loss": 0.6142, "lr": 5e-06, "epoch": 0.537908648272664, "percentage": 17.93, "elapsed_time": "4:37:04", "remaining_time": "21:07:52"}
{"current_steps": 300, "total_steps": 1617, "loss": 0.6079, "lr": 5e-06, "epoch": 0.5564572223510318, "percentage": 18.55, "elapsed_time": "4:46:37", "remaining_time": "20:58:16"}
{"current_steps": 310, "total_steps": 1617, "loss": 0.6055, "lr": 5e-06, "epoch": 0.5750057964293995, "percentage": 19.17, "elapsed_time": "4:56:09", "remaining_time": "20:48:39"}
{"current_steps": 320, "total_steps": 1617, "loss": 0.6028, "lr": 5e-06, "epoch": 0.5935543705077673, "percentage": 19.79, "elapsed_time": "5:05:42", "remaining_time": "20:39:05"}
{"current_steps": 330, "total_steps": 1617, "loss": 0.6086, "lr": 5e-06, "epoch": 0.6121029445861349, "percentage": 20.41, "elapsed_time": "5:15:16", "remaining_time": "20:29:35"}
{"current_steps": 340, "total_steps": 1617, "loss": 0.603, "lr": 5e-06, "epoch": 0.6306515186645026, "percentage": 21.03, "elapsed_time": "5:24:50", "remaining_time": "20:20:02"}
{"current_steps": 350, "total_steps": 1617, "loss": 0.6058, "lr": 5e-06, "epoch": 0.6492000927428704, "percentage": 21.65, "elapsed_time": "5:34:22", "remaining_time": "20:10:27"}
{"current_steps": 360, "total_steps": 1617, "loss": 0.5953, "lr": 5e-06, "epoch": 0.6677486668212381, "percentage": 22.26, "elapsed_time": "5:43:55", "remaining_time": "20:00:53"}
{"current_steps": 370, "total_steps": 1617, "loss": 0.6024, "lr": 5e-06, "epoch": 0.6862972408996059, "percentage": 22.88, "elapsed_time": "5:53:29", "remaining_time": "19:51:20"}
{"current_steps": 380, "total_steps": 1617, "loss": 0.607, "lr": 5e-06, "epoch": 0.7048458149779736, "percentage": 23.5, "elapsed_time": "6:03:01", "remaining_time": "19:41:44"}
{"current_steps": 390, "total_steps": 1617, "loss": 0.5974, "lr": 5e-06, "epoch": 0.7233943890563413, "percentage": 24.12, "elapsed_time": "6:12:34", "remaining_time": "19:32:11"}
{"current_steps": 400, "total_steps": 1617, "loss": 0.5972, "lr": 5e-06, "epoch": 0.741942963134709, "percentage": 24.74, "elapsed_time": "6:22:07", "remaining_time": "19:22:38"}
{"current_steps": 410, "total_steps": 1617, "loss": 0.5816, "lr": 5e-06, "epoch": 0.7604915372130767, "percentage": 25.36, "elapsed_time": "6:31:41", "remaining_time": "19:13:05"}
{"current_steps": 420, "total_steps": 1617, "loss": 0.5757, "lr": 5e-06, "epoch": 0.7790401112914445, "percentage": 25.97, "elapsed_time": "6:41:14", "remaining_time": "19:03:32"}
{"current_steps": 430, "total_steps": 1617, "loss": 0.595, "lr": 5e-06, "epoch": 0.7975886853698122, "percentage": 26.59, "elapsed_time": "6:50:47", "remaining_time": "18:53:58"}
{"current_steps": 440, "total_steps": 1617, "loss": 0.5936, "lr": 5e-06, "epoch": 0.8161372594481799, "percentage": 27.21, "elapsed_time": "7:00:21", "remaining_time": "18:44:26"}
{"current_steps": 450, "total_steps": 1617, "loss": 0.5856, "lr": 5e-06, "epoch": 0.8346858335265477, "percentage": 27.83, "elapsed_time": "7:09:54", "remaining_time": "18:34:53"}
{"current_steps": 460, "total_steps": 1617, "loss": 0.5943, "lr": 5e-06, "epoch": 0.8532344076049154, "percentage": 28.45, "elapsed_time": "7:19:27", "remaining_time": "18:25:21"}
{"current_steps": 470, "total_steps": 1617, "loss": 0.5833, "lr": 5e-06, "epoch": 0.871782981683283, "percentage": 29.07, "elapsed_time": "7:29:01", "remaining_time": "18:15:48"}
{"current_steps": 480, "total_steps": 1617, "loss": 0.599, "lr": 5e-06, "epoch": 0.8903315557616508, "percentage": 29.68, "elapsed_time": "7:38:34", "remaining_time": "18:06:14"}
{"current_steps": 490, "total_steps": 1617, "loss": 0.5768, "lr": 5e-06, "epoch": 0.9088801298400185, "percentage": 30.3, "elapsed_time": "7:48:07", "remaining_time": "17:56:40"}
{"current_steps": 500, "total_steps": 1617, "loss": 0.5839, "lr": 5e-06, "epoch": 0.9274287039183863, "percentage": 30.92, "elapsed_time": "7:57:40", "remaining_time": "17:47:07"}
{"current_steps": 510, "total_steps": 1617, "loss": 0.5797, "lr": 5e-06, "epoch": 0.945977277996754, "percentage": 31.54, "elapsed_time": "8:07:12", "remaining_time": "17:37:31"}
{"current_steps": 520, "total_steps": 1617, "loss": 0.5833, "lr": 5e-06, "epoch": 0.9645258520751218, "percentage": 32.16, "elapsed_time": "8:16:45", "remaining_time": "17:27:57"}
{"current_steps": 530, "total_steps": 1617, "loss": 0.5897, "lr": 5e-06, "epoch": 0.9830744261534895, "percentage": 32.78, "elapsed_time": "8:26:17", "remaining_time": "17:18:23"}
{"current_steps": 539, "total_steps": 1617, "eval_loss": 0.5783212780952454, "epoch": 0.9997681428240204, "percentage": 33.33, "elapsed_time": "8:44:26", "remaining_time": "17:28:53"}
{"current_steps": 540, "total_steps": 1617, "loss": 0.6241, "lr": 5e-06, "epoch": 1.0016230002318571, "percentage": 33.4, "elapsed_time": "8:46:26", "remaining_time": "17:29:56"}
{"current_steps": 550, "total_steps": 1617, "loss": 0.5375, "lr": 5e-06, "epoch": 1.0201715743102249, "percentage": 34.01, "elapsed_time": "8:55:59", "remaining_time": "17:19:49"}
{"current_steps": 560, "total_steps": 1617, "loss": 0.5428, "lr": 5e-06, "epoch": 1.0387201483885926, "percentage": 34.63, "elapsed_time": "9:05:33", "remaining_time": "17:09:44"}
{"current_steps": 570, "total_steps": 1617, "loss": 0.5265, "lr": 5e-06, "epoch": 1.0572687224669604, "percentage": 35.25, "elapsed_time": "9:15:06", "remaining_time": "16:59:39"}
{"current_steps": 580, "total_steps": 1617, "loss": 0.5341, "lr": 5e-06, "epoch": 1.075817296545328, "percentage": 35.87, "elapsed_time": "9:24:39", "remaining_time": "16:49:34"}
{"current_steps": 590, "total_steps": 1617, "loss": 0.525, "lr": 5e-06, "epoch": 1.0943658706236958, "percentage": 36.49, "elapsed_time": "9:34:12", "remaining_time": "16:39:31"}
{"current_steps": 600, "total_steps": 1617, "loss": 0.538, "lr": 5e-06, "epoch": 1.1129144447020636, "percentage": 37.11, "elapsed_time": "9:43:46", "remaining_time": "16:29:30"}
{"current_steps": 610, "total_steps": 1617, "loss": 0.5298, "lr": 5e-06, "epoch": 1.1314630187804313, "percentage": 37.72, "elapsed_time": "9:53:20", "remaining_time": "16:19:29"}
{"current_steps": 620, "total_steps": 1617, "loss": 0.5234, "lr": 5e-06, "epoch": 1.150011592858799, "percentage": 38.34, "elapsed_time": "10:02:54", "remaining_time": "16:09:30"}
{"current_steps": 630, "total_steps": 1617, "loss": 0.5314, "lr": 5e-06, "epoch": 1.1685601669371668, "percentage": 38.96, "elapsed_time": "10:12:28", "remaining_time": "15:59:31"}
{"current_steps": 640, "total_steps": 1617, "loss": 0.5314, "lr": 5e-06, "epoch": 1.1871087410155345, "percentage": 39.58, "elapsed_time": "10:22:01", "remaining_time": "15:49:34"}
{"current_steps": 650, "total_steps": 1617, "loss": 0.5359, "lr": 5e-06, "epoch": 1.205657315093902, "percentage": 40.2, "elapsed_time": "10:31:35", "remaining_time": "15:39:37"}
{"current_steps": 660, "total_steps": 1617, "loss": 0.5314, "lr": 5e-06, "epoch": 1.2242058891722698, "percentage": 40.82, "elapsed_time": "10:41:09", "remaining_time": "15:29:40"}
{"current_steps": 670, "total_steps": 1617, "loss": 0.5305, "lr": 5e-06, "epoch": 1.2427544632506375, "percentage": 41.43, "elapsed_time": "10:50:42", "remaining_time": "15:19:43"}
{"current_steps": 680, "total_steps": 1617, "loss": 0.5427, "lr": 5e-06, "epoch": 1.2613030373290053, "percentage": 42.05, "elapsed_time": "11:00:15", "remaining_time": "15:09:48"}
{"current_steps": 690, "total_steps": 1617, "loss": 0.5304, "lr": 5e-06, "epoch": 1.279851611407373, "percentage": 42.67, "elapsed_time": "11:09:48", "remaining_time": "14:59:52"}
{"current_steps": 700, "total_steps": 1617, "loss": 0.5301, "lr": 5e-06, "epoch": 1.2984001854857408, "percentage": 43.29, "elapsed_time": "11:19:22", "remaining_time": "14:49:58"}
{"current_steps": 710, "total_steps": 1617, "loss": 0.5216, "lr": 5e-06, "epoch": 1.3169487595641085, "percentage": 43.91, "elapsed_time": "11:28:55", "remaining_time": "14:40:04"}
{"current_steps": 720, "total_steps": 1617, "loss": 0.5465, "lr": 5e-06, "epoch": 1.3354973336424762, "percentage": 44.53, "elapsed_time": "11:38:28", "remaining_time": "14:30:11"}
{"current_steps": 730, "total_steps": 1617, "loss": 0.5432, "lr": 5e-06, "epoch": 1.354045907720844, "percentage": 45.15, "elapsed_time": "11:48:01", "remaining_time": "14:20:18"}
{"current_steps": 740, "total_steps": 1617, "loss": 0.5318, "lr": 5e-06, "epoch": 1.3725944817992117, "percentage": 45.76, "elapsed_time": "11:57:35", "remaining_time": "14:10:25"}
{"current_steps": 750, "total_steps": 1617, "loss": 0.5282, "lr": 5e-06, "epoch": 1.3911430558775795, "percentage": 46.38, "elapsed_time": "12:07:08", "remaining_time": "14:00:34"}
{"current_steps": 760, "total_steps": 1617, "loss": 0.5204, "lr": 5e-06, "epoch": 1.4096916299559472, "percentage": 47.0, "elapsed_time": "12:16:41", "remaining_time": "13:50:43"}
{"current_steps": 770, "total_steps": 1617, "loss": 0.5262, "lr": 5e-06, "epoch": 1.428240204034315, "percentage": 47.62, "elapsed_time": "12:26:15", "remaining_time": "13:40:53"}
{"current_steps": 780, "total_steps": 1617, "loss": 0.5264, "lr": 5e-06, "epoch": 1.4467887781126825, "percentage": 48.24, "elapsed_time": "12:35:49", "remaining_time": "13:31:03"}
{"current_steps": 790, "total_steps": 1617, "loss": 0.5264, "lr": 5e-06, "epoch": 1.4653373521910504, "percentage": 48.86, "elapsed_time": "12:45:22", "remaining_time": "13:21:13"}
{"current_steps": 800, "total_steps": 1617, "loss": 0.5268, "lr": 5e-06, "epoch": 1.483885926269418, "percentage": 49.47, "elapsed_time": "12:54:56", "remaining_time": "13:11:24"}
{"current_steps": 810, "total_steps": 1617, "loss": 0.5301, "lr": 5e-06, "epoch": 1.502434500347786, "percentage": 50.09, "elapsed_time": "13:04:29", "remaining_time": "13:01:35"}
{"current_steps": 820, "total_steps": 1617, "loss": 0.5193, "lr": 5e-06, "epoch": 1.5209830744261534, "percentage": 50.71, "elapsed_time": "13:14:03", "remaining_time": "12:51:47"}
{"current_steps": 830, "total_steps": 1617, "loss": 0.5216, "lr": 5e-06, "epoch": 1.5395316485045212, "percentage": 51.33, "elapsed_time": "13:23:37", "remaining_time": "12:41:59"}
{"current_steps": 840, "total_steps": 1617, "loss": 0.5259, "lr": 5e-06, "epoch": 1.558080222582889, "percentage": 51.95, "elapsed_time": "13:33:10", "remaining_time": "12:32:11"}
{"current_steps": 850, "total_steps": 1617, "loss": 0.5241, "lr": 5e-06, "epoch": 1.5766287966612567, "percentage": 52.57, "elapsed_time": "13:42:44", "remaining_time": "12:22:24"}
{"current_steps": 860, "total_steps": 1617, "loss": 0.5267, "lr": 5e-06, "epoch": 1.5951773707396244, "percentage": 53.18, "elapsed_time": "13:52:18", "remaining_time": "12:12:37"}
{"current_steps": 870, "total_steps": 1617, "loss": 0.5317, "lr": 5e-06, "epoch": 1.6137259448179921, "percentage": 53.8, "elapsed_time": "14:01:52", "remaining_time": "12:02:50"}
{"current_steps": 880, "total_steps": 1617, "loss": 0.527, "lr": 5e-06, "epoch": 1.6322745188963599, "percentage": 54.42, "elapsed_time": "14:11:26", "remaining_time": "11:53:04"}
{"current_steps": 890, "total_steps": 1617, "loss": 0.5194, "lr": 5e-06, "epoch": 1.6508230929747274, "percentage": 55.04, "elapsed_time": "14:21:00", "remaining_time": "11:43:18"}
{"current_steps": 900, "total_steps": 1617, "loss": 0.5206, "lr": 5e-06, "epoch": 1.6693716670530954, "percentage": 55.66, "elapsed_time": "14:30:34", "remaining_time": "11:33:33"}
{"current_steps": 910, "total_steps": 1617, "loss": 0.515, "lr": 5e-06, "epoch": 1.6879202411314629, "percentage": 56.28, "elapsed_time": "14:40:08", "remaining_time": "11:23:48"}
{"current_steps": 920, "total_steps": 1617, "loss": 0.5304, "lr": 5e-06, "epoch": 1.7064688152098308, "percentage": 56.9, "elapsed_time": "14:49:42", "remaining_time": "11:14:03"}
{"current_steps": 930, "total_steps": 1617, "loss": 0.5228, "lr": 5e-06, "epoch": 1.7250173892881984, "percentage": 57.51, "elapsed_time": "14:59:16", "remaining_time": "11:04:18"}
{"current_steps": 940, "total_steps": 1617, "loss": 0.5066, "lr": 5e-06, "epoch": 1.7435659633665663, "percentage": 58.13, "elapsed_time": "15:08:51", "remaining_time": "10:54:34"}
{"current_steps": 950, "total_steps": 1617, "loss": 0.5219, "lr": 5e-06, "epoch": 1.7621145374449338, "percentage": 58.75, "elapsed_time": "15:18:25", "remaining_time": "10:44:50"}
{"current_steps": 960, "total_steps": 1617, "loss": 0.519, "lr": 5e-06, "epoch": 1.7806631115233018, "percentage": 59.37, "elapsed_time": "15:27:59", "remaining_time": "10:35:05"}
{"current_steps": 970, "total_steps": 1617, "loss": 0.5155, "lr": 5e-06, "epoch": 1.7992116856016693, "percentage": 59.99, "elapsed_time": "15:37:33", "remaining_time": "10:25:21"}
{"current_steps": 980, "total_steps": 1617, "loss": 0.5056, "lr": 5e-06, "epoch": 1.817760259680037, "percentage": 60.61, "elapsed_time": "15:47:07", "remaining_time": "10:15:38"}
{"current_steps": 990, "total_steps": 1617, "loss": 0.5178, "lr": 5e-06, "epoch": 1.8363088337584048, "percentage": 61.22, "elapsed_time": "15:56:42", "remaining_time": "10:05:54"}
{"current_steps": 1000, "total_steps": 1617, "loss": 0.5235, "lr": 5e-06, "epoch": 1.8548574078367726, "percentage": 61.84, "elapsed_time": "16:06:16", "remaining_time": "9:56:11"}
{"current_steps": 1010, "total_steps": 1617, "loss": 0.5291, "lr": 5e-06, "epoch": 1.8734059819151403, "percentage": 62.46, "elapsed_time": "16:15:50", "remaining_time": "9:46:28"}
{"current_steps": 1020, "total_steps": 1617, "loss": 0.5136, "lr": 5e-06, "epoch": 1.891954555993508, "percentage": 63.08, "elapsed_time": "16:25:24", "remaining_time": "9:36:45"}
{"current_steps": 1030, "total_steps": 1617, "loss": 0.5174, "lr": 5e-06, "epoch": 1.9105031300718758, "percentage": 63.7, "elapsed_time": "16:34:58", "remaining_time": "9:27:02"}
{"current_steps": 1040, "total_steps": 1617, "loss": 0.524, "lr": 5e-06, "epoch": 1.9290517041502433, "percentage": 64.32, "elapsed_time": "16:44:32", "remaining_time": "9:17:19"}
{"current_steps": 1050, "total_steps": 1617, "loss": 0.5117, "lr": 5e-06, "epoch": 1.9476002782286113, "percentage": 64.94, "elapsed_time": "16:54:07", "remaining_time": "9:07:37"}
{"current_steps": 1060, "total_steps": 1617, "loss": 0.5101, "lr": 5e-06, "epoch": 1.9661488523069788, "percentage": 65.55, "elapsed_time": "17:03:41", "remaining_time": "8:57:55"}
{"current_steps": 1070, "total_steps": 1617, "loss": 0.519, "lr": 5e-06, "epoch": 1.9846974263853467, "percentage": 66.17, "elapsed_time": "17:13:16", "remaining_time": "8:48:13"}
{"current_steps": 1078, "total_steps": 1617, "eval_loss": 0.5572099685668945, "epoch": 1.9995362856480408, "percentage": 66.67, "elapsed_time": "17:30:39", "remaining_time": "8:45:19"}
{"current_steps": 1080, "total_steps": 1617, "loss": 0.5612, "lr": 5e-06, "epoch": 2.0032460004637143, "percentage": 66.79, "elapsed_time": "17:33:34", "remaining_time": "8:43:51"}
{"current_steps": 1090, "total_steps": 1617, "loss": 0.4796, "lr": 5e-06, "epoch": 2.0217945745420822, "percentage": 67.41, "elapsed_time": "17:43:09", "remaining_time": "8:34:01"}
{"current_steps": 1100, "total_steps": 1617, "loss": 0.4717, "lr": 5e-06, "epoch": 2.0403431486204497, "percentage": 68.03, "elapsed_time": "17:52:43", "remaining_time": "8:24:10"}
{"current_steps": 1110, "total_steps": 1617, "loss": 0.4705, "lr": 5e-06, "epoch": 2.0588917226988177, "percentage": 68.65, "elapsed_time": "18:02:17", "remaining_time": "8:14:20"}
{"current_steps": 1120, "total_steps": 1617, "loss": 0.4661, "lr": 5e-06, "epoch": 2.0774402967771852, "percentage": 69.26, "elapsed_time": "18:11:51", "remaining_time": "8:04:30"}
{"current_steps": 1130, "total_steps": 1617, "loss": 0.4674, "lr": 5e-06, "epoch": 2.095988870855553, "percentage": 69.88, "elapsed_time": "18:21:25", "remaining_time": "7:54:41"}
{"current_steps": 1140, "total_steps": 1617, "loss": 0.4645, "lr": 5e-06, "epoch": 2.1145374449339207, "percentage": 70.5, "elapsed_time": "18:30:59", "remaining_time": "7:44:51"}
{"current_steps": 1150, "total_steps": 1617, "loss": 0.4676, "lr": 5e-06, "epoch": 2.1330860190122882, "percentage": 71.12, "elapsed_time": "18:40:33", "remaining_time": "7:35:02"}
{"current_steps": 1160, "total_steps": 1617, "loss": 0.4657, "lr": 5e-06, "epoch": 2.151634593090656, "percentage": 71.74, "elapsed_time": "18:50:07", "remaining_time": "7:25:13"}
{"current_steps": 1170, "total_steps": 1617, "loss": 0.4656, "lr": 5e-06, "epoch": 2.1701831671690237, "percentage": 72.36, "elapsed_time": "18:59:40", "remaining_time": "7:15:24"}
{"current_steps": 1180, "total_steps": 1617, "loss": 0.4583, "lr": 5e-06, "epoch": 2.1887317412473917, "percentage": 72.97, "elapsed_time": "19:09:14", "remaining_time": "7:05:36"}
{"current_steps": 1190, "total_steps": 1617, "loss": 0.469, "lr": 5e-06, "epoch": 2.207280315325759, "percentage": 73.59, "elapsed_time": "19:18:47", "remaining_time": "6:55:48"}
{"current_steps": 1200, "total_steps": 1617, "loss": 0.4715, "lr": 5e-06, "epoch": 2.225828889404127, "percentage": 74.21, "elapsed_time": "19:28:21", "remaining_time": "6:46:00"}
{"current_steps": 1210, "total_steps": 1617, "loss": 0.4584, "lr": 5e-06, "epoch": 2.2443774634824947, "percentage": 74.83, "elapsed_time": "19:37:54", "remaining_time": "6:36:12"}
{"current_steps": 1220, "total_steps": 1617, "loss": 0.4772, "lr": 5e-06, "epoch": 2.2629260375608626, "percentage": 75.45, "elapsed_time": "19:47:28", "remaining_time": "6:26:24"}
{"current_steps": 1230, "total_steps": 1617, "loss": 0.4701, "lr": 5e-06, "epoch": 2.28147461163923, "percentage": 76.07, "elapsed_time": "19:57:01", "remaining_time": "6:16:37"}
{"current_steps": 1240, "total_steps": 1617, "loss": 0.4619, "lr": 5e-06, "epoch": 2.300023185717598, "percentage": 76.69, "elapsed_time": "20:06:35", "remaining_time": "6:06:50"}
{"current_steps": 1250, "total_steps": 1617, "loss": 0.4734, "lr": 5e-06, "epoch": 2.3185717597959656, "percentage": 77.3, "elapsed_time": "20:16:08", "remaining_time": "5:57:03"}
{"current_steps": 1260, "total_steps": 1617, "loss": 0.4746, "lr": 5e-06, "epoch": 2.3371203338743336, "percentage": 77.92, "elapsed_time": "20:25:43", "remaining_time": "5:47:17"}
{"current_steps": 1270, "total_steps": 1617, "loss": 0.4647, "lr": 5e-06, "epoch": 2.355668907952701, "percentage": 78.54, "elapsed_time": "20:35:16", "remaining_time": "5:37:30"}
{"current_steps": 1280, "total_steps": 1617, "loss": 0.459, "lr": 5e-06, "epoch": 2.374217482031069, "percentage": 79.16, "elapsed_time": "20:44:50", "remaining_time": "5:27:44"}
{"current_steps": 1290, "total_steps": 1617, "loss": 0.4687, "lr": 5e-06, "epoch": 2.3927660561094366, "percentage": 79.78, "elapsed_time": "20:54:24", "remaining_time": "5:17:58"}
{"current_steps": 1300, "total_steps": 1617, "loss": 0.4636, "lr": 5e-06, "epoch": 2.411314630187804, "percentage": 80.4, "elapsed_time": "21:03:58", "remaining_time": "5:08:12"}
{"current_steps": 1310, "total_steps": 1617, "loss": 0.4798, "lr": 5e-06, "epoch": 2.429863204266172, "percentage": 81.01, "elapsed_time": "21:13:32", "remaining_time": "4:58:27"}
{"current_steps": 1320, "total_steps": 1617, "loss": 0.4743, "lr": 5e-06, "epoch": 2.4484117783445396, "percentage": 81.63, "elapsed_time": "21:23:06", "remaining_time": "4:48:42"}
{"current_steps": 1330, "total_steps": 1617, "loss": 0.479, "lr": 5e-06, "epoch": 2.4669603524229076, "percentage": 82.25, "elapsed_time": "21:32:40", "remaining_time": "4:38:56"}
{"current_steps": 1340, "total_steps": 1617, "loss": 0.4667, "lr": 5e-06, "epoch": 2.485508926501275, "percentage": 82.87, "elapsed_time": "21:42:14", "remaining_time": "4:29:11"}
{"current_steps": 1350, "total_steps": 1617, "loss": 0.4756, "lr": 5e-06, "epoch": 2.504057500579643, "percentage": 83.49, "elapsed_time": "21:51:48", "remaining_time": "4:19:26"}
{"current_steps": 1360, "total_steps": 1617, "loss": 0.4656, "lr": 5e-06, "epoch": 2.5226060746580106, "percentage": 84.11, "elapsed_time": "22:01:22", "remaining_time": "4:09:42"}
{"current_steps": 1370, "total_steps": 1617, "loss": 0.4769, "lr": 5e-06, "epoch": 2.5411546487363785, "percentage": 84.72, "elapsed_time": "22:10:57", "remaining_time": "3:59:57"}
{"current_steps": 1380, "total_steps": 1617, "loss": 0.4715, "lr": 5e-06, "epoch": 2.559703222814746, "percentage": 85.34, "elapsed_time": "22:20:30", "remaining_time": "3:50:13"}
{"current_steps": 1390, "total_steps": 1617, "loss": 0.466, "lr": 5e-06, "epoch": 2.578251796893114, "percentage": 85.96, "elapsed_time": "22:30:05", "remaining_time": "3:40:28"}
{"current_steps": 1400, "total_steps": 1617, "loss": 0.4719, "lr": 5e-06, "epoch": 2.5968003709714815, "percentage": 86.58, "elapsed_time": "22:39:38", "remaining_time": "3:30:44"}
{"current_steps": 1410, "total_steps": 1617, "loss": 0.4657, "lr": 5e-06, "epoch": 2.615348945049849, "percentage": 87.2, "elapsed_time": "22:49:11", "remaining_time": "3:21:00"}
{"current_steps": 1420, "total_steps": 1617, "loss": 0.4649, "lr": 5e-06, "epoch": 2.633897519128217, "percentage": 87.82, "elapsed_time": "22:58:45", "remaining_time": "3:11:16"}
{"current_steps": 1430, "total_steps": 1617, "loss": 0.4734, "lr": 5e-06, "epoch": 2.652446093206585, "percentage": 88.44, "elapsed_time": "23:08:19", "remaining_time": "3:01:32"}
{"current_steps": 1440, "total_steps": 1617, "loss": 0.4696, "lr": 5e-06, "epoch": 2.6709946672849525, "percentage": 89.05, "elapsed_time": "23:17:52", "remaining_time": "2:51:49"}
{"current_steps": 1450, "total_steps": 1617, "loss": 0.4626, "lr": 5e-06, "epoch": 2.68954324136332, "percentage": 89.67, "elapsed_time": "23:27:26", "remaining_time": "2:42:05"}
{"current_steps": 1460, "total_steps": 1617, "loss": 0.4683, "lr": 5e-06, "epoch": 2.708091815441688, "percentage": 90.29, "elapsed_time": "23:36:59", "remaining_time": "2:32:22"}
{"current_steps": 1470, "total_steps": 1617, "loss": 0.4724, "lr": 5e-06, "epoch": 2.7266403895200555, "percentage": 90.91, "elapsed_time": "23:46:31", "remaining_time": "2:22:39"}
{"current_steps": 1480, "total_steps": 1617, "loss": 0.4756, "lr": 5e-06, "epoch": 2.7451889635984235, "percentage": 91.53, "elapsed_time": "23:56:05", "remaining_time": "2:12:56"}
{"current_steps": 1490, "total_steps": 1617, "loss": 0.4765, "lr": 5e-06, "epoch": 2.763737537676791, "percentage": 92.15, "elapsed_time": "1 day, 0:05:38", "remaining_time": "2:03:13"}
{"current_steps": 1500, "total_steps": 1617, "loss": 0.4798, "lr": 5e-06, "epoch": 2.782286111755159, "percentage": 92.76, "elapsed_time": "1 day, 0:15:11", "remaining_time": "1:53:30"}
{"current_steps": 1510, "total_steps": 1617, "loss": 0.4694, "lr": 5e-06, "epoch": 2.8008346858335265, "percentage": 93.38, "elapsed_time": "1 day, 0:24:45", "remaining_time": "1:43:47"}
{"current_steps": 1520, "total_steps": 1617, "loss": 0.4672, "lr": 5e-06, "epoch": 2.8193832599118944, "percentage": 94.0, "elapsed_time": "1 day, 0:34:18", "remaining_time": "1:34:05"}
{"current_steps": 1530, "total_steps": 1617, "loss": 0.4704, "lr": 5e-06, "epoch": 2.837931833990262, "percentage": 94.62, "elapsed_time": "1 day, 0:43:52", "remaining_time": "1:24:22"}
{"current_steps": 1540, "total_steps": 1617, "loss": 0.4795, "lr": 5e-06, "epoch": 2.85648040806863, "percentage": 95.24, "elapsed_time": "1 day, 0:53:25", "remaining_time": "1:14:40"}
{"current_steps": 1550, "total_steps": 1617, "loss": 0.4626, "lr": 5e-06, "epoch": 2.8750289821469974, "percentage": 95.86, "elapsed_time": "1 day, 1:02:59", "remaining_time": "1:04:58"}
{"current_steps": 1560, "total_steps": 1617, "loss": 0.4767, "lr": 5e-06, "epoch": 2.893577556225365, "percentage": 96.47, "elapsed_time": "1 day, 1:12:32", "remaining_time": "0:55:15"}
{"current_steps": 1570, "total_steps": 1617, "loss": 0.4681, "lr": 5e-06, "epoch": 2.912126130303733, "percentage": 97.09, "elapsed_time": "1 day, 1:22:05", "remaining_time": "0:45:33"}
{"current_steps": 1580, "total_steps": 1617, "loss": 0.4732, "lr": 5e-06, "epoch": 2.930674704382101, "percentage": 97.71, "elapsed_time": "1 day, 1:31:39", "remaining_time": "0:35:52"}
{"current_steps": 1590, "total_steps": 1617, "loss": 0.4732, "lr": 5e-06, "epoch": 2.9492232784604684, "percentage": 98.33, "elapsed_time": "1 day, 1:41:12", "remaining_time": "0:26:10"}
{"current_steps": 1600, "total_steps": 1617, "loss": 0.4713, "lr": 5e-06, "epoch": 2.967771852538836, "percentage": 98.95, "elapsed_time": "1 day, 1:50:45", "remaining_time": "0:16:28"}
{"current_steps": 1610, "total_steps": 1617, "loss": 0.469, "lr": 5e-06, "epoch": 2.986320426617204, "percentage": 99.57, "elapsed_time": "1 day, 2:00:19", "remaining_time": "0:06:47"}
{"current_steps": 1617, "total_steps": 1617, "eval_loss": 0.5541288256645203, "epoch": 2.9993044284720614, "percentage": 100.0, "elapsed_time": "1 day, 2:17:41", "remaining_time": "0:00:00"}
{"current_steps": 1617, "total_steps": 1617, "epoch": 2.9993044284720614, "percentage": 100.0, "elapsed_time": "1 day, 2:19:10", "remaining_time": "0:00:00"}