Training in progress, step 3000
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2a98295a1e634e88cf8515a2ee71c8862b2b17c16858accec06e9cd8371eaf6
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5f0fdde20cd86d13e56a1769a7e255a07b658b11745063a36b4e0f88fffe985
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6820b480842b0f24468ee6ab538772e6fee31598b47bbe2953534b0c54b2d829
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfc55e3eed89dd590cb2f15b0c48b56aadfbe4075556a7fbe869aa18265b3bae
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -317,3 +317,310 @@
|
|
| 317 |
{"current_steps": 1585, "total_steps": 12698, "loss": 0.1431, "lr": 3.99255355650765e-05, "epoch": 0.8737596471885336, "percentage": 12.48, "elapsed_time": "2:54:54", "remaining_time": "20:26:22"}
|
| 318 |
{"current_steps": 1590, "total_steps": 12698, "loss": 0.142, "lr": 3.992314673710739e-05, "epoch": 0.87651598676957, "percentage": 12.52, "elapsed_time": "2:55:18", "remaining_time": "20:24:43"}
|
| 319 |
{"current_steps": 1595, "total_steps": 12698, "loss": 0.1294, "lr": 3.992072026848469e-05, "epoch": 0.8792723263506064, "percentage": 12.56, "elapsed_time": "2:55:40", "remaining_time": "20:22:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 317 |
{"current_steps": 1585, "total_steps": 12698, "loss": 0.1431, "lr": 3.99255355650765e-05, "epoch": 0.8737596471885336, "percentage": 12.48, "elapsed_time": "2:54:54", "remaining_time": "20:26:22"}
|
| 318 |
{"current_steps": 1590, "total_steps": 12698, "loss": 0.142, "lr": 3.992314673710739e-05, "epoch": 0.87651598676957, "percentage": 12.52, "elapsed_time": "2:55:18", "remaining_time": "20:24:43"}
|
| 319 |
{"current_steps": 1595, "total_steps": 12698, "loss": 0.1294, "lr": 3.992072026848469e-05, "epoch": 0.8792723263506064, "percentage": 12.56, "elapsed_time": "2:55:40", "remaining_time": "20:22:51"}
|
| 320 |
+
{"current_steps": 1600, "total_steps": 12698, "loss": 0.1213, "lr": 3.991825616379271e-05, "epoch": 0.8820286659316428, "percentage": 12.6, "elapsed_time": "2:56:05", "remaining_time": "20:21:27"}
|
| 321 |
+
{"current_steps": 1605, "total_steps": 12698, "loss": 0.1492, "lr": 3.9915754427686867e-05, "epoch": 0.8847850055126791, "percentage": 12.64, "elapsed_time": "2:56:40", "remaining_time": "20:21:07"}
|
| 322 |
+
{"current_steps": 1610, "total_steps": 12698, "loss": 0.11, "lr": 3.9913215064893664e-05, "epoch": 0.8875413450937155, "percentage": 12.68, "elapsed_time": "2:57:02", "remaining_time": "20:19:20"}
|
| 323 |
+
{"current_steps": 1615, "total_steps": 12698, "loss": 0.1369, "lr": 3.9910638080210714e-05, "epoch": 0.8902976846747519, "percentage": 12.72, "elapsed_time": "2:57:27", "remaining_time": "20:17:48"}
|
| 324 |
+
{"current_steps": 1620, "total_steps": 12698, "loss": 0.1407, "lr": 3.990802347850668e-05, "epoch": 0.8930540242557883, "percentage": 12.76, "elapsed_time": "2:57:53", "remaining_time": "20:16:29"}
|
| 325 |
+
{"current_steps": 1625, "total_steps": 12698, "loss": 0.1426, "lr": 3.990537126472132e-05, "epoch": 0.8958103638368247, "percentage": 12.8, "elapsed_time": "2:58:25", "remaining_time": "20:15:47"}
|
| 326 |
+
{"current_steps": 1630, "total_steps": 12698, "loss": 0.1397, "lr": 3.990268144386543e-05, "epoch": 0.898566703417861, "percentage": 12.84, "elapsed_time": "2:58:59", "remaining_time": "20:15:22"}
|
| 327 |
+
{"current_steps": 1635, "total_steps": 12698, "loss": 0.1409, "lr": 3.989995402102089e-05, "epoch": 0.9013230429988974, "percentage": 12.88, "elapsed_time": "2:59:19", "remaining_time": "20:13:24"}
|
| 328 |
+
{"current_steps": 1640, "total_steps": 12698, "loss": 0.1313, "lr": 3.989718900134058e-05, "epoch": 0.9040793825799338, "percentage": 12.92, "elapsed_time": "2:59:42", "remaining_time": "20:11:41"}
|
| 329 |
+
{"current_steps": 1645, "total_steps": 12698, "loss": 0.156, "lr": 3.9894386390048444e-05, "epoch": 0.9068357221609702, "percentage": 12.95, "elapsed_time": "3:00:20", "remaining_time": "20:11:46"}
|
| 330 |
+
{"current_steps": 1650, "total_steps": 12698, "loss": 0.1302, "lr": 3.989154619243943e-05, "epoch": 0.9095920617420066, "percentage": 12.99, "elapsed_time": "3:00:45", "remaining_time": "20:10:19"}
|
| 331 |
+
{"current_steps": 1655, "total_steps": 12698, "loss": 0.1183, "lr": 3.988866841387949e-05, "epoch": 0.912348401323043, "percentage": 13.03, "elapsed_time": "3:01:07", "remaining_time": "20:08:32"}
|
| 332 |
+
{"current_steps": 1660, "total_steps": 12698, "loss": 0.1434, "lr": 3.988575305980561e-05, "epoch": 0.9151047409040793, "percentage": 13.07, "elapsed_time": "3:01:39", "remaining_time": "20:07:55"}
|
| 333 |
+
{"current_steps": 1665, "total_steps": 12698, "loss": 0.1396, "lr": 3.988280013572573e-05, "epoch": 0.9178610804851157, "percentage": 13.11, "elapsed_time": "3:02:13", "remaining_time": "20:07:32"}
|
| 334 |
+
{"current_steps": 1670, "total_steps": 12698, "loss": 0.1144, "lr": 3.9879809647218805e-05, "epoch": 0.9206174200661521, "percentage": 13.15, "elapsed_time": "3:02:40", "remaining_time": "20:06:17"}
|
| 335 |
+
{"current_steps": 1675, "total_steps": 12698, "loss": 0.1263, "lr": 3.9876781599934726e-05, "epoch": 0.9233737596471885, "percentage": 13.19, "elapsed_time": "3:03:18", "remaining_time": "20:06:19"}
|
| 336 |
+
{"current_steps": 1680, "total_steps": 12698, "loss": 0.1133, "lr": 3.9873715999594374e-05, "epoch": 0.9261300992282249, "percentage": 13.23, "elapsed_time": "3:03:45", "remaining_time": "20:05:10"}
|
| 337 |
+
{"current_steps": 1685, "total_steps": 12698, "loss": 0.1054, "lr": 3.987061285198955e-05, "epoch": 0.9288864388092613, "percentage": 13.27, "elapsed_time": "3:04:10", "remaining_time": "20:03:42"}
|
| 338 |
+
{"current_steps": 1690, "total_steps": 12698, "loss": 0.1344, "lr": 3.9867472162983024e-05, "epoch": 0.9316427783902976, "percentage": 13.31, "elapsed_time": "3:04:36", "remaining_time": "20:02:30"}
|
| 339 |
+
{"current_steps": 1695, "total_steps": 12698, "loss": 0.1237, "lr": 3.9864293938508465e-05, "epoch": 0.934399117971334, "percentage": 13.35, "elapsed_time": "3:05:09", "remaining_time": "20:01:53"}
|
| 340 |
+
{"current_steps": 1700, "total_steps": 12698, "loss": 0.145, "lr": 3.986107818457048e-05, "epoch": 0.9371554575523704, "percentage": 13.39, "elapsed_time": "3:05:37", "remaining_time": "20:00:52"}
|
| 341 |
+
{"current_steps": 1705, "total_steps": 12698, "loss": 0.1315, "lr": 3.985782490724455e-05, "epoch": 0.9399117971334069, "percentage": 13.43, "elapsed_time": "3:06:03", "remaining_time": "19:59:34"}
|
| 342 |
+
{"current_steps": 1710, "total_steps": 12698, "loss": 0.1572, "lr": 3.985453411267709e-05, "epoch": 0.9426681367144433, "percentage": 13.47, "elapsed_time": "3:06:26", "remaining_time": "19:58:02"}
|
| 343 |
+
{"current_steps": 1715, "total_steps": 12698, "loss": 0.1144, "lr": 3.985120580708536e-05, "epoch": 0.9454244762954797, "percentage": 13.51, "elapsed_time": "3:06:46", "remaining_time": "19:56:08"}
|
| 344 |
+
{"current_steps": 1720, "total_steps": 12698, "loss": 0.14, "lr": 3.98478399967575e-05, "epoch": 0.948180815876516, "percentage": 13.55, "elapsed_time": "3:07:10", "remaining_time": "19:54:38"}
|
| 345 |
+
{"current_steps": 1725, "total_steps": 12698, "loss": 0.1212, "lr": 3.9844436688052526e-05, "epoch": 0.9509371554575524, "percentage": 13.58, "elapsed_time": "3:07:30", "remaining_time": "19:52:47"}
|
| 346 |
+
{"current_steps": 1730, "total_steps": 12698, "loss": 0.1728, "lr": 3.9840995887400274e-05, "epoch": 0.9536934950385888, "percentage": 13.62, "elapsed_time": "3:08:03", "remaining_time": "19:52:17"}
|
| 347 |
+
{"current_steps": 1735, "total_steps": 12698, "loss": 0.1558, "lr": 3.9837517601301424e-05, "epoch": 0.9564498346196252, "percentage": 13.66, "elapsed_time": "3:08:51", "remaining_time": "19:53:18"}
|
| 348 |
+
{"current_steps": 1740, "total_steps": 12698, "loss": 0.127, "lr": 3.983400183632747e-05, "epoch": 0.9592061742006616, "percentage": 13.7, "elapsed_time": "3:09:15", "remaining_time": "19:51:53"}
|
| 349 |
+
{"current_steps": 1745, "total_steps": 12698, "loss": 0.1255, "lr": 3.983044859912073e-05, "epoch": 0.961962513781698, "percentage": 13.74, "elapsed_time": "3:09:38", "remaining_time": "19:50:19"}
|
| 350 |
+
{"current_steps": 1750, "total_steps": 12698, "loss": 0.124, "lr": 3.9826857896394306e-05, "epoch": 0.9647188533627343, "percentage": 13.78, "elapsed_time": "3:10:00", "remaining_time": "19:48:39"}
|
| 351 |
+
{"current_steps": 1755, "total_steps": 12698, "loss": 0.1187, "lr": 3.982322973493209e-05, "epoch": 0.9674751929437707, "percentage": 13.82, "elapsed_time": "3:10:20", "remaining_time": "19:46:48"}
|
| 352 |
+
{"current_steps": 1760, "total_steps": 12698, "loss": 0.1538, "lr": 3.9819564121588736e-05, "epoch": 0.9702315325248071, "percentage": 13.86, "elapsed_time": "3:10:41", "remaining_time": "19:45:03"}
|
| 353 |
+
{"current_steps": 1765, "total_steps": 12698, "loss": 0.1127, "lr": 3.981586106328966e-05, "epoch": 0.9729878721058435, "percentage": 13.9, "elapsed_time": "3:11:04", "remaining_time": "19:43:34"}
|
| 354 |
+
{"current_steps": 1770, "total_steps": 12698, "loss": 0.1187, "lr": 3.981212056703102e-05, "epoch": 0.9757442116868799, "percentage": 13.94, "elapsed_time": "3:11:25", "remaining_time": "19:41:51"}
|
| 355 |
+
{"current_steps": 1775, "total_steps": 12698, "loss": 0.1229, "lr": 3.980834263987971e-05, "epoch": 0.9785005512679162, "percentage": 13.98, "elapsed_time": "3:11:51", "remaining_time": "19:40:40"}
|
| 356 |
+
{"current_steps": 1780, "total_steps": 12698, "loss": 0.1324, "lr": 3.980452728897334e-05, "epoch": 0.9812568908489526, "percentage": 14.02, "elapsed_time": "3:12:25", "remaining_time": "19:40:15"}
|
| 357 |
+
{"current_steps": 1785, "total_steps": 12698, "loss": 0.1074, "lr": 3.9800674521520234e-05, "epoch": 0.984013230429989, "percentage": 14.06, "elapsed_time": "3:12:55", "remaining_time": "19:39:28"}
|
| 358 |
+
{"current_steps": 1790, "total_steps": 12698, "loss": 0.1202, "lr": 3.9796784344799385e-05, "epoch": 0.9867695700110254, "percentage": 14.1, "elapsed_time": "3:13:24", "remaining_time": "19:38:35"}
|
| 359 |
+
{"current_steps": 1795, "total_steps": 12698, "loss": 0.1384, "lr": 3.979285676616048e-05, "epoch": 0.9895259095920618, "percentage": 14.14, "elapsed_time": "3:14:16", "remaining_time": "19:40:00"}
|
| 360 |
+
{"current_steps": 1800, "total_steps": 12698, "loss": 0.2087, "lr": 3.978889179302385e-05, "epoch": 0.9922822491730982, "percentage": 14.18, "elapsed_time": "3:15:10", "remaining_time": "19:41:39"}
|
| 361 |
+
{"current_steps": 1805, "total_steps": 12698, "loss": 0.1203, "lr": 3.9784889432880513e-05, "epoch": 0.9950385887541345, "percentage": 14.21, "elapsed_time": "3:15:41", "remaining_time": "19:40:56"}
|
| 362 |
+
{"current_steps": 1810, "total_steps": 12698, "loss": 0.1193, "lr": 3.9780849693292094e-05, "epoch": 0.9977949283351709, "percentage": 14.25, "elapsed_time": "3:16:05", "remaining_time": "19:39:32"}
|
| 363 |
+
{"current_steps": 1815, "total_steps": 12698, "loss": 0.1924, "lr": 3.977677258189082e-05, "epoch": 1.0005512679162072, "percentage": 14.29, "elapsed_time": "3:16:59", "remaining_time": "19:41:11"}
|
| 364 |
+
{"current_steps": 1820, "total_steps": 12698, "loss": 0.2826, "lr": 3.977265810637957e-05, "epoch": 1.0033076074972436, "percentage": 14.33, "elapsed_time": "3:18:13", "remaining_time": "19:44:44"}
|
| 365 |
+
{"current_steps": 1825, "total_steps": 12698, "loss": 0.2761, "lr": 3.9768506274531795e-05, "epoch": 1.00606394707828, "percentage": 14.37, "elapsed_time": "3:19:21", "remaining_time": "19:47:47"}
|
| 366 |
+
{"current_steps": 1830, "total_steps": 12698, "loss": 0.2648, "lr": 3.97643170941915e-05, "epoch": 1.0088202866593163, "percentage": 14.41, "elapsed_time": "3:20:37", "remaining_time": "19:51:27"}
|
| 367 |
+
{"current_steps": 1835, "total_steps": 12698, "loss": 0.2426, "lr": 3.9760090573273286e-05, "epoch": 1.0115766262403527, "percentage": 14.45, "elapsed_time": "3:21:56", "remaining_time": "19:55:27"}
|
| 368 |
+
{"current_steps": 1840, "total_steps": 12698, "loss": 0.2492, "lr": 3.975582671976229e-05, "epoch": 1.014332965821389, "percentage": 14.49, "elapsed_time": "3:23:15", "remaining_time": "19:59:24"}
|
| 369 |
+
{"current_steps": 1845, "total_steps": 12698, "loss": 0.2653, "lr": 3.9751525541714164e-05, "epoch": 1.0170893054024255, "percentage": 14.53, "elapsed_time": "3:24:31", "remaining_time": "20:03:06"}
|
| 370 |
+
{"current_steps": 1850, "total_steps": 12698, "loss": 0.2613, "lr": 3.974718704725511e-05, "epoch": 1.0198456449834619, "percentage": 14.57, "elapsed_time": "3:25:47", "remaining_time": "20:06:43"}
|
| 371 |
+
{"current_steps": 1855, "total_steps": 12698, "loss": 0.2496, "lr": 3.9742811244581806e-05, "epoch": 1.0226019845644982, "percentage": 14.61, "elapsed_time": "3:26:59", "remaining_time": "20:09:57"}
|
| 372 |
+
{"current_steps": 1860, "total_steps": 12698, "loss": 0.2467, "lr": 3.973839814196142e-05, "epoch": 1.0253583241455346, "percentage": 14.65, "elapsed_time": "3:27:58", "remaining_time": "20:11:49"}
|
| 373 |
+
{"current_steps": 1865, "total_steps": 12698, "loss": 0.2412, "lr": 3.973394774773159e-05, "epoch": 1.028114663726571, "percentage": 14.69, "elapsed_time": "3:29:11", "remaining_time": "20:15:05"}
|
| 374 |
+
{"current_steps": 1870, "total_steps": 12698, "loss": 0.2433, "lr": 3.972946007030043e-05, "epoch": 1.0308710033076074, "percentage": 14.73, "elapsed_time": "3:30:22", "remaining_time": "20:18:09"}
|
| 375 |
+
{"current_steps": 1875, "total_steps": 12698, "loss": 0.2395, "lr": 3.972493511814646e-05, "epoch": 1.0336273428886438, "percentage": 14.77, "elapsed_time": "3:31:31", "remaining_time": "20:20:59"}
|
| 376 |
+
{"current_steps": 1880, "total_steps": 12698, "loss": 0.237, "lr": 3.972037289981865e-05, "epoch": 1.0363836824696802, "percentage": 14.81, "elapsed_time": "3:32:39", "remaining_time": "20:23:41"}
|
| 377 |
+
{"current_steps": 1885, "total_steps": 12698, "loss": 0.2295, "lr": 3.971577342393635e-05, "epoch": 1.0391400220507165, "percentage": 14.84, "elapsed_time": "3:33:50", "remaining_time": "20:26:40"}
|
| 378 |
+
{"current_steps": 1890, "total_steps": 12698, "loss": 0.2349, "lr": 3.971113669918933e-05, "epoch": 1.041896361631753, "percentage": 14.88, "elapsed_time": "3:34:57", "remaining_time": "20:29:12"}
|
| 379 |
+
{"current_steps": 1895, "total_steps": 12698, "loss": 0.2371, "lr": 3.9706462734337714e-05, "epoch": 1.0446527012127893, "percentage": 14.92, "elapsed_time": "3:36:05", "remaining_time": "20:31:52"}
|
| 380 |
+
{"current_steps": 1900, "total_steps": 12698, "loss": 0.2288, "lr": 3.970175153821199e-05, "epoch": 1.0474090407938257, "percentage": 14.96, "elapsed_time": "3:37:20", "remaining_time": "20:35:08"}
|
| 381 |
+
{"current_steps": 1905, "total_steps": 12698, "loss": 0.2488, "lr": 3.9697003119712994e-05, "epoch": 1.0501653803748623, "percentage": 15.0, "elapsed_time": "3:38:31", "remaining_time": "20:38:03"}
|
| 382 |
+
{"current_steps": 1910, "total_steps": 12698, "loss": 0.2605, "lr": 3.969221748781186e-05, "epoch": 1.0529217199558987, "percentage": 15.04, "elapsed_time": "3:39:41", "remaining_time": "20:40:49"}
|
| 383 |
+
{"current_steps": 1915, "total_steps": 12698, "loss": 0.219, "lr": 3.9687394651550055e-05, "epoch": 1.055678059536935, "percentage": 15.08, "elapsed_time": "3:40:40", "remaining_time": "20:42:37"}
|
| 384 |
+
{"current_steps": 1920, "total_steps": 12698, "loss": 0.2228, "lr": 3.968253462003934e-05, "epoch": 1.0584343991179714, "percentage": 15.12, "elapsed_time": "3:41:52", "remaining_time": "20:45:29"}
|
| 385 |
+
{"current_steps": 1925, "total_steps": 12698, "loss": 0.2293, "lr": 3.967763740246172e-05, "epoch": 1.0611907386990078, "percentage": 15.16, "elapsed_time": "3:43:04", "remaining_time": "20:48:24"}
|
| 386 |
+
{"current_steps": 1930, "total_steps": 12698, "loss": 0.2413, "lr": 3.967270300806948e-05, "epoch": 1.0639470782800442, "percentage": 15.2, "elapsed_time": "3:44:11", "remaining_time": "20:50:49"}
|
| 387 |
+
{"current_steps": 1935, "total_steps": 12698, "loss": 0.232, "lr": 3.9667731446185126e-05, "epoch": 1.0667034178610806, "percentage": 15.24, "elapsed_time": "3:45:27", "remaining_time": "20:54:04"}
|
| 388 |
+
{"current_steps": 1940, "total_steps": 12698, "loss": 0.2311, "lr": 3.966272272620141e-05, "epoch": 1.069459757442117, "percentage": 15.28, "elapsed_time": "3:46:44", "remaining_time": "20:57:24"}
|
| 389 |
+
{"current_steps": 1945, "total_steps": 12698, "loss": 0.2023, "lr": 3.965767685758126e-05, "epoch": 1.0722160970231533, "percentage": 15.32, "elapsed_time": "3:48:00", "remaining_time": "21:00:33"}
|
| 390 |
+
{"current_steps": 1950, "total_steps": 12698, "loss": 0.2046, "lr": 3.965259384985779e-05, "epoch": 1.0749724366041897, "percentage": 15.36, "elapsed_time": "3:49:15", "remaining_time": "21:03:37"}
|
| 391 |
+
{"current_steps": 1955, "total_steps": 12698, "loss": 0.214, "lr": 3.96474737126343e-05, "epoch": 1.0777287761852261, "percentage": 15.4, "elapsed_time": "3:50:30", "remaining_time": "21:06:41"}
|
| 392 |
+
{"current_steps": 1960, "total_steps": 12698, "loss": 0.237, "lr": 3.964231645558422e-05, "epoch": 1.0804851157662625, "percentage": 15.44, "elapsed_time": "3:51:19", "remaining_time": "21:07:18"}
|
| 393 |
+
{"current_steps": 1965, "total_steps": 12698, "loss": 0.2412, "lr": 3.9637122088451125e-05, "epoch": 1.0832414553472989, "percentage": 15.47, "elapsed_time": "3:52:27", "remaining_time": "21:09:43"}
|
| 394 |
+
{"current_steps": 1970, "total_steps": 12698, "loss": 0.2454, "lr": 3.963189062104869e-05, "epoch": 1.0859977949283353, "percentage": 15.51, "elapsed_time": "3:53:38", "remaining_time": "21:12:22"}
|
| 395 |
+
{"current_steps": 1975, "total_steps": 12698, "loss": 0.2438, "lr": 3.962662206326069e-05, "epoch": 1.0887541345093716, "percentage": 15.55, "elapsed_time": "3:54:50", "remaining_time": "21:15:00"}
|
| 396 |
+
{"current_steps": 1980, "total_steps": 12698, "loss": 0.2372, "lr": 3.962131642504097e-05, "epoch": 1.091510474090408, "percentage": 15.59, "elapsed_time": "3:56:01", "remaining_time": "21:17:36"}
|
| 397 |
+
{"current_steps": 1985, "total_steps": 12698, "loss": 0.2262, "lr": 3.9615973716413434e-05, "epoch": 1.0942668136714444, "percentage": 15.63, "elapsed_time": "3:57:19", "remaining_time": "21:20:48"}
|
| 398 |
+
{"current_steps": 1990, "total_steps": 12698, "loss": 0.2351, "lr": 3.961059394747202e-05, "epoch": 1.0970231532524808, "percentage": 15.67, "elapsed_time": "3:58:34", "remaining_time": "21:23:46"}
|
| 399 |
+
{"current_steps": 1995, "total_steps": 12698, "loss": 0.2285, "lr": 3.9605177128380686e-05, "epoch": 1.0997794928335172, "percentage": 15.71, "elapsed_time": "3:59:49", "remaining_time": "21:26:40"}
|
| 400 |
+
{"current_steps": 2000, "total_steps": 12698, "loss": 0.2391, "lr": 3.9599723269373393e-05, "epoch": 1.1025358324145536, "percentage": 15.75, "elapsed_time": "4:01:07", "remaining_time": "21:29:44"}
|
| 401 |
+
{"current_steps": 2005, "total_steps": 12698, "loss": 0.2296, "lr": 3.959423238075407e-05, "epoch": 1.10529217199559, "percentage": 15.79, "elapsed_time": "4:02:23", "remaining_time": "21:32:45"}
|
| 402 |
+
{"current_steps": 2010, "total_steps": 12698, "loss": 0.2343, "lr": 3.958870447289662e-05, "epoch": 1.1080485115766263, "percentage": 15.83, "elapsed_time": "4:03:37", "remaining_time": "21:35:28"}
|
| 403 |
+
{"current_steps": 2015, "total_steps": 12698, "loss": 0.2353, "lr": 3.958313955624487e-05, "epoch": 1.1108048511576627, "percentage": 15.87, "elapsed_time": "4:04:44", "remaining_time": "21:37:33"}
|
| 404 |
+
{"current_steps": 2020, "total_steps": 12698, "loss": 0.2262, "lr": 3.957753764131258e-05, "epoch": 1.113561190738699, "percentage": 15.91, "elapsed_time": "4:05:50", "remaining_time": "21:39:34"}
|
| 405 |
+
{"current_steps": 2025, "total_steps": 12698, "loss": 0.2278, "lr": 3.9571898738683394e-05, "epoch": 1.1163175303197355, "percentage": 15.95, "elapsed_time": "4:06:37", "remaining_time": "21:39:52"}
|
| 406 |
+
{"current_steps": 2030, "total_steps": 12698, "loss": 0.2274, "lr": 3.9566222859010875e-05, "epoch": 1.1190738699007718, "percentage": 15.99, "elapsed_time": "4:07:50", "remaining_time": "21:42:25"}
|
| 407 |
+
{"current_steps": 2035, "total_steps": 12698, "loss": 0.2264, "lr": 3.95605100130184e-05, "epoch": 1.1218302094818082, "percentage": 16.03, "elapsed_time": "4:08:59", "remaining_time": "21:44:39"}
|
| 408 |
+
{"current_steps": 2040, "total_steps": 12698, "loss": 0.2271, "lr": 3.9554760211499214e-05, "epoch": 1.1245865490628446, "percentage": 16.07, "elapsed_time": "4:10:15", "remaining_time": "21:47:26"}
|
| 409 |
+
{"current_steps": 2045, "total_steps": 12698, "loss": 0.2257, "lr": 3.9548973465316374e-05, "epoch": 1.127342888643881, "percentage": 16.1, "elapsed_time": "4:11:29", "remaining_time": "21:50:06"}
|
| 410 |
+
{"current_steps": 2050, "total_steps": 12698, "loss": 0.2297, "lr": 3.9543149785402733e-05, "epoch": 1.1300992282249174, "percentage": 16.14, "elapsed_time": "4:12:47", "remaining_time": "21:53:04"}
|
| 411 |
+
{"current_steps": 2055, "total_steps": 12698, "loss": 0.2303, "lr": 3.9537289182760926e-05, "epoch": 1.1328555678059538, "percentage": 16.18, "elapsed_time": "4:13:59", "remaining_time": "21:55:24"}
|
| 412 |
+
{"current_steps": 2060, "total_steps": 12698, "loss": 0.2044, "lr": 3.953139166846335e-05, "epoch": 1.1356119073869901, "percentage": 16.22, "elapsed_time": "4:14:46", "remaining_time": "21:55:41"}
|
| 413 |
+
{"current_steps": 2065, "total_steps": 12698, "loss": 0.2255, "lr": 3.952545725365215e-05, "epoch": 1.1383682469680265, "percentage": 16.26, "elapsed_time": "4:15:47", "remaining_time": "21:57:08"}
|
| 414 |
+
{"current_steps": 2070, "total_steps": 12698, "loss": 0.2218, "lr": 3.951948594953914e-05, "epoch": 1.141124586549063, "percentage": 16.3, "elapsed_time": "4:17:00", "remaining_time": "21:59:33"}
|
| 415 |
+
{"current_steps": 2075, "total_steps": 12698, "loss": 0.2286, "lr": 3.951347776740588e-05, "epoch": 1.1438809261300993, "percentage": 16.34, "elapsed_time": "4:18:12", "remaining_time": "22:01:52"}
|
| 416 |
+
{"current_steps": 2080, "total_steps": 12698, "loss": 0.2204, "lr": 3.9507432718603584e-05, "epoch": 1.1466372657111357, "percentage": 16.38, "elapsed_time": "4:19:18", "remaining_time": "22:03:43"}
|
| 417 |
+
{"current_steps": 2085, "total_steps": 12698, "loss": 0.2149, "lr": 3.9501350814553114e-05, "epoch": 1.149393605292172, "percentage": 16.42, "elapsed_time": "4:20:26", "remaining_time": "22:05:42"}
|
| 418 |
+
{"current_steps": 2090, "total_steps": 12698, "loss": 0.2253, "lr": 3.9495232066744965e-05, "epoch": 1.1521499448732084, "percentage": 16.46, "elapsed_time": "4:21:45", "remaining_time": "22:08:34"}
|
| 419 |
+
{"current_steps": 2095, "total_steps": 12698, "loss": 0.2466, "lr": 3.9489076486739245e-05, "epoch": 1.1549062844542448, "percentage": 16.5, "elapsed_time": "4:22:20", "remaining_time": "22:07:46"}
|
| 420 |
+
{"current_steps": 2100, "total_steps": 12698, "loss": 0.2454, "lr": 3.948288408616565e-05, "epoch": 1.1576626240352812, "percentage": 16.54, "elapsed_time": "4:22:32", "remaining_time": "22:04:59"}
|
| 421 |
+
{"current_steps": 2105, "total_steps": 12698, "loss": 0.2367, "lr": 3.947665487672342e-05, "epoch": 1.1604189636163176, "percentage": 16.58, "elapsed_time": "4:22:45", "remaining_time": "22:02:18"}
|
| 422 |
+
{"current_steps": 2110, "total_steps": 12698, "loss": 0.231, "lr": 3.9470388870181376e-05, "epoch": 1.163175303197354, "percentage": 16.62, "elapsed_time": "4:22:57", "remaining_time": "21:59:33"}
|
| 423 |
+
{"current_steps": 2115, "total_steps": 12698, "loss": 0.2313, "lr": 3.9464086078377824e-05, "epoch": 1.1659316427783903, "percentage": 16.66, "elapsed_time": "4:23:11", "remaining_time": "21:56:57"}
|
| 424 |
+
{"current_steps": 2120, "total_steps": 12698, "loss": 0.2239, "lr": 3.945774651322058e-05, "epoch": 1.1686879823594267, "percentage": 16.7, "elapsed_time": "4:23:23", "remaining_time": "21:54:13"}
|
| 425 |
+
{"current_steps": 2125, "total_steps": 12698, "loss": 0.2333, "lr": 3.945137018668695e-05, "epoch": 1.171444321940463, "percentage": 16.73, "elapsed_time": "4:23:35", "remaining_time": "21:51:31"}
|
| 426 |
+
{"current_steps": 2130, "total_steps": 12698, "loss": 0.22, "lr": 3.9444957110823665e-05, "epoch": 1.1742006615214995, "percentage": 16.77, "elapsed_time": "4:23:47", "remaining_time": "21:48:48"}
|
| 427 |
+
{"current_steps": 2135, "total_steps": 12698, "loss": 0.2431, "lr": 3.943850729774692e-05, "epoch": 1.1769570011025359, "percentage": 16.81, "elapsed_time": "4:23:59", "remaining_time": "21:46:04"}
|
| 428 |
+
{"current_steps": 2140, "total_steps": 12698, "loss": 0.2308, "lr": 3.943202075964229e-05, "epoch": 1.1797133406835723, "percentage": 16.85, "elapsed_time": "4:24:11", "remaining_time": "21:43:26"}
|
| 429 |
+
{"current_steps": 2145, "total_steps": 12698, "loss": 0.2215, "lr": 3.942549750876473e-05, "epoch": 1.1824696802646086, "percentage": 16.89, "elapsed_time": "4:24:24", "remaining_time": "21:40:52"}
|
| 430 |
+
{"current_steps": 2150, "total_steps": 12698, "loss": 0.2271, "lr": 3.941893755743859e-05, "epoch": 1.185226019845645, "percentage": 16.93, "elapsed_time": "4:24:38", "remaining_time": "21:38:19"}
|
| 431 |
+
{"current_steps": 2155, "total_steps": 12698, "loss": 0.2244, "lr": 3.9412340918057525e-05, "epoch": 1.1879823594266814, "percentage": 16.97, "elapsed_time": "4:24:50", "remaining_time": "21:35:41"}
|
| 432 |
+
{"current_steps": 2160, "total_steps": 12698, "loss": 0.2038, "lr": 3.9405707603084525e-05, "epoch": 1.1907386990077178, "percentage": 17.01, "elapsed_time": "4:25:02", "remaining_time": "21:33:01"}
|
| 433 |
+
{"current_steps": 2165, "total_steps": 12698, "loss": 0.2081, "lr": 3.939903762505186e-05, "epoch": 1.1934950385887542, "percentage": 17.05, "elapsed_time": "4:25:13", "remaining_time": "21:30:23"}
|
| 434 |
+
{"current_steps": 2170, "total_steps": 12698, "loss": 0.2137, "lr": 3.9392330996561064e-05, "epoch": 1.1962513781697905, "percentage": 17.09, "elapsed_time": "4:25:27", "remaining_time": "21:27:52"}
|
| 435 |
+
{"current_steps": 2175, "total_steps": 12698, "loss": 0.2286, "lr": 3.9385587730282936e-05, "epoch": 1.199007717750827, "percentage": 17.13, "elapsed_time": "4:25:39", "remaining_time": "21:25:18"}
|
| 436 |
+
{"current_steps": 2180, "total_steps": 12698, "loss": 0.2306, "lr": 3.937880783895746e-05, "epoch": 1.2017640573318633, "percentage": 17.17, "elapsed_time": "4:25:54", "remaining_time": "21:22:56"}
|
| 437 |
+
{"current_steps": 2185, "total_steps": 12698, "loss": 0.2117, "lr": 3.9371991335393846e-05, "epoch": 1.2045203969128997, "percentage": 17.21, "elapsed_time": "4:26:06", "remaining_time": "21:20:21"}
|
| 438 |
+
{"current_steps": 2190, "total_steps": 12698, "loss": 0.2233, "lr": 3.936513823247047e-05, "epoch": 1.207276736493936, "percentage": 17.25, "elapsed_time": "4:26:19", "remaining_time": "21:17:52"}
|
| 439 |
+
{"current_steps": 2195, "total_steps": 12698, "loss": 0.2237, "lr": 3.935824854313483e-05, "epoch": 1.2100330760749725, "percentage": 17.29, "elapsed_time": "4:26:33", "remaining_time": "21:15:29"}
|
| 440 |
+
{"current_steps": 2200, "total_steps": 12698, "loss": 0.2266, "lr": 3.935132228040357e-05, "epoch": 1.2127894156560088, "percentage": 17.33, "elapsed_time": "4:26:49", "remaining_time": "21:13:16"}
|
| 441 |
+
{"current_steps": 2205, "total_steps": 12698, "loss": 0.2183, "lr": 3.934435945736244e-05, "epoch": 1.2155457552370452, "percentage": 17.36, "elapsed_time": "4:27:02", "remaining_time": "21:10:46"}
|
| 442 |
+
{"current_steps": 2210, "total_steps": 12698, "loss": 0.2149, "lr": 3.933736008716624e-05, "epoch": 1.2183020948180816, "percentage": 17.4, "elapsed_time": "4:27:14", "remaining_time": "21:08:13"}
|
| 443 |
+
{"current_steps": 2215, "total_steps": 12698, "loss": 0.2147, "lr": 3.933032418303883e-05, "epoch": 1.221058434399118, "percentage": 17.44, "elapsed_time": "4:27:26", "remaining_time": "21:05:43"}
|
| 444 |
+
{"current_steps": 2220, "total_steps": 12698, "loss": 0.218, "lr": 3.932325175827309e-05, "epoch": 1.2238147739801544, "percentage": 17.48, "elapsed_time": "4:27:38", "remaining_time": "21:03:14"}
|
| 445 |
+
{"current_steps": 2225, "total_steps": 12698, "loss": 0.2197, "lr": 3.9316142826230905e-05, "epoch": 1.2265711135611908, "percentage": 17.52, "elapsed_time": "4:27:51", "remaining_time": "21:00:46"}
|
| 446 |
+
{"current_steps": 2230, "total_steps": 12698, "loss": 0.217, "lr": 3.9308997400343114e-05, "epoch": 1.2293274531422271, "percentage": 17.56, "elapsed_time": "4:28:06", "remaining_time": "20:58:31"}
|
| 447 |
+
{"current_steps": 2235, "total_steps": 12698, "loss": 0.2059, "lr": 3.930181549410954e-05, "epoch": 1.2320837927232635, "percentage": 17.6, "elapsed_time": "4:28:18", "remaining_time": "20:56:05"}
|
| 448 |
+
{"current_steps": 2240, "total_steps": 12698, "loss": 0.2098, "lr": 3.9294597121098884e-05, "epoch": 1.2348401323043, "percentage": 17.64, "elapsed_time": "4:28:30", "remaining_time": "20:53:36"}
|
| 449 |
+
{"current_steps": 2245, "total_steps": 12698, "loss": 0.2154, "lr": 3.928734229494878e-05, "epoch": 1.2375964718853363, "percentage": 17.68, "elapsed_time": "4:28:42", "remaining_time": "20:51:09"}
|
| 450 |
+
{"current_steps": 2250, "total_steps": 12698, "loss": 0.2202, "lr": 3.928005102936571e-05, "epoch": 1.2403528114663727, "percentage": 17.72, "elapsed_time": "4:28:55", "remaining_time": "20:48:44"}
|
| 451 |
+
{"current_steps": 2255, "total_steps": 12698, "loss": 0.2121, "lr": 3.9272723338125e-05, "epoch": 1.243109151047409, "percentage": 17.76, "elapsed_time": "4:29:07", "remaining_time": "20:46:19"}
|
| 452 |
+
{"current_steps": 2260, "total_steps": 12698, "loss": 0.2055, "lr": 3.926535923507081e-05, "epoch": 1.2458654906284454, "percentage": 17.8, "elapsed_time": "4:29:19", "remaining_time": "20:43:52"}
|
| 453 |
+
{"current_steps": 2265, "total_steps": 12698, "loss": 0.1972, "lr": 3.92579587341161e-05, "epoch": 1.2486218302094818, "percentage": 17.84, "elapsed_time": "4:29:31", "remaining_time": "20:41:26"}
|
| 454 |
+
{"current_steps": 2270, "total_steps": 12698, "loss": 0.2163, "lr": 3.9250521849242555e-05, "epoch": 1.2513781697905182, "percentage": 17.88, "elapsed_time": "4:29:43", "remaining_time": "20:39:04"}
|
| 455 |
+
{"current_steps": 2275, "total_steps": 12698, "loss": 0.2089, "lr": 3.9243048594500647e-05, "epoch": 1.2541345093715546, "percentage": 17.92, "elapsed_time": "4:29:55", "remaining_time": "20:36:40"}
|
| 456 |
+
{"current_steps": 2280, "total_steps": 12698, "loss": 0.2005, "lr": 3.923553898400953e-05, "epoch": 1.256890848952591, "percentage": 17.96, "elapsed_time": "4:30:07", "remaining_time": "20:34:18"}
|
| 457 |
+
{"current_steps": 2285, "total_steps": 12698, "loss": 0.215, "lr": 3.922799303195707e-05, "epoch": 1.2596471885336273, "percentage": 17.99, "elapsed_time": "4:30:20", "remaining_time": "20:31:57"}
|
| 458 |
+
{"current_steps": 2290, "total_steps": 12698, "loss": 0.2193, "lr": 3.922041075259975e-05, "epoch": 1.2624035281146637, "percentage": 18.03, "elapsed_time": "4:30:32", "remaining_time": "20:29:35"}
|
| 459 |
+
{"current_steps": 2295, "total_steps": 12698, "loss": 0.2016, "lr": 3.921279216026275e-05, "epoch": 1.2651598676957, "percentage": 18.07, "elapsed_time": "4:30:44", "remaining_time": "20:27:13"}
|
| 460 |
+
{"current_steps": 2300, "total_steps": 12698, "loss": 0.2171, "lr": 3.920513726933979e-05, "epoch": 1.2679162072767365, "percentage": 18.11, "elapsed_time": "4:30:58", "remaining_time": "20:25:01"}
|
| 461 |
+
{"current_steps": 2305, "total_steps": 12698, "loss": 0.2156, "lr": 3.919744609429321e-05, "epoch": 1.2706725468577729, "percentage": 18.15, "elapsed_time": "4:31:12", "remaining_time": "20:22:52"}
|
| 462 |
+
{"current_steps": 2310, "total_steps": 12698, "loss": 0.2254, "lr": 3.918971864965389e-05, "epoch": 1.2734288864388092, "percentage": 18.19, "elapsed_time": "4:31:25", "remaining_time": "20:20:37"}
|
| 463 |
+
{"current_steps": 2315, "total_steps": 12698, "loss": 0.2046, "lr": 3.9181954950021236e-05, "epoch": 1.2761852260198456, "percentage": 18.23, "elapsed_time": "4:31:38", "remaining_time": "20:18:21"}
|
| 464 |
+
{"current_steps": 2320, "total_steps": 12698, "loss": 0.212, "lr": 3.917415501006315e-05, "epoch": 1.278941565600882, "percentage": 18.27, "elapsed_time": "4:31:51", "remaining_time": "20:16:05"}
|
| 465 |
+
{"current_steps": 2325, "total_steps": 12698, "loss": 0.2073, "lr": 3.9166318844516e-05, "epoch": 1.2816979051819184, "percentage": 18.31, "elapsed_time": "4:32:03", "remaining_time": "20:13:46"}
|
| 466 |
+
{"current_steps": 2330, "total_steps": 12698, "loss": 0.1982, "lr": 3.915844646818459e-05, "epoch": 1.2844542447629548, "percentage": 18.35, "elapsed_time": "4:32:15", "remaining_time": "20:11:28"}
|
| 467 |
+
{"current_steps": 2335, "total_steps": 12698, "loss": 0.2052, "lr": 3.915053789594214e-05, "epoch": 1.2872105843439912, "percentage": 18.39, "elapsed_time": "4:32:26", "remaining_time": "20:09:09"}
|
| 468 |
+
{"current_steps": 2340, "total_steps": 12698, "loss": 0.2065, "lr": 3.914259314273027e-05, "epoch": 1.2899669239250275, "percentage": 18.43, "elapsed_time": "4:32:40", "remaining_time": "20:06:59"}
|
| 469 |
+
{"current_steps": 2345, "total_steps": 12698, "loss": 0.2062, "lr": 3.913461222355893e-05, "epoch": 1.292723263506064, "percentage": 18.47, "elapsed_time": "4:32:52", "remaining_time": "20:04:42"}
|
| 470 |
+
{"current_steps": 2350, "total_steps": 12698, "loss": 0.2109, "lr": 3.9126595153506424e-05, "epoch": 1.2954796030871003, "percentage": 18.51, "elapsed_time": "4:33:04", "remaining_time": "20:02:27"}
|
| 471 |
+
{"current_steps": 2355, "total_steps": 12698, "loss": 0.2026, "lr": 3.9118541947719334e-05, "epoch": 1.2982359426681367, "percentage": 18.55, "elapsed_time": "4:33:17", "remaining_time": "20:00:17"}
|
| 472 |
+
{"current_steps": 2360, "total_steps": 12698, "loss": 0.201, "lr": 3.911045262141252e-05, "epoch": 1.300992282249173, "percentage": 18.59, "elapsed_time": "4:33:30", "remaining_time": "19:58:04"}
|
| 473 |
+
{"current_steps": 2365, "total_steps": 12698, "loss": 0.2095, "lr": 3.910232718986909e-05, "epoch": 1.3037486218302095, "percentage": 18.62, "elapsed_time": "4:33:43", "remaining_time": "19:55:55"}
|
| 474 |
+
{"current_steps": 2370, "total_steps": 12698, "loss": 0.2013, "lr": 3.909416566844036e-05, "epoch": 1.3065049614112458, "percentage": 18.66, "elapsed_time": "4:33:55", "remaining_time": "19:53:41"}
|
| 475 |
+
{"current_steps": 2375, "total_steps": 12698, "loss": 0.2101, "lr": 3.908596807254585e-05, "epoch": 1.3092613009922822, "percentage": 18.7, "elapsed_time": "4:34:08", "remaining_time": "19:51:33"}
|
| 476 |
+
{"current_steps": 2380, "total_steps": 12698, "loss": 0.189, "lr": 3.9077734417673186e-05, "epoch": 1.3120176405733186, "percentage": 18.74, "elapsed_time": "4:34:19", "remaining_time": "19:49:18"}
|
| 477 |
+
{"current_steps": 2385, "total_steps": 12698, "loss": 0.2055, "lr": 3.906946471937817e-05, "epoch": 1.314773980154355, "percentage": 18.78, "elapsed_time": "4:34:33", "remaining_time": "19:47:11"}
|
| 478 |
+
{"current_steps": 2390, "total_steps": 12698, "loss": 0.2086, "lr": 3.906115899328468e-05, "epoch": 1.3175303197353914, "percentage": 18.82, "elapsed_time": "4:34:47", "remaining_time": "19:45:08"}
|
| 479 |
+
{"current_steps": 2395, "total_steps": 12698, "loss": 0.193, "lr": 3.905281725508466e-05, "epoch": 1.3202866593164277, "percentage": 18.86, "elapsed_time": "4:34:58", "remaining_time": "19:42:56"}
|
| 480 |
+
{"current_steps": 2400, "total_steps": 12698, "loss": 0.2054, "lr": 3.90444395205381e-05, "epoch": 1.3230429988974641, "percentage": 18.9, "elapsed_time": "4:35:10", "remaining_time": "19:40:43"}
|
| 481 |
+
{"current_steps": 2405, "total_steps": 12698, "loss": 0.2032, "lr": 3.9036025805472976e-05, "epoch": 1.3257993384785005, "percentage": 18.94, "elapsed_time": "4:35:22", "remaining_time": "19:38:33"}
|
| 482 |
+
{"current_steps": 2410, "total_steps": 12698, "loss": 0.2112, "lr": 3.902757612578528e-05, "epoch": 1.328555678059537, "percentage": 18.98, "elapsed_time": "4:35:35", "remaining_time": "19:36:27"}
|
| 483 |
+
{"current_steps": 2415, "total_steps": 12698, "loss": 0.207, "lr": 3.9019090497438916e-05, "epoch": 1.3313120176405733, "percentage": 19.02, "elapsed_time": "4:35:47", "remaining_time": "19:34:18"}
|
| 484 |
+
{"current_steps": 2420, "total_steps": 12698, "loss": 0.2003, "lr": 3.901056893646572e-05, "epoch": 1.3340683572216097, "percentage": 19.06, "elapsed_time": "4:35:59", "remaining_time": "19:32:08"}
|
| 485 |
+
{"current_steps": 2425, "total_steps": 12698, "loss": 0.2132, "lr": 3.900201145896541e-05, "epoch": 1.336824696802646, "percentage": 19.1, "elapsed_time": "4:36:11", "remaining_time": "19:30:01"}
|
| 486 |
+
{"current_steps": 2430, "total_steps": 12698, "loss": 0.2078, "lr": 3.899341808110558e-05, "epoch": 1.3395810363836824, "percentage": 19.14, "elapsed_time": "4:36:23", "remaining_time": "19:27:53"}
|
| 487 |
+
{"current_steps": 2435, "total_steps": 12698, "loss": 0.2112, "lr": 3.898478881912162e-05, "epoch": 1.3423373759647188, "percentage": 19.18, "elapsed_time": "4:36:35", "remaining_time": "19:25:48"}
|
| 488 |
+
{"current_steps": 2440, "total_steps": 12698, "loss": 0.2163, "lr": 3.897612368931674e-05, "epoch": 1.3450937155457552, "percentage": 19.22, "elapsed_time": "4:36:51", "remaining_time": "19:23:56"}
|
| 489 |
+
{"current_steps": 2445, "total_steps": 12698, "loss": 0.2114, "lr": 3.896742270806189e-05, "epoch": 1.3478500551267916, "percentage": 19.26, "elapsed_time": "4:37:03", "remaining_time": "19:21:51"}
|
| 490 |
+
{"current_steps": 2450, "total_steps": 12698, "loss": 0.199, "lr": 3.895868589179579e-05, "epoch": 1.350606394707828, "percentage": 19.29, "elapsed_time": "4:37:15", "remaining_time": "19:19:43"}
|
| 491 |
+
{"current_steps": 2455, "total_steps": 12698, "loss": 0.2092, "lr": 3.894991325702483e-05, "epoch": 1.3533627342888643, "percentage": 19.33, "elapsed_time": "4:37:27", "remaining_time": "19:17:40"}
|
| 492 |
+
{"current_steps": 2460, "total_steps": 12698, "loss": 0.2039, "lr": 3.894110482032309e-05, "epoch": 1.3561190738699007, "percentage": 19.37, "elapsed_time": "4:37:40", "remaining_time": "19:15:36"}
|
| 493 |
+
{"current_steps": 2465, "total_steps": 12698, "loss": 0.2015, "lr": 3.893226059833227e-05, "epoch": 1.358875413450937, "percentage": 19.41, "elapsed_time": "4:37:52", "remaining_time": "19:13:30"}
|
| 494 |
+
{"current_steps": 2470, "total_steps": 12698, "loss": 0.1917, "lr": 3.892338060776172e-05, "epoch": 1.3616317530319735, "percentage": 19.45, "elapsed_time": "4:38:04", "remaining_time": "19:11:28"}
|
| 495 |
+
{"current_steps": 2475, "total_steps": 12698, "loss": 0.1936, "lr": 3.891446486538831e-05, "epoch": 1.3643880926130099, "percentage": 19.49, "elapsed_time": "4:38:16", "remaining_time": "19:09:26"}
|
| 496 |
+
{"current_steps": 2480, "total_steps": 12698, "loss": 0.2097, "lr": 3.890551338805651e-05, "epoch": 1.3671444321940462, "percentage": 19.53, "elapsed_time": "4:38:29", "remaining_time": "19:07:24"}
|
| 497 |
+
{"current_steps": 2485, "total_steps": 12698, "loss": 0.2022, "lr": 3.8896526192678265e-05, "epoch": 1.3699007717750826, "percentage": 19.57, "elapsed_time": "4:38:41", "remaining_time": "19:05:21"}
|
| 498 |
+
{"current_steps": 2490, "total_steps": 12698, "loss": 0.1933, "lr": 3.8887503296233034e-05, "epoch": 1.372657111356119, "percentage": 19.61, "elapsed_time": "4:38:55", "remaining_time": "19:03:28"}
|
| 499 |
+
{"current_steps": 2495, "total_steps": 12698, "loss": 0.1908, "lr": 3.8878444715767686e-05, "epoch": 1.3754134509371554, "percentage": 19.65, "elapsed_time": "4:39:12", "remaining_time": "19:01:47"}
|
| 500 |
+
{"current_steps": 2500, "total_steps": 12698, "loss": 0.1871, "lr": 3.886935046839654e-05, "epoch": 1.3781697905181918, "percentage": 19.69, "elapsed_time": "4:39:24", "remaining_time": "18:59:46"}
|
| 501 |
+
{"current_steps": 2505, "total_steps": 12698, "loss": 0.2014, "lr": 3.886022057130129e-05, "epoch": 1.3809261300992282, "percentage": 19.73, "elapsed_time": "4:39:36", "remaining_time": "18:57:44"}
|
| 502 |
+
{"current_steps": 2510, "total_steps": 12698, "loss": 0.1997, "lr": 3.885105504173099e-05, "epoch": 1.3836824696802645, "percentage": 19.77, "elapsed_time": "4:39:49", "remaining_time": "18:55:48"}
|
| 503 |
+
{"current_steps": 2515, "total_steps": 12698, "loss": 0.2071, "lr": 3.8841853897002e-05, "epoch": 1.386438809261301, "percentage": 19.81, "elapsed_time": "4:40:03", "remaining_time": "18:53:55"}
|
| 504 |
+
{"current_steps": 2520, "total_steps": 12698, "loss": 0.1997, "lr": 3.8832617154497974e-05, "epoch": 1.3891951488423373, "percentage": 19.85, "elapsed_time": "4:40:15", "remaining_time": "18:51:56"}
|
| 505 |
+
{"current_steps": 2525, "total_steps": 12698, "loss": 0.202, "lr": 3.882334483166983e-05, "epoch": 1.3919514884233737, "percentage": 19.89, "elapsed_time": "4:40:27", "remaining_time": "18:49:57"}
|
| 506 |
+
{"current_steps": 2530, "total_steps": 12698, "loss": 0.2055, "lr": 3.881403694603567e-05, "epoch": 1.39470782800441, "percentage": 19.92, "elapsed_time": "4:40:39", "remaining_time": "18:47:58"}
|
| 507 |
+
{"current_steps": 2535, "total_steps": 12698, "loss": 0.297, "lr": 3.880469351518086e-05, "epoch": 1.3974641675854464, "percentage": 19.96, "elapsed_time": "4:41:21", "remaining_time": "18:47:58"}
|
| 508 |
+
{"current_steps": 2540, "total_steps": 12698, "loss": 0.3244, "lr": 3.8795314556757835e-05, "epoch": 1.4002205071664828, "percentage": 20.0, "elapsed_time": "4:41:59", "remaining_time": "18:47:46"}
|
| 509 |
+
{"current_steps": 2545, "total_steps": 12698, "loss": 0.3115, "lr": 3.878590008848621e-05, "epoch": 1.4029768467475192, "percentage": 20.04, "elapsed_time": "4:42:59", "remaining_time": "18:48:58"}
|
| 510 |
+
{"current_steps": 2550, "total_steps": 12698, "loss": 0.3116, "lr": 3.877645012815267e-05, "epoch": 1.4057331863285556, "percentage": 20.08, "elapsed_time": "4:43:51", "remaining_time": "18:49:39"}
|
| 511 |
+
{"current_steps": 2555, "total_steps": 12698, "loss": 0.3065, "lr": 3.8766964693610945e-05, "epoch": 1.4084895259095922, "percentage": 20.12, "elapsed_time": "4:44:44", "remaining_time": "18:50:22"}
|
| 512 |
+
{"current_steps": 2560, "total_steps": 12698, "loss": 0.3189, "lr": 3.875744380278181e-05, "epoch": 1.4112458654906286, "percentage": 20.16, "elapsed_time": "4:45:35", "remaining_time": "18:51:00"}
|
| 513 |
+
{"current_steps": 2565, "total_steps": 12698, "loss": 0.2981, "lr": 3.8747887473653004e-05, "epoch": 1.414002205071665, "percentage": 20.2, "elapsed_time": "4:46:30", "remaining_time": "18:51:50"}
|
| 514 |
+
{"current_steps": 2570, "total_steps": 12698, "loss": 0.3073, "lr": 3.8738295724279226e-05, "epoch": 1.4167585446527013, "percentage": 20.24, "elapsed_time": "4:47:16", "remaining_time": "18:52:08"}
|
| 515 |
+
{"current_steps": 2575, "total_steps": 12698, "loss": 0.3115, "lr": 3.8728668572782103e-05, "epoch": 1.4195148842337377, "percentage": 20.28, "elapsed_time": "4:48:13", "remaining_time": "18:53:05"}
|
| 516 |
+
{"current_steps": 2580, "total_steps": 12698, "loss": 0.3151, "lr": 3.871900603735015e-05, "epoch": 1.422271223814774, "percentage": 20.32, "elapsed_time": "4:49:00", "remaining_time": "18:53:24"}
|
| 517 |
+
{"current_steps": 2585, "total_steps": 12698, "loss": 0.3099, "lr": 3.870930813623871e-05, "epoch": 1.4250275633958105, "percentage": 20.36, "elapsed_time": "4:49:49", "remaining_time": "18:53:50"}
|
| 518 |
+
{"current_steps": 2590, "total_steps": 12698, "loss": 0.3055, "lr": 3.8699574887769953e-05, "epoch": 1.4277839029768469, "percentage": 20.4, "elapsed_time": "4:50:52", "remaining_time": "18:55:13"}
|
| 519 |
+
{"current_steps": 2595, "total_steps": 12698, "loss": 0.3122, "lr": 3.8689806310332855e-05, "epoch": 1.4305402425578833, "percentage": 20.44, "elapsed_time": "4:51:34", "remaining_time": "18:55:09"}
|
| 520 |
+
{"current_steps": 2600, "total_steps": 12698, "loss": 0.3027, "lr": 3.868000242238309e-05, "epoch": 1.4332965821389196, "percentage": 20.48, "elapsed_time": "4:52:18", "remaining_time": "18:55:15"}
|
| 521 |
+
{"current_steps": 2605, "total_steps": 12698, "loss": 0.3161, "lr": 3.867016324244308e-05, "epoch": 1.436052921719956, "percentage": 20.52, "elapsed_time": "4:52:46", "remaining_time": "18:54:19"}
|
| 522 |
+
{"current_steps": 2610, "total_steps": 12698, "loss": 0.3157, "lr": 3.8660288789101925e-05, "epoch": 1.4388092613009924, "percentage": 20.55, "elapsed_time": "4:53:11", "remaining_time": "18:53:14"}
|
| 523 |
+
{"current_steps": 2615, "total_steps": 12698, "loss": 0.3109, "lr": 3.865037908101535e-05, "epoch": 1.4415656008820288, "percentage": 20.59, "elapsed_time": "4:53:39", "remaining_time": "18:52:19"}
|
| 524 |
+
{"current_steps": 2620, "total_steps": 12698, "loss": 0.3225, "lr": 3.864043413690569e-05, "epoch": 1.4443219404630652, "percentage": 20.63, "elapsed_time": "4:54:05", "remaining_time": "18:51:14"}
|
| 525 |
+
{"current_steps": 2625, "total_steps": 12698, "loss": 0.3156, "lr": 3.8630453975561856e-05, "epoch": 1.4470782800441016, "percentage": 20.67, "elapsed_time": "4:54:29", "remaining_time": "18:50:02"}
|
| 526 |
+
{"current_steps": 2630, "total_steps": 12698, "loss": 0.3135, "lr": 3.8620438615839286e-05, "epoch": 1.449834619625138, "percentage": 20.71, "elapsed_time": "4:54:57", "remaining_time": "18:49:09"}
|
| 527 |
+
{"current_steps": 2635, "total_steps": 12698, "loss": 0.3163, "lr": 3.8610388076659944e-05, "epoch": 1.4525909592061743, "percentage": 20.75, "elapsed_time": "4:55:24", "remaining_time": "18:48:08"}
|
| 528 |
+
{"current_steps": 2640, "total_steps": 12698, "loss": 0.3034, "lr": 3.8600302377012226e-05, "epoch": 1.4553472987872107, "percentage": 20.79, "elapsed_time": "4:55:52", "remaining_time": "18:47:15"}
|
| 529 |
+
{"current_steps": 2645, "total_steps": 12698, "loss": 0.2816, "lr": 3.8590181535950966e-05, "epoch": 1.458103638368247, "percentage": 20.83, "elapsed_time": "4:56:21", "remaining_time": "18:46:23"}
|
| 530 |
+
{"current_steps": 2650, "total_steps": 12698, "loss": 0.3106, "lr": 3.858002557259741e-05, "epoch": 1.4608599779492835, "percentage": 20.87, "elapsed_time": "4:56:46", "remaining_time": "18:45:15"}
|
| 531 |
+
{"current_steps": 2655, "total_steps": 12698, "loss": 0.3106, "lr": 3.856983450613912e-05, "epoch": 1.4636163175303198, "percentage": 20.91, "elapsed_time": "4:57:11", "remaining_time": "18:44:11"}
|
| 532 |
+
{"current_steps": 2660, "total_steps": 12698, "loss": 0.3173, "lr": 3.855960835583003e-05, "epoch": 1.4663726571113562, "percentage": 20.95, "elapsed_time": "4:57:36", "remaining_time": "18:43:05"}
|
| 533 |
+
{"current_steps": 2665, "total_steps": 12698, "loss": 0.295, "lr": 3.854934714099031e-05, "epoch": 1.4691289966923926, "percentage": 20.99, "elapsed_time": "4:58:03", "remaining_time": "18:42:06"}
|
| 534 |
+
{"current_steps": 2670, "total_steps": 12698, "loss": 0.2937, "lr": 3.8539050881006404e-05, "epoch": 1.471885336273429, "percentage": 21.03, "elapsed_time": "4:58:29", "remaining_time": "18:41:04"}
|
| 535 |
+
{"current_steps": 2675, "total_steps": 12698, "loss": 0.3131, "lr": 3.852871959533096e-05, "epoch": 1.4746416758544654, "percentage": 21.07, "elapsed_time": "4:58:55", "remaining_time": "18:40:04"}
|
| 536 |
+
{"current_steps": 2680, "total_steps": 12698, "loss": 0.3032, "lr": 3.8518353303482796e-05, "epoch": 1.4773980154355018, "percentage": 21.11, "elapsed_time": "4:59:24", "remaining_time": "18:39:11"}
|
| 537 |
+
{"current_steps": 2685, "total_steps": 12698, "loss": 0.289, "lr": 3.850795202504688e-05, "epoch": 1.4801543550165381, "percentage": 21.15, "elapsed_time": "4:59:49", "remaining_time": "18:38:06"}
|
| 538 |
+
{"current_steps": 2690, "total_steps": 12698, "loss": 0.3064, "lr": 3.8497515779674254e-05, "epoch": 1.4829106945975745, "percentage": 21.18, "elapsed_time": "5:00:16", "remaining_time": "18:37:08"}
|
| 539 |
+
{"current_steps": 2695, "total_steps": 12698, "loss": 0.3046, "lr": 3.848704458708205e-05, "epoch": 1.485667034178611, "percentage": 21.22, "elapsed_time": "5:00:41", "remaining_time": "18:36:04"}
|
| 540 |
+
{"current_steps": 2700, "total_steps": 12698, "loss": 0.2956, "lr": 3.847653846705342e-05, "epoch": 1.4884233737596473, "percentage": 21.26, "elapsed_time": "5:01:10", "remaining_time": "18:35:12"}
|
| 541 |
+
{"current_steps": 2705, "total_steps": 12698, "loss": 0.3075, "lr": 3.846599743943749e-05, "epoch": 1.4911797133406837, "percentage": 21.3, "elapsed_time": "5:01:33", "remaining_time": "18:34:00"}
|
| 542 |
+
{"current_steps": 2710, "total_steps": 12698, "loss": 0.3074, "lr": 3.845542152414934e-05, "epoch": 1.49393605292172, "percentage": 21.34, "elapsed_time": "5:01:57", "remaining_time": "18:32:54"}
|
| 543 |
+
{"current_steps": 2715, "total_steps": 12698, "loss": 0.3022, "lr": 3.844481074116998e-05, "epoch": 1.4966923925027564, "percentage": 21.38, "elapsed_time": "5:02:25", "remaining_time": "18:32:01"}
|
| 544 |
+
{"current_steps": 2720, "total_steps": 12698, "loss": 0.2914, "lr": 3.8434165110546287e-05, "epoch": 1.4994487320837928, "percentage": 21.42, "elapsed_time": "5:02:52", "remaining_time": "18:31:03"}
|
| 545 |
+
{"current_steps": 2725, "total_steps": 12698, "loss": 0.3022, "lr": 3.842348465239096e-05, "epoch": 1.5022050716648292, "percentage": 21.46, "elapsed_time": "5:03:19", "remaining_time": "18:30:05"}
|
| 546 |
+
{"current_steps": 2730, "total_steps": 12698, "loss": 0.302, "lr": 3.841276938688251e-05, "epoch": 1.5049614112458656, "percentage": 21.5, "elapsed_time": "5:03:50", "remaining_time": "18:29:25"}
|
| 547 |
+
{"current_steps": 2735, "total_steps": 12698, "loss": 0.294, "lr": 3.8402019334265216e-05, "epoch": 1.507717750826902, "percentage": 21.54, "elapsed_time": "5:04:14", "remaining_time": "18:28:18"}
|
| 548 |
+
{"current_steps": 2740, "total_steps": 12698, "loss": 0.306, "lr": 3.839123451484907e-05, "epoch": 1.5104740904079383, "percentage": 21.58, "elapsed_time": "5:04:40", "remaining_time": "18:27:16"}
|
| 549 |
+
{"current_steps": 2745, "total_steps": 12698, "loss": 0.3002, "lr": 3.838041494900975e-05, "epoch": 1.5132304299889747, "percentage": 21.62, "elapsed_time": "5:05:09", "remaining_time": "18:26:26"}
|
| 550 |
+
{"current_steps": 2750, "total_steps": 12698, "loss": 0.2898, "lr": 3.836956065718859e-05, "epoch": 1.515986769570011, "percentage": 21.66, "elapsed_time": "5:05:38", "remaining_time": "18:25:39"}
|
| 551 |
+
{"current_steps": 2755, "total_steps": 12698, "loss": 0.2849, "lr": 3.8358671659892507e-05, "epoch": 1.5187431091510475, "percentage": 21.7, "elapsed_time": "5:06:03", "remaining_time": "18:24:36"}
|
| 552 |
+
{"current_steps": 2760, "total_steps": 12698, "loss": 0.3127, "lr": 3.8347747977694014e-05, "epoch": 1.5214994487320839, "percentage": 21.74, "elapsed_time": "5:06:30", "remaining_time": "18:23:37"}
|
| 553 |
+
{"current_steps": 2765, "total_steps": 12698, "loss": 0.2934, "lr": 3.8336789631231136e-05, "epoch": 1.5242557883131203, "percentage": 21.78, "elapsed_time": "5:06:59", "remaining_time": "18:22:48"}
|
| 554 |
+
{"current_steps": 2770, "total_steps": 12698, "loss": 0.3024, "lr": 3.832579664120741e-05, "epoch": 1.5270121278941566, "percentage": 21.81, "elapsed_time": "5:07:23", "remaining_time": "18:21:43"}
|
| 555 |
+
{"current_steps": 2775, "total_steps": 12698, "loss": 0.3063, "lr": 3.83147690283918e-05, "epoch": 1.529768467475193, "percentage": 21.85, "elapsed_time": "5:07:51", "remaining_time": "18:20:49"}
|
| 556 |
+
{"current_steps": 2780, "total_steps": 12698, "loss": 0.2975, "lr": 3.830370681361869e-05, "epoch": 1.5325248070562294, "percentage": 21.89, "elapsed_time": "5:08:18", "remaining_time": "18:19:54"}
|
| 557 |
+
{"current_steps": 2785, "total_steps": 12698, "loss": 0.2969, "lr": 3.829261001778785e-05, "epoch": 1.5352811466372658, "percentage": 21.93, "elapsed_time": "5:08:46", "remaining_time": "18:19:05"}
|
| 558 |
+
{"current_steps": 2790, "total_steps": 12698, "loss": 0.3089, "lr": 3.8281478661864365e-05, "epoch": 1.5380374862183022, "percentage": 21.97, "elapsed_time": "5:09:12", "remaining_time": "18:18:03"}
|
| 559 |
+
{"current_steps": 2795, "total_steps": 12698, "loss": 0.2845, "lr": 3.8270312766878624e-05, "epoch": 1.5407938257993385, "percentage": 22.01, "elapsed_time": "5:09:40", "remaining_time": "18:17:13"}
|
| 560 |
+
{"current_steps": 2800, "total_steps": 12698, "loss": 0.2849, "lr": 3.825911235392628e-05, "epoch": 1.543550165380375, "percentage": 22.05, "elapsed_time": "5:10:06", "remaining_time": "18:16:14"}
|
| 561 |
+
{"current_steps": 2805, "total_steps": 12698, "loss": 0.2826, "lr": 3.824787744416818e-05, "epoch": 1.5463065049614113, "percentage": 22.09, "elapsed_time": "5:10:31", "remaining_time": "18:15:12"}
|
| 562 |
+
{"current_steps": 2810, "total_steps": 12698, "loss": 0.2961, "lr": 3.823660805883036e-05, "epoch": 1.5490628445424477, "percentage": 22.13, "elapsed_time": "5:11:00", "remaining_time": "18:14:24"}
|
| 563 |
+
{"current_steps": 2815, "total_steps": 12698, "loss": 0.2976, "lr": 3.822530421920399e-05, "epoch": 1.551819184123484, "percentage": 22.17, "elapsed_time": "5:11:27", "remaining_time": "18:13:28"}
|
| 564 |
+
{"current_steps": 2820, "total_steps": 12698, "loss": 0.2963, "lr": 3.8213965946645324e-05, "epoch": 1.5545755237045205, "percentage": 22.21, "elapsed_time": "5:12:00", "remaining_time": "18:12:54"}
|
| 565 |
+
{"current_steps": 2825, "total_steps": 12698, "loss": 0.294, "lr": 3.8202593262575674e-05, "epoch": 1.5573318632855568, "percentage": 22.25, "elapsed_time": "5:12:30", "remaining_time": "18:12:11"}
|
| 566 |
+
{"current_steps": 2830, "total_steps": 12698, "loss": 0.3003, "lr": 3.819118618848137e-05, "epoch": 1.5600882028665932, "percentage": 22.29, "elapsed_time": "5:12:59", "remaining_time": "18:11:23"}
|
| 567 |
+
{"current_steps": 2835, "total_steps": 12698, "loss": 0.3015, "lr": 3.8179744745913724e-05, "epoch": 1.5628445424476296, "percentage": 22.33, "elapsed_time": "5:13:26", "remaining_time": "18:10:28"}
|
| 568 |
+
{"current_steps": 2840, "total_steps": 12698, "loss": 0.2973, "lr": 3.816826895648895e-05, "epoch": 1.565600882028666, "percentage": 22.37, "elapsed_time": "5:13:52", "remaining_time": "18:09:30"}
|
| 569 |
+
{"current_steps": 2845, "total_steps": 12698, "loss": 0.2855, "lr": 3.815675884188818e-05, "epoch": 1.5683572216097024, "percentage": 22.41, "elapsed_time": "5:14:21", "remaining_time": "18:08:41"}
|
| 570 |
+
{"current_steps": 2850, "total_steps": 12698, "loss": 0.2796, "lr": 3.81452144238574e-05, "epoch": 1.5711135611907387, "percentage": 22.44, "elapsed_time": "5:14:46", "remaining_time": "18:07:40"}
|
| 571 |
+
{"current_steps": 2855, "total_steps": 12698, "loss": 0.2873, "lr": 3.813363572420738e-05, "epoch": 1.5738699007717751, "percentage": 22.48, "elapsed_time": "5:15:11", "remaining_time": "18:06:39"}
|
| 572 |
+
{"current_steps": 2860, "total_steps": 12698, "loss": 0.2779, "lr": 3.8122022764813674e-05, "epoch": 1.5766262403528115, "percentage": 22.52, "elapsed_time": "5:15:39", "remaining_time": "18:05:48"}
|
| 573 |
+
{"current_steps": 2865, "total_steps": 12698, "loss": 0.2779, "lr": 3.811037556761656e-05, "epoch": 1.579382579933848, "percentage": 22.56, "elapsed_time": "5:16:06", "remaining_time": "18:04:53"}
|
| 574 |
+
{"current_steps": 2870, "total_steps": 12698, "loss": 0.2801, "lr": 3.8098694154621004e-05, "epoch": 1.5821389195148843, "percentage": 22.6, "elapsed_time": "5:16:32", "remaining_time": "18:03:58"}
|
| 575 |
+
{"current_steps": 2875, "total_steps": 12698, "loss": 0.2931, "lr": 3.808697854789661e-05, "epoch": 1.5848952590959207, "percentage": 22.64, "elapsed_time": "5:16:57", "remaining_time": "18:02:57"}
|
| 576 |
+
{"current_steps": 2880, "total_steps": 12698, "loss": 0.3086, "lr": 3.8075228769577586e-05, "epoch": 1.587651598676957, "percentage": 22.68, "elapsed_time": "5:17:24", "remaining_time": "18:02:02"}
|
| 577 |
+
{"current_steps": 2885, "total_steps": 12698, "loss": 0.2871, "lr": 3.806344484186271e-05, "epoch": 1.5904079382579934, "percentage": 22.72, "elapsed_time": "5:17:48", "remaining_time": "18:00:58"}
|
| 578 |
+
{"current_steps": 2890, "total_steps": 12698, "loss": 0.2917, "lr": 3.805162678701526e-05, "epoch": 1.5931642778390298, "percentage": 22.76, "elapsed_time": "5:18:16", "remaining_time": "18:00:08"}
|
| 579 |
+
{"current_steps": 2895, "total_steps": 12698, "loss": 0.2814, "lr": 3.8039774627363e-05, "epoch": 1.5959206174200662, "percentage": 22.8, "elapsed_time": "5:18:44", "remaining_time": "17:59:19"}
|
| 580 |
+
{"current_steps": 2900, "total_steps": 12698, "loss": 0.2811, "lr": 3.802788838529813e-05, "epoch": 1.5986769570011026, "percentage": 22.84, "elapsed_time": "5:19:14", "remaining_time": "17:58:34"}
|
| 581 |
+
{"current_steps": 2905, "total_steps": 12698, "loss": 0.2876, "lr": 3.801596808327724e-05, "epoch": 1.601433296582139, "percentage": 22.88, "elapsed_time": "5:19:42", "remaining_time": "17:57:46"}
|
| 582 |
+
{"current_steps": 2910, "total_steps": 12698, "loss": 0.2769, "lr": 3.800401374382127e-05, "epoch": 1.6041896361631753, "percentage": 22.92, "elapsed_time": "5:20:11", "remaining_time": "17:56:59"}
|
| 583 |
+
{"current_steps": 2915, "total_steps": 12698, "loss": 0.2908, "lr": 3.799202538951546e-05, "epoch": 1.6069459757442117, "percentage": 22.96, "elapsed_time": "5:20:35", "remaining_time": "17:55:55"}
|
| 584 |
+
{"current_steps": 2920, "total_steps": 12698, "loss": 0.2839, "lr": 3.798000304300932e-05, "epoch": 1.609702315325248, "percentage": 23.0, "elapsed_time": "5:21:03", "remaining_time": "17:55:06"}
|
| 585 |
+
{"current_steps": 2925, "total_steps": 12698, "loss": 0.2953, "lr": 3.796794672701658e-05, "epoch": 1.6124586549062845, "percentage": 23.04, "elapsed_time": "5:21:31", "remaining_time": "17:54:15"}
|
| 586 |
+
{"current_steps": 2930, "total_steps": 12698, "loss": 0.3019, "lr": 3.795585646431516e-05, "epoch": 1.6152149944873209, "percentage": 23.07, "elapsed_time": "5:21:57", "remaining_time": "17:53:20"}
|
| 587 |
+
{"current_steps": 2935, "total_steps": 12698, "loss": 0.2938, "lr": 3.794373227774708e-05, "epoch": 1.6179713340683572, "percentage": 23.11, "elapsed_time": "5:22:24", "remaining_time": "17:52:28"}
|
| 588 |
+
{"current_steps": 2940, "total_steps": 12698, "loss": 0.3136, "lr": 3.7931574190218504e-05, "epoch": 1.6207276736493936, "percentage": 23.15, "elapsed_time": "5:22:50", "remaining_time": "17:51:31"}
|
| 589 |
+
{"current_steps": 2945, "total_steps": 12698, "loss": 0.2844, "lr": 3.791938222469959e-05, "epoch": 1.62348401323043, "percentage": 23.19, "elapsed_time": "5:23:14", "remaining_time": "17:50:29"}
|
| 590 |
+
{"current_steps": 2950, "total_steps": 12698, "loss": 0.3036, "lr": 3.790715640422455e-05, "epoch": 1.6262403528114664, "percentage": 23.23, "elapsed_time": "5:23:44", "remaining_time": "17:49:45"}
|
| 591 |
+
{"current_steps": 2955, "total_steps": 12698, "loss": 0.3073, "lr": 3.789489675189152e-05, "epoch": 1.6289966923925028, "percentage": 23.27, "elapsed_time": "5:24:11", "remaining_time": "17:48:54"}
|
| 592 |
+
{"current_steps": 2960, "total_steps": 12698, "loss": 0.2862, "lr": 3.788260329086258e-05, "epoch": 1.6317530319735392, "percentage": 23.31, "elapsed_time": "5:24:37", "remaining_time": "17:47:58"}
|
| 593 |
+
{"current_steps": 2965, "total_steps": 12698, "loss": 0.2918, "lr": 3.787027604436367e-05, "epoch": 1.6345093715545755, "percentage": 23.35, "elapsed_time": "5:25:08", "remaining_time": "17:47:18"}
|
| 594 |
+
{"current_steps": 2970, "total_steps": 12698, "loss": 0.2943, "lr": 3.785791503568457e-05, "epoch": 1.637265711135612, "percentage": 23.39, "elapsed_time": "5:25:34", "remaining_time": "17:46:23"}
|
| 595 |
+
{"current_steps": 2975, "total_steps": 12698, "loss": 0.2978, "lr": 3.784552028817884e-05, "epoch": 1.6400220507166483, "percentage": 23.43, "elapsed_time": "5:25:58", "remaining_time": "17:45:21"}
|
| 596 |
+
{"current_steps": 2980, "total_steps": 12698, "loss": 0.2995, "lr": 3.7833091825263785e-05, "epoch": 1.6427783902976847, "percentage": 23.47, "elapsed_time": "5:26:24", "remaining_time": "17:44:25"}
|
| 597 |
+
{"current_steps": 2985, "total_steps": 12698, "loss": 0.2731, "lr": 3.7820629670420406e-05, "epoch": 1.645534729878721, "percentage": 23.51, "elapsed_time": "5:26:51", "remaining_time": "17:43:34"}
|
| 598 |
+
{"current_steps": 2990, "total_steps": 12698, "loss": 0.2794, "lr": 3.780813384719336e-05, "epoch": 1.6482910694597575, "percentage": 23.55, "elapsed_time": "5:27:22", "remaining_time": "17:42:54"}
|
| 599 |
+
{"current_steps": 2995, "total_steps": 12698, "loss": 0.2835, "lr": 3.779560437919091e-05, "epoch": 1.6510474090407938, "percentage": 23.59, "elapsed_time": "5:27:50", "remaining_time": "17:42:07"}
|
| 600 |
+
{"current_steps": 3000, "total_steps": 12698, "loss": 0.2827, "lr": 3.7783041290084904e-05, "epoch": 1.6538037486218302, "percentage": 23.63, "elapsed_time": "5:28:18", "remaining_time": "17:41:17"}
|
| 601 |
+
{"current_steps": 3005, "total_steps": 12698, "loss": 0.2812, "lr": 3.777044460361067e-05, "epoch": 1.6565600882028666, "percentage": 23.67, "elapsed_time": "5:29:24", "remaining_time": "17:42:32"}
|
| 602 |
+
{"current_steps": 3010, "total_steps": 12698, "loss": 0.2936, "lr": 3.775781434356705e-05, "epoch": 1.659316427783903, "percentage": 23.7, "elapsed_time": "5:29:49", "remaining_time": "17:41:33"}
|
| 603 |
+
{"current_steps": 3015, "total_steps": 12698, "loss": 0.2805, "lr": 3.77451505338163e-05, "epoch": 1.6620727673649394, "percentage": 23.74, "elapsed_time": "5:30:16", "remaining_time": "17:40:42"}
|
| 604 |
+
{"current_steps": 3020, "total_steps": 12698, "loss": 0.2923, "lr": 3.773245319828405e-05, "epoch": 1.6648291069459757, "percentage": 23.78, "elapsed_time": "5:30:39", "remaining_time": "17:39:36"}
|
| 605 |
+
{"current_steps": 3025, "total_steps": 12698, "loss": 0.2854, "lr": 3.771972236095929e-05, "epoch": 1.6675854465270121, "percentage": 23.82, "elapsed_time": "5:31:10", "remaining_time": "17:39:00"}
|
| 606 |
+
{"current_steps": 3030, "total_steps": 12698, "loss": 0.2751, "lr": 3.77069580458943e-05, "epoch": 1.6703417861080485, "percentage": 23.86, "elapsed_time": "5:31:44", "remaining_time": "17:38:31"}
|
| 607 |
+
{"current_steps": 3035, "total_steps": 12698, "loss": 0.2671, "lr": 3.76941602772046e-05, "epoch": 1.673098125689085, "percentage": 23.9, "elapsed_time": "5:32:13", "remaining_time": "17:37:46"}
|
| 608 |
+
{"current_steps": 3040, "total_steps": 12698, "loss": 0.2749, "lr": 3.768132907906893e-05, "epoch": 1.6758544652701213, "percentage": 23.94, "elapsed_time": "5:32:41", "remaining_time": "17:36:56"}
|
| 609 |
+
{"current_steps": 3045, "total_steps": 12698, "loss": 0.2769, "lr": 3.766846447572916e-05, "epoch": 1.6786108048511577, "percentage": 23.98, "elapsed_time": "5:33:08", "remaining_time": "17:36:05"}
|
| 610 |
+
{"current_steps": 3050, "total_steps": 12698, "loss": 0.2738, "lr": 3.765556649149031e-05, "epoch": 1.681367144432194, "percentage": 24.02, "elapsed_time": "5:33:37", "remaining_time": "17:35:20"}
|
| 611 |
+
{"current_steps": 3055, "total_steps": 12698, "loss": 0.268, "lr": 3.7642635150720426e-05, "epoch": 1.6841234840132304, "percentage": 24.06, "elapsed_time": "5:34:04", "remaining_time": "17:34:28"}
|
| 612 |
+
{"current_steps": 3060, "total_steps": 12698, "loss": 0.2744, "lr": 3.7629670477850616e-05, "epoch": 1.6868798235942668, "percentage": 24.1, "elapsed_time": "5:34:28", "remaining_time": "17:33:30"}
|
| 613 |
+
{"current_steps": 3065, "total_steps": 12698, "loss": 0.2775, "lr": 3.761667249737491e-05, "epoch": 1.6896361631753032, "percentage": 24.14, "elapsed_time": "5:34:56", "remaining_time": "17:32:41"}
|
| 614 |
+
{"current_steps": 3070, "total_steps": 12698, "loss": 0.2993, "lr": 3.760364123385033e-05, "epoch": 1.6923925027563396, "percentage": 24.18, "elapsed_time": "5:35:22", "remaining_time": "17:31:47"}
|
| 615 |
+
{"current_steps": 3075, "total_steps": 12698, "loss": 0.2811, "lr": 3.759057671189673e-05, "epoch": 1.695148842337376, "percentage": 24.22, "elapsed_time": "5:35:44", "remaining_time": "17:30:41"}
|
| 616 |
+
{"current_steps": 3080, "total_steps": 12698, "loss": 0.2815, "lr": 3.757747895619681e-05, "epoch": 1.6979051819184123, "percentage": 24.26, "elapsed_time": "5:36:14", "remaining_time": "17:29:59"}
|
| 617 |
+
{"current_steps": 3085, "total_steps": 12698, "loss": 0.2713, "lr": 3.756434799149607e-05, "epoch": 1.7006615214994487, "percentage": 24.3, "elapsed_time": "5:36:39", "remaining_time": "17:29:03"}
|
| 618 |
+
{"current_steps": 3090, "total_steps": 12698, "loss": 0.2783, "lr": 3.7551183842602735e-05, "epoch": 1.703417861080485, "percentage": 24.33, "elapsed_time": "5:37:04", "remaining_time": "17:28:07"}
|
| 619 |
+
{"current_steps": 3095, "total_steps": 12698, "loss": 0.2862, "lr": 3.7537986534387754e-05, "epoch": 1.7061742006615215, "percentage": 24.37, "elapsed_time": "5:37:31", "remaining_time": "17:27:13"}
|
| 620 |
+
{"current_steps": 3100, "total_steps": 12698, "loss": 0.2874, "lr": 3.752475609178468e-05, "epoch": 1.7089305402425579, "percentage": 24.41, "elapsed_time": "5:37:57", "remaining_time": "17:26:22"}
|
| 621 |
+
{"current_steps": 3105, "total_steps": 12698, "loss": 0.279, "lr": 3.75114925397897e-05, "epoch": 1.7116868798235942, "percentage": 24.45, "elapsed_time": "5:38:24", "remaining_time": "17:25:32"}
|
| 622 |
+
{"current_steps": 3110, "total_steps": 12698, "loss": 0.2797, "lr": 3.7498195903461556e-05, "epoch": 1.7144432194046306, "percentage": 24.49, "elapsed_time": "5:38:50", "remaining_time": "17:24:37"}
|
| 623 |
+
{"current_steps": 3115, "total_steps": 12698, "loss": 0.2781, "lr": 3.748486620792147e-05, "epoch": 1.717199558985667, "percentage": 24.53, "elapsed_time": "5:39:18", "remaining_time": "17:23:49"}
|
| 624 |
+
{"current_steps": 3120, "total_steps": 12698, "loss": 0.2231, "lr": 3.747150347835314e-05, "epoch": 1.7199558985667034, "percentage": 24.57, "elapsed_time": "5:39:51", "remaining_time": "17:23:19"}
|
| 625 |
+
{"current_steps": 3125, "total_steps": 12698, "loss": 0.133, "lr": 3.7458107740002676e-05, "epoch": 1.7227122381477398, "percentage": 24.61, "elapsed_time": "5:40:15", "remaining_time": "17:22:21"}
|
| 626 |
+
{"current_steps": 3130, "total_steps": 12698, "loss": 0.1167, "lr": 3.744467901817854e-05, "epoch": 1.7254685777287762, "percentage": 24.65, "elapsed_time": "5:40:44", "remaining_time": "17:21:34"}
|