Training in progress, step 4500
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcbeae55e12d31142d58bbf3cad7e6aa3064922c8b634d0ed6e76ecac3d52d76
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45e29dbfca521f0fb191fb64ed560cc5872176b662af6406a7d35bfb228c768f
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:377a73758c3fb91f05bced440552c6f1306305cba4a7fb20b2090ae7ca3b2de1
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3c3868e255453f358e9bad3a0807092ac91effd0fba4bc57e6b7372329207c7
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -624,3 +624,322 @@
|
|
| 624 |
{"current_steps": 3120, "total_steps": 12698, "loss": 0.2231, "lr": 3.747150347835314e-05, "epoch": 1.7199558985667034, "percentage": 24.57, "elapsed_time": "5:39:51", "remaining_time": "17:23:19"}
|
| 625 |
{"current_steps": 3125, "total_steps": 12698, "loss": 0.133, "lr": 3.7458107740002676e-05, "epoch": 1.7227122381477398, "percentage": 24.61, "elapsed_time": "5:40:15", "remaining_time": "17:22:21"}
|
| 626 |
{"current_steps": 3130, "total_steps": 12698, "loss": 0.1167, "lr": 3.744467901817854e-05, "epoch": 1.7254685777287762, "percentage": 24.65, "elapsed_time": "5:40:44", "remaining_time": "17:21:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 624 |
{"current_steps": 3120, "total_steps": 12698, "loss": 0.2231, "lr": 3.747150347835314e-05, "epoch": 1.7199558985667034, "percentage": 24.57, "elapsed_time": "5:39:51", "remaining_time": "17:23:19"}
|
| 625 |
{"current_steps": 3125, "total_steps": 12698, "loss": 0.133, "lr": 3.7458107740002676e-05, "epoch": 1.7227122381477398, "percentage": 24.61, "elapsed_time": "5:40:15", "remaining_time": "17:22:21"}
|
| 626 |
{"current_steps": 3130, "total_steps": 12698, "loss": 0.1167, "lr": 3.744467901817854e-05, "epoch": 1.7254685777287762, "percentage": 24.65, "elapsed_time": "5:40:44", "remaining_time": "17:21:34"}
|
| 627 |
+
{"current_steps": 3135, "total_steps": 12698, "loss": 0.1204, "lr": 3.743121733825152e-05, "epoch": 1.7282249173098125, "percentage": 24.69, "elapsed_time": "5:41:06", "remaining_time": "17:20:30"}
|
| 628 |
+
{"current_steps": 3140, "total_steps": 12698, "loss": 0.105, "lr": 3.741772272565468e-05, "epoch": 1.730981256890849, "percentage": 24.73, "elapsed_time": "5:41:29", "remaining_time": "17:19:29"}
|
| 629 |
+
{"current_steps": 3145, "total_steps": 12698, "loss": 0.1193, "lr": 3.7404195205883274e-05, "epoch": 1.7337375964718853, "percentage": 24.77, "elapsed_time": "5:41:59", "remaining_time": "17:18:47"}
|
| 630 |
+
{"current_steps": 3150, "total_steps": 12698, "loss": 0.1682, "lr": 3.7390634804494757e-05, "epoch": 1.7364939360529217, "percentage": 24.81, "elapsed_time": "5:42:24", "remaining_time": "17:17:53"}
|
| 631 |
+
{"current_steps": 3155, "total_steps": 12698, "loss": 0.1304, "lr": 3.737704154710868e-05, "epoch": 1.739250275633958, "percentage": 24.85, "elapsed_time": "5:42:51", "remaining_time": "17:17:03"}
|
| 632 |
+
{"current_steps": 3160, "total_steps": 12698, "loss": 0.1259, "lr": 3.73634154594067e-05, "epoch": 1.7420066152149944, "percentage": 24.89, "elapsed_time": "5:43:16", "remaining_time": "17:16:06"}
|
| 633 |
+
{"current_steps": 3165, "total_steps": 12698, "loss": 0.1581, "lr": 3.734975656713248e-05, "epoch": 1.7447629547960308, "percentage": 24.93, "elapsed_time": "5:44:14", "remaining_time": "17:16:50"}
|
| 634 |
+
{"current_steps": 3170, "total_steps": 12698, "loss": 0.0969, "lr": 3.733606489609166e-05, "epoch": 1.7475192943770672, "percentage": 24.96, "elapsed_time": "5:44:45", "remaining_time": "17:16:14"}
|
| 635 |
+
{"current_steps": 3175, "total_steps": 12698, "loss": 0.1108, "lr": 3.732234047215181e-05, "epoch": 1.7502756339581036, "percentage": 25.0, "elapsed_time": "5:45:22", "remaining_time": "17:15:54"}
|
| 636 |
+
{"current_steps": 3180, "total_steps": 12698, "loss": 0.1102, "lr": 3.730858332124239e-05, "epoch": 1.75303197353914, "percentage": 25.04, "elapsed_time": "5:45:57", "remaining_time": "17:15:28"}
|
| 637 |
+
{"current_steps": 3185, "total_steps": 12698, "loss": 0.1635, "lr": 3.729479346935468e-05, "epoch": 1.7557883131201764, "percentage": 25.08, "elapsed_time": "5:46:30", "remaining_time": "17:14:57"}
|
| 638 |
+
{"current_steps": 3190, "total_steps": 12698, "loss": 0.1039, "lr": 3.728097094254174e-05, "epoch": 1.7585446527012127, "percentage": 25.12, "elapsed_time": "5:46:53", "remaining_time": "17:13:55"}
|
| 639 |
+
{"current_steps": 3195, "total_steps": 12698, "loss": 0.1191, "lr": 3.726711576691838e-05, "epoch": 1.7613009922822491, "percentage": 25.16, "elapsed_time": "5:47:23", "remaining_time": "17:13:14"}
|
| 640 |
+
{"current_steps": 3200, "total_steps": 12698, "loss": 0.0992, "lr": 3.725322796866106e-05, "epoch": 1.7640573318632855, "percentage": 25.2, "elapsed_time": "5:47:45", "remaining_time": "17:12:11"}
|
| 641 |
+
{"current_steps": 3205, "total_steps": 12698, "loss": 0.1158, "lr": 3.7239307574007916e-05, "epoch": 1.7668136714443219, "percentage": 25.24, "elapsed_time": "5:48:08", "remaining_time": "17:11:10"}
|
| 642 |
+
{"current_steps": 3210, "total_steps": 12698, "loss": 0.1218, "lr": 3.722535460925864e-05, "epoch": 1.7695700110253583, "percentage": 25.28, "elapsed_time": "5:48:34", "remaining_time": "17:10:19"}
|
| 643 |
+
{"current_steps": 3215, "total_steps": 12698, "loss": 0.1291, "lr": 3.721136910077446e-05, "epoch": 1.7723263506063947, "percentage": 25.32, "elapsed_time": "5:49:08", "remaining_time": "17:09:48"}
|
| 644 |
+
{"current_steps": 3220, "total_steps": 12698, "loss": 0.1266, "lr": 3.71973510749781e-05, "epoch": 1.775082690187431, "percentage": 25.36, "elapsed_time": "5:49:29", "remaining_time": "17:08:44"}
|
| 645 |
+
{"current_steps": 3225, "total_steps": 12698, "loss": 0.1645, "lr": 3.7183300558353704e-05, "epoch": 1.7778390297684674, "percentage": 25.4, "elapsed_time": "5:50:08", "remaining_time": "17:08:29"}
|
| 646 |
+
{"current_steps": 3230, "total_steps": 12698, "loss": 0.108, "lr": 3.716921757744682e-05, "epoch": 1.7805953693495038, "percentage": 25.44, "elapsed_time": "5:50:30", "remaining_time": "17:07:25"}
|
| 647 |
+
{"current_steps": 3235, "total_steps": 12698, "loss": 0.118, "lr": 3.715510215886431e-05, "epoch": 1.7833517089305402, "percentage": 25.48, "elapsed_time": "5:50:50", "remaining_time": "17:06:17"}
|
| 648 |
+
{"current_steps": 3240, "total_steps": 12698, "loss": 0.1561, "lr": 3.714095432927433e-05, "epoch": 1.7861080485115766, "percentage": 25.52, "elapsed_time": "5:51:16", "remaining_time": "17:05:25"}
|
| 649 |
+
{"current_steps": 3245, "total_steps": 12698, "loss": 0.1365, "lr": 3.712677411540627e-05, "epoch": 1.788864388092613, "percentage": 25.56, "elapsed_time": "5:51:53", "remaining_time": "17:05:05"}
|
| 650 |
+
{"current_steps": 3250, "total_steps": 12698, "loss": 0.1482, "lr": 3.711256154405071e-05, "epoch": 1.7916207276736493, "percentage": 25.59, "elapsed_time": "5:52:25", "remaining_time": "17:04:31"}
|
| 651 |
+
{"current_steps": 3255, "total_steps": 12698, "loss": 0.2978, "lr": 3.709831664205935e-05, "epoch": 1.7943770672546857, "percentage": 25.63, "elapsed_time": "5:53:12", "remaining_time": "17:04:41"}
|
| 652 |
+
{"current_steps": 3260, "total_steps": 12698, "loss": 0.1304, "lr": 3.708403943634499e-05, "epoch": 1.797133406835722, "percentage": 25.67, "elapsed_time": "5:53:44", "remaining_time": "17:04:06"}
|
| 653 |
+
{"current_steps": 3265, "total_steps": 12698, "loss": 0.1279, "lr": 3.706972995388143e-05, "epoch": 1.7998897464167585, "percentage": 25.71, "elapsed_time": "5:54:10", "remaining_time": "17:03:14"}
|
| 654 |
+
{"current_steps": 3270, "total_steps": 12698, "loss": 0.2233, "lr": 3.705538822170348e-05, "epoch": 1.8026460859977949, "percentage": 25.75, "elapsed_time": "5:55:03", "remaining_time": "17:03:42"}
|
| 655 |
+
{"current_steps": 3275, "total_steps": 12698, "loss": 0.0934, "lr": 3.704101426690686e-05, "epoch": 1.8054024255788312, "percentage": 25.79, "elapsed_time": "5:55:31", "remaining_time": "17:02:56"}
|
| 656 |
+
{"current_steps": 3280, "total_steps": 12698, "loss": 0.1266, "lr": 3.702660811664819e-05, "epoch": 1.8081587651598676, "percentage": 25.83, "elapsed_time": "5:56:05", "remaining_time": "17:02:28"}
|
| 657 |
+
{"current_steps": 3285, "total_steps": 12698, "loss": 0.124, "lr": 3.70121697981449e-05, "epoch": 1.810915104740904, "percentage": 25.87, "elapsed_time": "5:56:31", "remaining_time": "17:01:37"}
|
| 658 |
+
{"current_steps": 3290, "total_steps": 12698, "loss": 0.1079, "lr": 3.6997699338675184e-05, "epoch": 1.8136714443219404, "percentage": 25.91, "elapsed_time": "5:57:03", "remaining_time": "17:01:02"}
|
| 659 |
+
{"current_steps": 3295, "total_steps": 12698, "loss": 0.1057, "lr": 3.698319676557799e-05, "epoch": 1.8164277839029768, "percentage": 25.95, "elapsed_time": "5:57:27", "remaining_time": "17:00:04"}
|
| 660 |
+
{"current_steps": 3300, "total_steps": 12698, "loss": 0.1082, "lr": 3.696866210625291e-05, "epoch": 1.8191841234840131, "percentage": 25.99, "elapsed_time": "5:57:47", "remaining_time": "16:58:58"}
|
| 661 |
+
{"current_steps": 3305, "total_steps": 12698, "loss": 0.1028, "lr": 3.695409538816018e-05, "epoch": 1.8219404630650495, "percentage": 26.03, "elapsed_time": "5:58:10", "remaining_time": "16:57:58"}
|
| 662 |
+
{"current_steps": 3310, "total_steps": 12698, "loss": 0.1576, "lr": 3.693949663882058e-05, "epoch": 1.824696802646086, "percentage": 26.07, "elapsed_time": "5:58:44", "remaining_time": "16:57:27"}
|
| 663 |
+
{"current_steps": 3315, "total_steps": 12698, "loss": 0.1018, "lr": 3.692486588581543e-05, "epoch": 1.8274531422271223, "percentage": 26.11, "elapsed_time": "5:59:15", "remaining_time": "16:56:51"}
|
| 664 |
+
{"current_steps": 3320, "total_steps": 12698, "loss": 0.102, "lr": 3.6910203156786496e-05, "epoch": 1.8302094818081587, "percentage": 26.15, "elapsed_time": "5:59:38", "remaining_time": "16:55:52"}
|
| 665 |
+
{"current_steps": 3325, "total_steps": 12698, "loss": 0.0987, "lr": 3.6895508479435964e-05, "epoch": 1.832965821389195, "percentage": 26.19, "elapsed_time": "6:00:00", "remaining_time": "16:54:50"}
|
| 666 |
+
{"current_steps": 3330, "total_steps": 12698, "loss": 0.1008, "lr": 3.688078188152639e-05, "epoch": 1.8357221609702314, "percentage": 26.22, "elapsed_time": "6:00:29", "remaining_time": "16:54:09"}
|
| 667 |
+
{"current_steps": 3335, "total_steps": 12698, "loss": 0.1578, "lr": 3.6866023390880605e-05, "epoch": 1.8384785005512678, "percentage": 26.26, "elapsed_time": "6:01:15", "remaining_time": "16:54:13"}
|
| 668 |
+
{"current_steps": 3340, "total_steps": 12698, "loss": 0.1325, "lr": 3.6851233035381746e-05, "epoch": 1.8412348401323042, "percentage": 26.3, "elapsed_time": "6:01:48", "remaining_time": "16:53:42"}
|
| 669 |
+
{"current_steps": 3345, "total_steps": 12698, "loss": 0.1249, "lr": 3.683641084297309e-05, "epoch": 1.8439911797133406, "percentage": 26.34, "elapsed_time": "6:02:12", "remaining_time": "16:52:45"}
|
| 670 |
+
{"current_steps": 3350, "total_steps": 12698, "loss": 0.1437, "lr": 3.6821556841658116e-05, "epoch": 1.846747519294377, "percentage": 26.38, "elapsed_time": "6:02:35", "remaining_time": "16:51:48"}
|
| 671 |
+
{"current_steps": 3355, "total_steps": 12698, "loss": 0.1677, "lr": 3.680667105950037e-05, "epoch": 1.8495038588754134, "percentage": 26.42, "elapsed_time": "6:03:11", "remaining_time": "16:51:26"}
|
| 672 |
+
{"current_steps": 3360, "total_steps": 12698, "loss": 0.1176, "lr": 3.6791753524623456e-05, "epoch": 1.8522601984564497, "percentage": 26.46, "elapsed_time": "6:03:38", "remaining_time": "16:50:37"}
|
| 673 |
+
{"current_steps": 3365, "total_steps": 12698, "loss": 0.1375, "lr": 3.6776804265210963e-05, "epoch": 1.8550165380374861, "percentage": 26.5, "elapsed_time": "6:04:02", "remaining_time": "16:49:42"}
|
| 674 |
+
{"current_steps": 3370, "total_steps": 12698, "loss": 0.1202, "lr": 3.676182330950641e-05, "epoch": 1.8577728776185225, "percentage": 26.54, "elapsed_time": "6:04:24", "remaining_time": "16:48:39"}
|
| 675 |
+
{"current_steps": 3375, "total_steps": 12698, "loss": 0.1103, "lr": 3.67468106858132e-05, "epoch": 1.8605292171995589, "percentage": 26.58, "elapsed_time": "6:04:55", "remaining_time": "16:48:02"}
|
| 676 |
+
{"current_steps": 3380, "total_steps": 12698, "loss": 0.1147, "lr": 3.673176642249459e-05, "epoch": 1.8632855567805953, "percentage": 26.62, "elapsed_time": "6:05:38", "remaining_time": "16:47:59"}
|
| 677 |
+
{"current_steps": 3385, "total_steps": 12698, "loss": 0.1023, "lr": 3.671669054797358e-05, "epoch": 1.8660418963616316, "percentage": 26.66, "elapsed_time": "6:06:17", "remaining_time": "16:47:44"}
|
| 678 |
+
{"current_steps": 3390, "total_steps": 12698, "loss": 0.101, "lr": 3.670158309073291e-05, "epoch": 1.868798235942668, "percentage": 26.7, "elapsed_time": "6:06:41", "remaining_time": "16:46:50"}
|
| 679 |
+
{"current_steps": 3395, "total_steps": 12698, "loss": 0.1127, "lr": 3.6686444079314995e-05, "epoch": 1.8715545755237044, "percentage": 26.74, "elapsed_time": "6:07:18", "remaining_time": "16:46:28"}
|
| 680 |
+
{"current_steps": 3400, "total_steps": 12698, "loss": 0.12, "lr": 3.667127354232185e-05, "epoch": 1.8743109151047408, "percentage": 26.78, "elapsed_time": "6:07:59", "remaining_time": "16:46:21"}
|
| 681 |
+
{"current_steps": 3405, "total_steps": 12698, "loss": 0.1207, "lr": 3.6656071508415064e-05, "epoch": 1.8770672546857772, "percentage": 26.82, "elapsed_time": "6:08:24", "remaining_time": "16:45:27"}
|
| 682 |
+
{"current_steps": 3410, "total_steps": 12698, "loss": 0.1097, "lr": 3.6640838006315715e-05, "epoch": 1.8798235942668136, "percentage": 26.85, "elapsed_time": "6:08:45", "remaining_time": "16:44:25"}
|
| 683 |
+
{"current_steps": 3415, "total_steps": 12698, "loss": 0.1077, "lr": 3.6625573064804366e-05, "epoch": 1.88257993384785, "percentage": 26.89, "elapsed_time": "6:09:12", "remaining_time": "16:43:35"}
|
| 684 |
+
{"current_steps": 3420, "total_steps": 12698, "loss": 0.123, "lr": 3.661027671272094e-05, "epoch": 1.8853362734288863, "percentage": 26.93, "elapsed_time": "6:09:46", "remaining_time": "16:43:07"}
|
| 685 |
+
{"current_steps": 3425, "total_steps": 12698, "loss": 0.0922, "lr": 3.659494897896473e-05, "epoch": 1.8880926130099227, "percentage": 26.97, "elapsed_time": "6:10:08", "remaining_time": "16:42:08"}
|
| 686 |
+
{"current_steps": 3430, "total_steps": 12698, "loss": 0.1234, "lr": 3.65795898924943e-05, "epoch": 1.890848952590959, "percentage": 27.01, "elapsed_time": "6:10:33", "remaining_time": "16:41:14"}
|
| 687 |
+
{"current_steps": 3435, "total_steps": 12698, "loss": 0.1162, "lr": 3.656419948232747e-05, "epoch": 1.8936052921719955, "percentage": 27.05, "elapsed_time": "6:10:59", "remaining_time": "16:40:26"}
|
| 688 |
+
{"current_steps": 3440, "total_steps": 12698, "loss": 0.1262, "lr": 3.654877777754123e-05, "epoch": 1.8963616317530319, "percentage": 27.09, "elapsed_time": "6:11:30", "remaining_time": "16:39:51"}
|
| 689 |
+
{"current_steps": 3445, "total_steps": 12698, "loss": 0.1186, "lr": 3.653332480727168e-05, "epoch": 1.8991179713340682, "percentage": 27.13, "elapsed_time": "6:12:04", "remaining_time": "16:39:20"}
|
| 690 |
+
{"current_steps": 3450, "total_steps": 12698, "loss": 0.1305, "lr": 3.651784060071401e-05, "epoch": 1.9018743109151046, "percentage": 27.17, "elapsed_time": "6:12:25", "remaining_time": "16:38:18"}
|
| 691 |
+
{"current_steps": 3455, "total_steps": 12698, "loss": 0.1177, "lr": 3.6502325187122425e-05, "epoch": 1.904630650496141, "percentage": 27.21, "elapsed_time": "6:12:56", "remaining_time": "16:37:41"}
|
| 692 |
+
{"current_steps": 3460, "total_steps": 12698, "loss": 0.1231, "lr": 3.648677859581006e-05, "epoch": 1.9073869900771774, "percentage": 27.25, "elapsed_time": "6:13:25", "remaining_time": "16:37:01"}
|
| 693 |
+
{"current_steps": 3465, "total_steps": 12698, "loss": 0.1145, "lr": 3.6471200856148984e-05, "epoch": 1.9101433296582138, "percentage": 27.29, "elapsed_time": "6:13:50", "remaining_time": "16:36:08"}
|
| 694 |
+
{"current_steps": 3470, "total_steps": 12698, "loss": 0.1059, "lr": 3.6455591997570115e-05, "epoch": 1.9128996692392501, "percentage": 27.33, "elapsed_time": "6:14:11", "remaining_time": "16:35:06"}
|
| 695 |
+
{"current_steps": 3475, "total_steps": 12698, "loss": 0.1264, "lr": 3.643995204956315e-05, "epoch": 1.9156560088202865, "percentage": 27.37, "elapsed_time": "6:14:51", "remaining_time": "16:34:55"}
|
| 696 |
+
{"current_steps": 3480, "total_steps": 12698, "loss": 0.1104, "lr": 3.6424281041676526e-05, "epoch": 1.918412348401323, "percentage": 27.41, "elapsed_time": "6:15:18", "remaining_time": "16:34:07"}
|
| 697 |
+
{"current_steps": 3485, "total_steps": 12698, "loss": 0.1003, "lr": 3.6408579003517347e-05, "epoch": 1.9211686879823593, "percentage": 27.45, "elapsed_time": "6:15:46", "remaining_time": "16:33:24"}
|
| 698 |
+
{"current_steps": 3490, "total_steps": 12698, "loss": 0.1102, "lr": 3.639284596475138e-05, "epoch": 1.9239250275633957, "percentage": 27.48, "elapsed_time": "6:16:24", "remaining_time": "16:33:08"}
|
| 699 |
+
{"current_steps": 3495, "total_steps": 12698, "loss": 0.0976, "lr": 3.637708195510293e-05, "epoch": 1.926681367144432, "percentage": 27.52, "elapsed_time": "6:16:50", "remaining_time": "16:32:18"}
|
| 700 |
+
{"current_steps": 3500, "total_steps": 12698, "loss": 0.0937, "lr": 3.636128700435481e-05, "epoch": 1.9294377067254684, "percentage": 27.56, "elapsed_time": "6:17:15", "remaining_time": "16:31:24"}
|
| 701 |
+
{"current_steps": 3505, "total_steps": 12698, "loss": 0.116, "lr": 3.634546114234833e-05, "epoch": 1.9321940463065048, "percentage": 27.6, "elapsed_time": "6:17:42", "remaining_time": "16:30:38"}
|
| 702 |
+
{"current_steps": 3510, "total_steps": 12698, "loss": 0.1289, "lr": 3.632960439898315e-05, "epoch": 1.9349503858875412, "percentage": 27.64, "elapsed_time": "6:18:17", "remaining_time": "16:30:13"}
|
| 703 |
+
{"current_steps": 3515, "total_steps": 12698, "loss": 0.1102, "lr": 3.631371680421732e-05, "epoch": 1.9377067254685776, "percentage": 27.68, "elapsed_time": "6:18:41", "remaining_time": "16:29:19"}
|
| 704 |
+
{"current_steps": 3520, "total_steps": 12698, "loss": 0.1092, "lr": 3.6297798388067126e-05, "epoch": 1.940463065049614, "percentage": 27.72, "elapsed_time": "6:19:08", "remaining_time": "16:28:35"}
|
| 705 |
+
{"current_steps": 3525, "total_steps": 12698, "loss": 0.1369, "lr": 3.628184918060714e-05, "epoch": 1.9432194046306503, "percentage": 27.76, "elapsed_time": "6:19:30", "remaining_time": "16:27:36"}
|
| 706 |
+
{"current_steps": 3530, "total_steps": 12698, "loss": 0.1073, "lr": 3.626586921197007e-05, "epoch": 1.9459757442116867, "percentage": 27.8, "elapsed_time": "6:19:51", "remaining_time": "16:26:32"}
|
| 707 |
+
{"current_steps": 3535, "total_steps": 12698, "loss": 0.1164, "lr": 3.624985851234676e-05, "epoch": 1.9487320837927231, "percentage": 27.84, "elapsed_time": "6:20:14", "remaining_time": "16:25:36"}
|
| 708 |
+
{"current_steps": 3540, "total_steps": 12698, "loss": 0.111, "lr": 3.6233817111986096e-05, "epoch": 1.9514884233737595, "percentage": 27.88, "elapsed_time": "6:20:40", "remaining_time": "16:24:47"}
|
| 709 |
+
{"current_steps": 3545, "total_steps": 12698, "loss": 0.1606, "lr": 3.621774504119498e-05, "epoch": 1.9542447629547959, "percentage": 27.92, "elapsed_time": "6:21:16", "remaining_time": "16:24:25"}
|
| 710 |
+
{"current_steps": 3550, "total_steps": 12698, "loss": 0.1251, "lr": 3.620164233033826e-05, "epoch": 1.9570011025358323, "percentage": 27.96, "elapsed_time": "6:21:55", "remaining_time": "16:24:10"}
|
| 711 |
+
{"current_steps": 3555, "total_steps": 12698, "loss": 0.108, "lr": 3.618550900983867e-05, "epoch": 1.9597574421168686, "percentage": 28.0, "elapsed_time": "6:22:20", "remaining_time": "16:23:21"}
|
| 712 |
+
{"current_steps": 3560, "total_steps": 12698, "loss": 0.109, "lr": 3.616934511017677e-05, "epoch": 1.962513781697905, "percentage": 28.04, "elapsed_time": "6:22:42", "remaining_time": "16:22:20"}
|
| 713 |
+
{"current_steps": 3565, "total_steps": 12698, "loss": 0.1063, "lr": 3.615315066189089e-05, "epoch": 1.9652701212789414, "percentage": 28.08, "elapsed_time": "6:23:04", "remaining_time": "16:21:23"}
|
| 714 |
+
{"current_steps": 3570, "total_steps": 12698, "loss": 0.0999, "lr": 3.6136925695577085e-05, "epoch": 1.9680264608599778, "percentage": 28.11, "elapsed_time": "6:23:24", "remaining_time": "16:20:20"}
|
| 715 |
+
{"current_steps": 3575, "total_steps": 12698, "loss": 0.1388, "lr": 3.612067024188907e-05, "epoch": 1.9707828004410142, "percentage": 28.15, "elapsed_time": "6:23:45", "remaining_time": "16:19:18"}
|
| 716 |
+
{"current_steps": 3580, "total_steps": 12698, "loss": 0.0959, "lr": 3.6104384331538144e-05, "epoch": 1.9735391400220506, "percentage": 28.19, "elapsed_time": "6:24:09", "remaining_time": "16:18:26"}
|
| 717 |
+
{"current_steps": 3585, "total_steps": 12698, "loss": 0.1078, "lr": 3.608806799529317e-05, "epoch": 1.976295479603087, "percentage": 28.23, "elapsed_time": "6:24:31", "remaining_time": "16:17:26"}
|
| 718 |
+
{"current_steps": 3590, "total_steps": 12698, "loss": 0.1092, "lr": 3.607172126398046e-05, "epoch": 1.9790518191841233, "percentage": 28.27, "elapsed_time": "6:24:56", "remaining_time": "16:16:36"}
|
| 719 |
+
{"current_steps": 3595, "total_steps": 12698, "loss": 0.1093, "lr": 3.60553441684838e-05, "epoch": 1.98180815876516, "percentage": 28.31, "elapsed_time": "6:25:30", "remaining_time": "16:16:09"}
|
| 720 |
+
{"current_steps": 3600, "total_steps": 12698, "loss": 0.0937, "lr": 3.603893673974429e-05, "epoch": 1.9845644983461963, "percentage": 28.35, "elapsed_time": "6:26:00", "remaining_time": "16:15:31"}
|
| 721 |
+
{"current_steps": 3605, "total_steps": 12698, "loss": 0.1059, "lr": 3.6022499008760374e-05, "epoch": 1.9873208379272327, "percentage": 28.39, "elapsed_time": "6:26:32", "remaining_time": "16:14:58"}
|
| 722 |
+
{"current_steps": 3610, "total_steps": 12698, "loss": 0.1417, "lr": 3.600603100658773e-05, "epoch": 1.990077177508269, "percentage": 28.43, "elapsed_time": "6:27:31", "remaining_time": "16:15:34"}
|
| 723 |
+
{"current_steps": 3615, "total_steps": 12698, "loss": 0.1618, "lr": 3.5989532764339254e-05, "epoch": 1.9928335170893055, "percentage": 28.47, "elapsed_time": "6:28:14", "remaining_time": "16:15:28"}
|
| 724 |
+
{"current_steps": 3620, "total_steps": 12698, "loss": 0.1083, "lr": 3.5973004313184923e-05, "epoch": 1.9955898566703418, "percentage": 28.51, "elapsed_time": "6:28:44", "remaining_time": "16:14:52"}
|
| 725 |
+
{"current_steps": 3625, "total_steps": 12698, "loss": 0.1044, "lr": 3.5956445684351837e-05, "epoch": 1.9983461962513782, "percentage": 28.55, "elapsed_time": "6:29:09", "remaining_time": "16:14:00"}
|
| 726 |
+
{"current_steps": 3630, "total_steps": 12698, "loss": 0.1921, "lr": 3.5939856909124085e-05, "epoch": 2.0011025358324144, "percentage": 28.59, "elapsed_time": "6:30:14", "remaining_time": "16:14:52"}
|
| 727 |
+
{"current_steps": 3635, "total_steps": 12698, "loss": 0.2349, "lr": 3.5923238018842715e-05, "epoch": 2.0038588754134508, "percentage": 28.63, "elapsed_time": "6:31:27", "remaining_time": "16:16:00"}
|
| 728 |
+
{"current_steps": 3640, "total_steps": 12698, "loss": 0.2233, "lr": 3.590658904490568e-05, "epoch": 2.006615214994487, "percentage": 28.67, "elapsed_time": "6:32:34", "remaining_time": "16:16:55"}
|
| 729 |
+
{"current_steps": 3645, "total_steps": 12698, "loss": 0.2195, "lr": 3.588991001876775e-05, "epoch": 2.0093715545755235, "percentage": 28.71, "elapsed_time": "6:33:53", "remaining_time": "16:18:16"}
|
| 730 |
+
{"current_steps": 3650, "total_steps": 12698, "loss": 0.2098, "lr": 3.58732009719405e-05, "epoch": 2.01212789415656, "percentage": 28.74, "elapsed_time": "6:35:10", "remaining_time": "16:19:36"}
|
| 731 |
+
{"current_steps": 3655, "total_steps": 12698, "loss": 0.2134, "lr": 3.5856461935992194e-05, "epoch": 2.0148842337375963, "percentage": 28.78, "elapsed_time": "6:36:30", "remaining_time": "16:21:00"}
|
| 732 |
+
{"current_steps": 3660, "total_steps": 12698, "loss": 0.2297, "lr": 3.583969294254779e-05, "epoch": 2.0176405733186327, "percentage": 28.82, "elapsed_time": "6:37:46", "remaining_time": "16:22:16"}
|
| 733 |
+
{"current_steps": 3665, "total_steps": 12698, "loss": 0.2227, "lr": 3.58228940232888e-05, "epoch": 2.020396912899669, "percentage": 28.86, "elapsed_time": "6:39:02", "remaining_time": "16:23:29"}
|
| 734 |
+
{"current_steps": 3670, "total_steps": 12698, "loss": 0.2114, "lr": 3.580606520995331e-05, "epoch": 2.0231532524807054, "percentage": 28.9, "elapsed_time": "6:40:11", "remaining_time": "16:24:27"}
|
| 735 |
+
{"current_steps": 3675, "total_steps": 12698, "loss": 0.2051, "lr": 3.578920653433588e-05, "epoch": 2.025909592061742, "percentage": 28.94, "elapsed_time": "6:41:10", "remaining_time": "16:24:58"}
|
| 736 |
+
{"current_steps": 3680, "total_steps": 12698, "loss": 0.2088, "lr": 3.5772318028287464e-05, "epoch": 2.028665931642778, "percentage": 28.98, "elapsed_time": "6:42:24", "remaining_time": "16:26:07"}
|
| 737 |
+
{"current_steps": 3685, "total_steps": 12698, "loss": 0.2029, "lr": 3.5755399723715396e-05, "epoch": 2.0314222712238146, "percentage": 29.02, "elapsed_time": "6:43:37", "remaining_time": "16:27:11"}
|
| 738 |
+
{"current_steps": 3690, "total_steps": 12698, "loss": 0.2132, "lr": 3.573845165258331e-05, "epoch": 2.034178610804851, "percentage": 29.06, "elapsed_time": "6:44:44", "remaining_time": "16:28:04"}
|
| 739 |
+
{"current_steps": 3695, "total_steps": 12698, "loss": 0.2021, "lr": 3.572147384691107e-05, "epoch": 2.0369349503858873, "percentage": 29.1, "elapsed_time": "6:45:53", "remaining_time": "16:28:58"}
|
| 740 |
+
{"current_steps": 3700, "total_steps": 12698, "loss": 0.2016, "lr": 3.5704466338774714e-05, "epoch": 2.0396912899669237, "percentage": 29.14, "elapsed_time": "6:47:03", "remaining_time": "16:29:54"}
|
| 741 |
+
{"current_steps": 3705, "total_steps": 12698, "loss": 0.2089, "lr": 3.5687429160306405e-05, "epoch": 2.04244762954796, "percentage": 29.18, "elapsed_time": "6:48:08", "remaining_time": "16:30:38"}
|
| 742 |
+
{"current_steps": 3710, "total_steps": 12698, "loss": 0.2023, "lr": 3.567036234369435e-05, "epoch": 2.0452039691289965, "percentage": 29.22, "elapsed_time": "6:49:19", "remaining_time": "16:31:37"}
|
| 743 |
+
{"current_steps": 3715, "total_steps": 12698, "loss": 0.2048, "lr": 3.565326592118277e-05, "epoch": 2.047960308710033, "percentage": 29.26, "elapsed_time": "6:50:33", "remaining_time": "16:32:45"}
|
| 744 |
+
{"current_steps": 3720, "total_steps": 12698, "loss": 0.2227, "lr": 3.563613992507181e-05, "epoch": 2.0507166482910693, "percentage": 29.3, "elapsed_time": "6:51:44", "remaining_time": "16:33:43"}
|
| 745 |
+
{"current_steps": 3725, "total_steps": 12698, "loss": 0.2266, "lr": 3.5618984387717475e-05, "epoch": 2.0534729878721056, "percentage": 29.34, "elapsed_time": "6:52:48", "remaining_time": "16:34:22"}
|
| 746 |
+
{"current_steps": 3730, "total_steps": 12698, "loss": 0.1877, "lr": 3.5601799341531605e-05, "epoch": 2.056229327453142, "percentage": 29.37, "elapsed_time": "6:53:52", "remaining_time": "16:35:04"}
|
| 747 |
+
{"current_steps": 3735, "total_steps": 12698, "loss": 0.2016, "lr": 3.558458481898178e-05, "epoch": 2.0589856670341784, "percentage": 29.41, "elapsed_time": "6:55:03", "remaining_time": "16:36:00"}
|
| 748 |
+
{"current_steps": 3740, "total_steps": 12698, "loss": 0.2029, "lr": 3.556734085259127e-05, "epoch": 2.061742006615215, "percentage": 29.45, "elapsed_time": "6:56:16", "remaining_time": "16:37:02"}
|
| 749 |
+
{"current_steps": 3745, "total_steps": 12698, "loss": 0.2099, "lr": 3.555006747493896e-05, "epoch": 2.064498346196251, "percentage": 29.49, "elapsed_time": "6:57:23", "remaining_time": "16:37:51"}
|
| 750 |
+
{"current_steps": 3750, "total_steps": 12698, "loss": 0.2057, "lr": 3.553276471865934e-05, "epoch": 2.0672546857772875, "percentage": 29.53, "elapsed_time": "6:58:40", "remaining_time": "16:39:01"}
|
| 751 |
+
{"current_steps": 3755, "total_steps": 12698, "loss": 0.1982, "lr": 3.551543261644236e-05, "epoch": 2.070011025358324, "percentage": 29.57, "elapsed_time": "6:59:56", "remaining_time": "16:40:09"}
|
| 752 |
+
{"current_steps": 3760, "total_steps": 12698, "loss": 0.1788, "lr": 3.549807120103343e-05, "epoch": 2.0727673649393603, "percentage": 29.61, "elapsed_time": "7:01:14", "remaining_time": "16:41:19"}
|
| 753 |
+
{"current_steps": 3765, "total_steps": 12698, "loss": 0.1835, "lr": 3.548068050523336e-05, "epoch": 2.075523704520397, "percentage": 29.65, "elapsed_time": "7:02:26", "remaining_time": "16:42:17"}
|
| 754 |
+
{"current_steps": 3770, "total_steps": 12698, "loss": 0.196, "lr": 3.5463260561898246e-05, "epoch": 2.078280044101433, "percentage": 29.69, "elapsed_time": "7:03:44", "remaining_time": "16:43:28"}
|
| 755 |
+
{"current_steps": 3775, "total_steps": 12698, "loss": 0.2023, "lr": 3.544581140393947e-05, "epoch": 2.08103638368247, "percentage": 29.73, "elapsed_time": "7:04:26", "remaining_time": "16:43:16"}
|
| 756 |
+
{"current_steps": 3780, "total_steps": 12698, "loss": 0.21, "lr": 3.54283330643236e-05, "epoch": 2.083792723263506, "percentage": 29.77, "elapsed_time": "7:05:37", "remaining_time": "16:44:09"}
|
| 757 |
+
{"current_steps": 3785, "total_steps": 12698, "loss": 0.2227, "lr": 3.541082557607231e-05, "epoch": 2.0865490628445427, "percentage": 29.81, "elapsed_time": "7:06:52", "remaining_time": "16:45:11"}
|
| 758 |
+
{"current_steps": 3790, "total_steps": 12698, "loss": 0.2158, "lr": 3.53932889722624e-05, "epoch": 2.0893054024255786, "percentage": 29.85, "elapsed_time": "7:08:03", "remaining_time": "16:46:06"}
|
| 759 |
+
{"current_steps": 3795, "total_steps": 12698, "loss": 0.2037, "lr": 3.5375723286025615e-05, "epoch": 2.0920617420066154, "percentage": 29.89, "elapsed_time": "7:09:14", "remaining_time": "16:46:59"}
|
| 760 |
+
{"current_steps": 3800, "total_steps": 12698, "loss": 0.2056, "lr": 3.53581285505487e-05, "epoch": 2.0948180815876514, "percentage": 29.93, "elapsed_time": "7:10:32", "remaining_time": "16:48:08"}
|
| 761 |
+
{"current_steps": 3805, "total_steps": 12698, "loss": 0.21, "lr": 3.534050479907324e-05, "epoch": 2.097574421168688, "percentage": 29.97, "elapsed_time": "7:11:46", "remaining_time": "16:49:08"}
|
| 762 |
+
{"current_steps": 3810, "total_steps": 12698, "loss": 0.2057, "lr": 3.532285206489567e-05, "epoch": 2.1003307607497246, "percentage": 30.0, "elapsed_time": "7:13:02", "remaining_time": "16:50:13"}
|
| 763 |
+
{"current_steps": 3815, "total_steps": 12698, "loss": 0.2096, "lr": 3.5305170381367165e-05, "epoch": 2.103087100330761, "percentage": 30.04, "elapsed_time": "7:14:20", "remaining_time": "16:51:20"}
|
| 764 |
+
{"current_steps": 3820, "total_steps": 12698, "loss": 0.2081, "lr": 3.528745978189361e-05, "epoch": 2.1058434399117973, "percentage": 30.08, "elapsed_time": "7:15:35", "remaining_time": "16:52:22"}
|
| 765 |
+
{"current_steps": 3825, "total_steps": 12698, "loss": 0.2113, "lr": 3.52697202999355e-05, "epoch": 2.1085997794928337, "percentage": 30.12, "elapsed_time": "7:16:48", "remaining_time": "16:53:17"}
|
| 766 |
+
{"current_steps": 3830, "total_steps": 12698, "loss": 0.2032, "lr": 3.52519519690079e-05, "epoch": 2.11135611907387, "percentage": 30.16, "elapsed_time": "7:17:57", "remaining_time": "16:54:02"}
|
| 767 |
+
{"current_steps": 3835, "total_steps": 12698, "loss": 0.1975, "lr": 3.5234154822680394e-05, "epoch": 2.1141124586549065, "percentage": 30.2, "elapsed_time": "7:18:52", "remaining_time": "16:54:17"}
|
| 768 |
+
{"current_steps": 3840, "total_steps": 12698, "loss": 0.201, "lr": 3.5216328894577e-05, "epoch": 2.116868798235943, "percentage": 30.24, "elapsed_time": "7:19:50", "remaining_time": "16:54:36"}
|
| 769 |
+
{"current_steps": 3845, "total_steps": 12698, "loss": 0.203, "lr": 3.5198474218376106e-05, "epoch": 2.1196251378169793, "percentage": 30.28, "elapsed_time": "7:20:59", "remaining_time": "16:55:22"}
|
| 770 |
+
{"current_steps": 3850, "total_steps": 12698, "loss": 0.2046, "lr": 3.518059082781043e-05, "epoch": 2.1223814773980156, "percentage": 30.32, "elapsed_time": "7:22:11", "remaining_time": "16:56:15"}
|
| 771 |
+
{"current_steps": 3855, "total_steps": 12698, "loss": 0.1997, "lr": 3.516267875666692e-05, "epoch": 2.125137816979052, "percentage": 30.36, "elapsed_time": "7:23:28", "remaining_time": "16:57:17"}
|
| 772 |
+
{"current_steps": 3860, "total_steps": 12698, "loss": 0.2039, "lr": 3.514473803878672e-05, "epoch": 2.1278941565600884, "percentage": 30.4, "elapsed_time": "7:24:43", "remaining_time": "16:58:14"}
|
| 773 |
+
{"current_steps": 3865, "total_steps": 12698, "loss": 0.2065, "lr": 3.51267687080651e-05, "epoch": 2.130650496141125, "percentage": 30.44, "elapsed_time": "7:26:00", "remaining_time": "16:59:18"}
|
| 774 |
+
{"current_steps": 3870, "total_steps": 12698, "loss": 0.2097, "lr": 3.5108770798451376e-05, "epoch": 2.133406835722161, "percentage": 30.48, "elapsed_time": "7:27:10", "remaining_time": "17:00:04"}
|
| 775 |
+
{"current_steps": 3875, "total_steps": 12698, "loss": 0.1759, "lr": 3.5090744343948875e-05, "epoch": 2.1361631753031975, "percentage": 30.52, "elapsed_time": "7:27:55", "remaining_time": "16:59:52"}
|
| 776 |
+
{"current_steps": 3880, "total_steps": 12698, "loss": 0.2041, "lr": 3.507268937861484e-05, "epoch": 2.138919514884234, "percentage": 30.56, "elapsed_time": "7:29:01", "remaining_time": "17:00:30"}
|
| 777 |
+
{"current_steps": 3885, "total_steps": 12698, "loss": 0.1977, "lr": 3.505460593656039e-05, "epoch": 2.1416758544652703, "percentage": 30.6, "elapsed_time": "7:30:12", "remaining_time": "17:01:17"}
|
| 778 |
+
{"current_steps": 3890, "total_steps": 12698, "loss": 0.2052, "lr": 3.5036494051950414e-05, "epoch": 2.1444321940463067, "percentage": 30.63, "elapsed_time": "7:31:22", "remaining_time": "17:02:02"}
|
| 779 |
+
{"current_steps": 3895, "total_steps": 12698, "loss": 0.194, "lr": 3.5018353759003586e-05, "epoch": 2.147188533627343, "percentage": 30.67, "elapsed_time": "7:32:30", "remaining_time": "17:02:41"}
|
| 780 |
+
{"current_steps": 3900, "total_steps": 12698, "loss": 0.2007, "lr": 3.500018509199222e-05, "epoch": 2.1499448732083795, "percentage": 30.71, "elapsed_time": "7:33:40", "remaining_time": "17:03:26"}
|
| 781 |
+
{"current_steps": 3905, "total_steps": 12698, "loss": 0.2, "lr": 3.4981988085242243e-05, "epoch": 2.152701212789416, "percentage": 30.75, "elapsed_time": "7:34:56", "remaining_time": "17:04:24"}
|
| 782 |
+
{"current_steps": 3910, "total_steps": 12698, "loss": 0.2151, "lr": 3.4963762773133126e-05, "epoch": 2.1554575523704522, "percentage": 30.79, "elapsed_time": "7:35:21", "remaining_time": "17:03:26"}
|
| 783 |
+
{"current_steps": 3915, "total_steps": 12698, "loss": 0.196, "lr": 3.494550919009782e-05, "epoch": 2.1582138919514886, "percentage": 30.83, "elapsed_time": "7:35:33", "remaining_time": "17:01:59"}
|
| 784 |
+
{"current_steps": 3920, "total_steps": 12698, "loss": 0.1952, "lr": 3.4927227370622675e-05, "epoch": 2.160970231532525, "percentage": 30.87, "elapsed_time": "7:35:46", "remaining_time": "17:00:35"}
|
| 785 |
+
{"current_steps": 3925, "total_steps": 12698, "loss": 0.1882, "lr": 3.49089173492474e-05, "epoch": 2.1637265711135614, "percentage": 30.91, "elapsed_time": "7:35:58", "remaining_time": "16:59:10"}
|
| 786 |
+
{"current_steps": 3930, "total_steps": 12698, "loss": 0.191, "lr": 3.4890579160564985e-05, "epoch": 2.1664829106945978, "percentage": 30.95, "elapsed_time": "7:36:11", "remaining_time": "16:57:47"}
|
| 787 |
+
{"current_steps": 3935, "total_steps": 12698, "loss": 0.1917, "lr": 3.487221283922164e-05, "epoch": 2.169239250275634, "percentage": 30.99, "elapsed_time": "7:36:23", "remaining_time": "16:56:21"}
|
| 788 |
+
{"current_steps": 3940, "total_steps": 12698, "loss": 0.1857, "lr": 3.485381841991671e-05, "epoch": 2.1719955898566705, "percentage": 31.03, "elapsed_time": "7:36:36", "remaining_time": "16:54:57"}
|
| 789 |
+
{"current_steps": 3945, "total_steps": 12698, "loss": 0.2069, "lr": 3.4835395937402636e-05, "epoch": 2.174751929437707, "percentage": 31.07, "elapsed_time": "7:36:48", "remaining_time": "16:53:33"}
|
| 790 |
+
{"current_steps": 3950, "total_steps": 12698, "loss": 0.187, "lr": 3.481694542648488e-05, "epoch": 2.1775082690187433, "percentage": 31.11, "elapsed_time": "7:36:59", "remaining_time": "16:52:06"}
|
| 791 |
+
{"current_steps": 3955, "total_steps": 12698, "loss": 0.196, "lr": 3.479846692202187e-05, "epoch": 2.1802646085997797, "percentage": 31.15, "elapsed_time": "7:37:12", "remaining_time": "16:50:43"}
|
| 792 |
+
{"current_steps": 3960, "total_steps": 12698, "loss": 0.1812, "lr": 3.4779960458924876e-05, "epoch": 2.183020948180816, "percentage": 31.19, "elapsed_time": "7:37:25", "remaining_time": "16:49:21"}
|
| 793 |
+
{"current_steps": 3965, "total_steps": 12698, "loss": 0.1976, "lr": 3.476142607215805e-05, "epoch": 2.1857772877618524, "percentage": 31.23, "elapsed_time": "7:37:39", "remaining_time": "16:47:59"}
|
| 794 |
+
{"current_steps": 3970, "total_steps": 12698, "loss": 0.1849, "lr": 3.474286379673826e-05, "epoch": 2.188533627342889, "percentage": 31.26, "elapsed_time": "7:37:51", "remaining_time": "16:46:35"}
|
| 795 |
+
{"current_steps": 3975, "total_steps": 12698, "loss": 0.168, "lr": 3.472427366773508e-05, "epoch": 2.191289966923925, "percentage": 31.3, "elapsed_time": "7:38:02", "remaining_time": "16:45:10"}
|
| 796 |
+
{"current_steps": 3980, "total_steps": 12698, "loss": 0.1736, "lr": 3.47056557202707e-05, "epoch": 2.1940463065049616, "percentage": 31.34, "elapsed_time": "7:38:15", "remaining_time": "16:43:47"}
|
| 797 |
+
{"current_steps": 3985, "total_steps": 12698, "loss": 0.1862, "lr": 3.468700998951987e-05, "epoch": 2.196802646085998, "percentage": 31.38, "elapsed_time": "7:38:28", "remaining_time": "16:42:25"}
|
| 798 |
+
{"current_steps": 3990, "total_steps": 12698, "loss": 0.1918, "lr": 3.466833651070983e-05, "epoch": 2.1995589856670343, "percentage": 31.42, "elapsed_time": "7:38:41", "remaining_time": "16:41:04"}
|
| 799 |
+
{"current_steps": 3995, "total_steps": 12698, "loss": 0.1923, "lr": 3.464963531912024e-05, "epoch": 2.2023153252480707, "percentage": 31.46, "elapsed_time": "7:38:55", "remaining_time": "16:39:44"}
|
| 800 |
+
{"current_steps": 4000, "total_steps": 12698, "loss": 0.1805, "lr": 3.463090645008313e-05, "epoch": 2.205071664829107, "percentage": 31.5, "elapsed_time": "7:39:07", "remaining_time": "16:38:23"}
|
| 801 |
+
{"current_steps": 4005, "total_steps": 12698, "loss": 0.1811, "lr": 3.461214993898282e-05, "epoch": 2.2078280044101435, "percentage": 31.54, "elapsed_time": "7:39:20", "remaining_time": "16:37:00"}
|
| 802 |
+
{"current_steps": 4010, "total_steps": 12698, "loss": 0.1947, "lr": 3.459336582125584e-05, "epoch": 2.21058434399118, "percentage": 31.58, "elapsed_time": "7:39:35", "remaining_time": "16:35:44"}
|
| 803 |
+
{"current_steps": 4015, "total_steps": 12698, "loss": 0.1962, "lr": 3.4574554132390884e-05, "epoch": 2.2133406835722162, "percentage": 31.62, "elapsed_time": "7:39:50", "remaining_time": "16:34:28"}
|
| 804 |
+
{"current_steps": 4020, "total_steps": 12698, "loss": 0.183, "lr": 3.455571490792873e-05, "epoch": 2.2160970231532526, "percentage": 31.66, "elapsed_time": "7:40:03", "remaining_time": "16:33:07"}
|
| 805 |
+
{"current_steps": 4025, "total_steps": 12698, "loss": 0.1789, "lr": 3.45368481834622e-05, "epoch": 2.218853362734289, "percentage": 31.7, "elapsed_time": "7:40:15", "remaining_time": "16:31:45"}
|
| 806 |
+
{"current_steps": 4030, "total_steps": 12698, "loss": 0.1848, "lr": 3.451795399463605e-05, "epoch": 2.2216097023153254, "percentage": 31.74, "elapsed_time": "7:40:27", "remaining_time": "16:30:23"}
|
| 807 |
+
{"current_steps": 4035, "total_steps": 12698, "loss": 0.1864, "lr": 3.4499032377146926e-05, "epoch": 2.224366041896362, "percentage": 31.78, "elapsed_time": "7:40:40", "remaining_time": "16:29:02"}
|
| 808 |
+
{"current_steps": 4040, "total_steps": 12698, "loss": 0.1875, "lr": 3.448008336674331e-05, "epoch": 2.227122381477398, "percentage": 31.82, "elapsed_time": "7:40:53", "remaining_time": "16:27:42"}
|
| 809 |
+
{"current_steps": 4045, "total_steps": 12698, "loss": 0.1806, "lr": 3.446110699922541e-05, "epoch": 2.2298787210584345, "percentage": 31.86, "elapsed_time": "7:41:07", "remaining_time": "16:26:25"}
|
| 810 |
+
{"current_steps": 4050, "total_steps": 12698, "loss": 0.1803, "lr": 3.4442103310445166e-05, "epoch": 2.232635060639471, "percentage": 31.89, "elapsed_time": "7:41:20", "remaining_time": "16:25:05"}
|
| 811 |
+
{"current_steps": 4055, "total_steps": 12698, "loss": 0.1846, "lr": 3.442307233630608e-05, "epoch": 2.2353914002205073, "percentage": 31.93, "elapsed_time": "7:41:32", "remaining_time": "16:23:45"}
|
| 812 |
+
{"current_steps": 4060, "total_steps": 12698, "loss": 0.1852, "lr": 3.4404014112763236e-05, "epoch": 2.2381477398015437, "percentage": 31.97, "elapsed_time": "7:41:45", "remaining_time": "16:22:26"}
|
| 813 |
+
{"current_steps": 4065, "total_steps": 12698, "loss": 0.1817, "lr": 3.43849286758232e-05, "epoch": 2.24090407938258, "percentage": 32.01, "elapsed_time": "7:41:57", "remaining_time": "16:21:04"}
|
| 814 |
+
{"current_steps": 4070, "total_steps": 12698, "loss": 0.1786, "lr": 3.436581606154394e-05, "epoch": 2.2436604189636165, "percentage": 32.05, "elapsed_time": "7:42:09", "remaining_time": "16:19:43"}
|
| 815 |
+
{"current_steps": 4075, "total_steps": 12698, "loss": 0.1746, "lr": 3.434667630603478e-05, "epoch": 2.246416758544653, "percentage": 32.09, "elapsed_time": "7:42:21", "remaining_time": "16:18:22"}
|
| 816 |
+
{"current_steps": 4080, "total_steps": 12698, "loss": 0.1805, "lr": 3.4327509445456325e-05, "epoch": 2.249173098125689, "percentage": 32.13, "elapsed_time": "7:42:33", "remaining_time": "16:17:01"}
|
| 817 |
+
{"current_steps": 4085, "total_steps": 12698, "loss": 0.1805, "lr": 3.430831551602038e-05, "epoch": 2.2519294377067256, "percentage": 32.17, "elapsed_time": "7:42:45", "remaining_time": "16:15:42"}
|
| 818 |
+
{"current_steps": 4090, "total_steps": 12698, "loss": 0.174, "lr": 3.4289094553989885e-05, "epoch": 2.254685777287762, "percentage": 32.21, "elapsed_time": "7:42:57", "remaining_time": "16:14:21"}
|
| 819 |
+
{"current_steps": 4095, "total_steps": 12698, "loss": 0.1786, "lr": 3.426984659567887e-05, "epoch": 2.2574421168687984, "percentage": 32.25, "elapsed_time": "7:43:09", "remaining_time": "16:13:02"}
|
| 820 |
+
{"current_steps": 4100, "total_steps": 12698, "loss": 0.1838, "lr": 3.425057167745236e-05, "epoch": 2.2601984564498347, "percentage": 32.29, "elapsed_time": "7:43:22", "remaining_time": "16:11:43"}
|
| 821 |
+
{"current_steps": 4105, "total_steps": 12698, "loss": 0.1842, "lr": 3.42312698357263e-05, "epoch": 2.262954796030871, "percentage": 32.33, "elapsed_time": "7:43:34", "remaining_time": "16:10:23"}
|
| 822 |
+
{"current_steps": 4110, "total_steps": 12698, "loss": 0.1819, "lr": 3.421194110696754e-05, "epoch": 2.2657111356119075, "percentage": 32.37, "elapsed_time": "7:43:47", "remaining_time": "16:09:07"}
|
| 823 |
+
{"current_steps": 4115, "total_steps": 12698, "loss": 0.1843, "lr": 3.419258552769369e-05, "epoch": 2.268467475192944, "percentage": 32.41, "elapsed_time": "7:44:00", "remaining_time": "16:07:49"}
|
| 824 |
+
{"current_steps": 4120, "total_steps": 12698, "loss": 0.1911, "lr": 3.41732031344731e-05, "epoch": 2.2712238147739803, "percentage": 32.45, "elapsed_time": "7:44:15", "remaining_time": "16:06:36"}
|
| 825 |
+
{"current_steps": 4125, "total_steps": 12698, "loss": 0.1852, "lr": 3.4153793963924794e-05, "epoch": 2.2739801543550167, "percentage": 32.49, "elapsed_time": "7:44:27", "remaining_time": "16:05:17"}
|
| 826 |
+
{"current_steps": 4130, "total_steps": 12698, "loss": 0.1775, "lr": 3.413435805271836e-05, "epoch": 2.276736493936053, "percentage": 32.52, "elapsed_time": "7:44:40", "remaining_time": "16:04:01"}
|
| 827 |
+
{"current_steps": 4135, "total_steps": 12698, "loss": 0.1845, "lr": 3.411489543757394e-05, "epoch": 2.2794928335170894, "percentage": 32.56, "elapsed_time": "7:44:53", "remaining_time": "16:02:43"}
|
| 828 |
+
{"current_steps": 4140, "total_steps": 12698, "loss": 0.1789, "lr": 3.409540615526209e-05, "epoch": 2.282249173098126, "percentage": 32.6, "elapsed_time": "7:45:05", "remaining_time": "16:01:24"}
|
| 829 |
+
{"current_steps": 4145, "total_steps": 12698, "loss": 0.1708, "lr": 3.407589024260378e-05, "epoch": 2.285005512679162, "percentage": 32.64, "elapsed_time": "7:45:16", "remaining_time": "16:00:05"}
|
| 830 |
+
{"current_steps": 4150, "total_steps": 12698, "loss": 0.1787, "lr": 3.405634773647027e-05, "epoch": 2.2877618522601986, "percentage": 32.68, "elapsed_time": "7:45:28", "remaining_time": "15:58:46"}
|
| 831 |
+
{"current_steps": 4155, "total_steps": 12698, "loss": 0.1796, "lr": 3.403677867378307e-05, "epoch": 2.290518191841235, "percentage": 32.72, "elapsed_time": "7:45:42", "remaining_time": "15:57:31"}
|
| 832 |
+
{"current_steps": 4160, "total_steps": 12698, "loss": 0.1824, "lr": 3.4017183091513884e-05, "epoch": 2.2932745314222713, "percentage": 32.76, "elapsed_time": "7:45:54", "remaining_time": "15:56:14"}
|
| 833 |
+
{"current_steps": 4165, "total_steps": 12698, "loss": 0.18, "lr": 3.399756102668448e-05, "epoch": 2.2960308710033077, "percentage": 32.8, "elapsed_time": "7:46:06", "remaining_time": "15:54:57"}
|
| 834 |
+
{"current_steps": 4170, "total_steps": 12698, "loss": 0.1773, "lr": 3.3977912516366685e-05, "epoch": 2.298787210584344, "percentage": 32.84, "elapsed_time": "7:46:19", "remaining_time": "15:53:41"}
|
| 835 |
+
{"current_steps": 4175, "total_steps": 12698, "loss": 0.1789, "lr": 3.395823759768229e-05, "epoch": 2.3015435501653805, "percentage": 32.88, "elapsed_time": "7:46:33", "remaining_time": "15:52:27"}
|
| 836 |
+
{"current_steps": 4180, "total_steps": 12698, "loss": 0.1791, "lr": 3.393853630780297e-05, "epoch": 2.304299889746417, "percentage": 32.92, "elapsed_time": "7:46:45", "remaining_time": "15:51:09"}
|
| 837 |
+
{"current_steps": 4185, "total_steps": 12698, "loss": 0.1775, "lr": 3.391880868395022e-05, "epoch": 2.3070562293274532, "percentage": 32.96, "elapsed_time": "7:46:57", "remaining_time": "15:49:52"}
|
| 838 |
+
{"current_steps": 4190, "total_steps": 12698, "loss": 0.1772, "lr": 3.38990547633953e-05, "epoch": 2.3098125689084896, "percentage": 33.0, "elapsed_time": "7:47:10", "remaining_time": "15:48:36"}
|
| 839 |
+
{"current_steps": 4195, "total_steps": 12698, "loss": 0.1724, "lr": 3.3879274583459145e-05, "epoch": 2.312568908489526, "percentage": 33.04, "elapsed_time": "7:47:21", "remaining_time": "15:47:19"}
|
| 840 |
+
{"current_steps": 4200, "total_steps": 12698, "loss": 0.1841, "lr": 3.3859468181512305e-05, "epoch": 2.3153252480705624, "percentage": 33.08, "elapsed_time": "7:47:35", "remaining_time": "15:46:06"}
|
| 841 |
+
{"current_steps": 4205, "total_steps": 12698, "loss": 0.1809, "lr": 3.3839635594974864e-05, "epoch": 2.3180815876515988, "percentage": 33.12, "elapsed_time": "7:47:49", "remaining_time": "15:44:52"}
|
| 842 |
+
{"current_steps": 4210, "total_steps": 12698, "loss": 0.1729, "lr": 3.381977686131639e-05, "epoch": 2.320837927232635, "percentage": 33.15, "elapsed_time": "7:48:00", "remaining_time": "15:43:35"}
|
| 843 |
+
{"current_steps": 4215, "total_steps": 12698, "loss": 0.182, "lr": 3.379989201805582e-05, "epoch": 2.3235942668136715, "percentage": 33.19, "elapsed_time": "7:48:12", "remaining_time": "15:42:18"}
|
| 844 |
+
{"current_steps": 4220, "total_steps": 12698, "loss": 0.1801, "lr": 3.377998110276147e-05, "epoch": 2.326350606394708, "percentage": 33.23, "elapsed_time": "7:48:24", "remaining_time": "15:41:02"}
|
| 845 |
+
{"current_steps": 4225, "total_steps": 12698, "loss": 0.1851, "lr": 3.376004415305086e-05, "epoch": 2.3291069459757443, "percentage": 33.27, "elapsed_time": "7:48:37", "remaining_time": "15:39:47"}
|
| 846 |
+
{"current_steps": 4230, "total_steps": 12698, "loss": 0.1862, "lr": 3.374008120659073e-05, "epoch": 2.3318632855567807, "percentage": 33.31, "elapsed_time": "7:48:49", "remaining_time": "15:38:32"}
|
| 847 |
+
{"current_steps": 4235, "total_steps": 12698, "loss": 0.1802, "lr": 3.372009230109694e-05, "epoch": 2.334619625137817, "percentage": 33.35, "elapsed_time": "7:49:01", "remaining_time": "15:37:16"}
|
| 848 |
+
{"current_steps": 4240, "total_steps": 12698, "loss": 0.1878, "lr": 3.3700077474334354e-05, "epoch": 2.3373759647188534, "percentage": 33.39, "elapsed_time": "7:49:13", "remaining_time": "15:36:00"}
|
| 849 |
+
{"current_steps": 4245, "total_steps": 12698, "loss": 0.1794, "lr": 3.3680036764116866e-05, "epoch": 2.34013230429989, "percentage": 33.43, "elapsed_time": "7:49:25", "remaining_time": "15:34:45"}
|
| 850 |
+
{"current_steps": 4250, "total_steps": 12698, "loss": 0.1929, "lr": 3.365997020830722e-05, "epoch": 2.342888643880926, "percentage": 33.47, "elapsed_time": "7:49:38", "remaining_time": "15:33:32"}
|
| 851 |
+
{"current_steps": 4255, "total_steps": 12698, "loss": 0.186, "lr": 3.363987784481702e-05, "epoch": 2.3456449834619626, "percentage": 33.51, "elapsed_time": "7:49:53", "remaining_time": "15:32:22"}
|
| 852 |
+
{"current_steps": 4260, "total_steps": 12698, "loss": 0.1861, "lr": 3.361975971160662e-05, "epoch": 2.348401323042999, "percentage": 33.55, "elapsed_time": "7:50:05", "remaining_time": "15:31:08"}
|
| 853 |
+
{"current_steps": 4265, "total_steps": 12698, "loss": 0.181, "lr": 3.359961584668505e-05, "epoch": 2.3511576626240354, "percentage": 33.59, "elapsed_time": "7:50:17", "remaining_time": "15:29:52"}
|
| 854 |
+
{"current_steps": 4270, "total_steps": 12698, "loss": 0.1762, "lr": 3.357944628810998e-05, "epoch": 2.3539140022050717, "percentage": 33.63, "elapsed_time": "7:50:29", "remaining_time": "15:28:38"}
|
| 855 |
+
{"current_steps": 4275, "total_steps": 12698, "loss": 0.1868, "lr": 3.35592510739876e-05, "epoch": 2.356670341786108, "percentage": 33.67, "elapsed_time": "7:50:42", "remaining_time": "15:27:25"}
|
| 856 |
+
{"current_steps": 4280, "total_steps": 12698, "loss": 0.1783, "lr": 3.3539030242472574e-05, "epoch": 2.3594266813671445, "percentage": 33.71, "elapsed_time": "7:50:54", "remaining_time": "15:26:11"}
|
| 857 |
+
{"current_steps": 4285, "total_steps": 12698, "loss": 0.1738, "lr": 3.351878383176797e-05, "epoch": 2.362183020948181, "percentage": 33.75, "elapsed_time": "7:51:06", "remaining_time": "15:24:57"}
|
| 858 |
+
{"current_steps": 4290, "total_steps": 12698, "loss": 0.1733, "lr": 3.34985118801252e-05, "epoch": 2.3649393605292173, "percentage": 33.78, "elapsed_time": "7:51:18", "remaining_time": "15:23:43"}
|
| 859 |
+
{"current_steps": 4295, "total_steps": 12698, "loss": 0.1916, "lr": 3.347821442584389e-05, "epoch": 2.3676957001102537, "percentage": 33.82, "elapsed_time": "7:51:31", "remaining_time": "15:22:30"}
|
| 860 |
+
{"current_steps": 4300, "total_steps": 12698, "loss": 0.1798, "lr": 3.3457891507271876e-05, "epoch": 2.37045203969129, "percentage": 33.86, "elapsed_time": "7:51:43", "remaining_time": "15:21:16"}
|
| 861 |
+
{"current_steps": 4305, "total_steps": 12698, "loss": 0.1765, "lr": 3.34375431628051e-05, "epoch": 2.3732083792723264, "percentage": 33.9, "elapsed_time": "7:51:59", "remaining_time": "15:20:10"}
|
| 862 |
+
{"current_steps": 4310, "total_steps": 12698, "loss": 0.1679, "lr": 3.341716943088754e-05, "epoch": 2.375964718853363, "percentage": 33.94, "elapsed_time": "7:52:15", "remaining_time": "15:19:04"}
|
| 863 |
+
{"current_steps": 4315, "total_steps": 12698, "loss": 0.1611, "lr": 3.3396770350011134e-05, "epoch": 2.378721058434399, "percentage": 33.98, "elapsed_time": "7:52:26", "remaining_time": "15:17:50"}
|
| 864 |
+
{"current_steps": 4320, "total_steps": 12698, "loss": 0.1789, "lr": 3.3376345958715716e-05, "epoch": 2.3814773980154356, "percentage": 34.02, "elapsed_time": "7:52:38", "remaining_time": "15:16:37"}
|
| 865 |
+
{"current_steps": 4325, "total_steps": 12698, "loss": 0.1789, "lr": 3.335589629558894e-05, "epoch": 2.384233737596472, "percentage": 34.06, "elapsed_time": "7:52:52", "remaining_time": "15:15:27"}
|
| 866 |
+
{"current_steps": 4330, "total_steps": 12698, "loss": 0.1753, "lr": 3.33354213992662e-05, "epoch": 2.3869900771775083, "percentage": 34.1, "elapsed_time": "7:53:04", "remaining_time": "15:14:15"}
|
| 867 |
+
{"current_steps": 4335, "total_steps": 12698, "loss": 0.1804, "lr": 3.3314921308430554e-05, "epoch": 2.3897464167585447, "percentage": 34.14, "elapsed_time": "7:53:17", "remaining_time": "15:13:03"}
|
| 868 |
+
{"current_steps": 4340, "total_steps": 12698, "loss": 0.1793, "lr": 3.32943960618127e-05, "epoch": 2.392502756339581, "percentage": 34.18, "elapsed_time": "7:53:29", "remaining_time": "15:11:51"}
|
| 869 |
+
{"current_steps": 4345, "total_steps": 12698, "loss": 0.1813, "lr": 3.32738456981908e-05, "epoch": 2.3952590959206175, "percentage": 34.22, "elapsed_time": "7:53:41", "remaining_time": "15:10:39"}
|
| 870 |
+
{"current_steps": 4350, "total_steps": 12698, "loss": 0.2882, "lr": 3.325327025639054e-05, "epoch": 2.398015435501654, "percentage": 34.26, "elapsed_time": "7:54:26", "remaining_time": "15:10:28"}
|
| 871 |
+
{"current_steps": 4355, "total_steps": 12698, "loss": 0.2798, "lr": 3.3232669775284926e-05, "epoch": 2.4007717750826902, "percentage": 34.3, "elapsed_time": "7:55:11", "remaining_time": "15:10:20"}
|
| 872 |
+
{"current_steps": 4360, "total_steps": 12698, "loss": 0.2705, "lr": 3.321204429379429e-05, "epoch": 2.4035281146637266, "percentage": 34.34, "elapsed_time": "7:56:10", "remaining_time": "15:10:38"}
|
| 873 |
+
{"current_steps": 4365, "total_steps": 12698, "loss": 0.2679, "lr": 3.3191393850886225e-05, "epoch": 2.406284454244763, "percentage": 34.38, "elapsed_time": "7:57:01", "remaining_time": "15:10:40"}
|
| 874 |
+
{"current_steps": 4370, "total_steps": 12698, "loss": 0.2749, "lr": 3.317071848557544e-05, "epoch": 2.4090407938257994, "percentage": 34.41, "elapsed_time": "7:57:52", "remaining_time": "15:10:41"}
|
| 875 |
+
{"current_steps": 4375, "total_steps": 12698, "loss": 0.2802, "lr": 3.315001823692376e-05, "epoch": 2.4117971334068358, "percentage": 34.45, "elapsed_time": "7:58:43", "remaining_time": "15:10:43"}
|
| 876 |
+
{"current_steps": 4380, "total_steps": 12698, "loss": 0.2644, "lr": 3.3129293144039995e-05, "epoch": 2.414553472987872, "percentage": 34.49, "elapsed_time": "7:59:40", "remaining_time": "15:10:55"}
|
| 877 |
+
{"current_steps": 4385, "total_steps": 12698, "loss": 0.2712, "lr": 3.310854324607993e-05, "epoch": 2.4173098125689085, "percentage": 34.53, "elapsed_time": "8:00:25", "remaining_time": "15:10:47"}
|
| 878 |
+
{"current_steps": 4390, "total_steps": 12698, "loss": 0.2797, "lr": 3.308776858224619e-05, "epoch": 2.420066152149945, "percentage": 34.57, "elapsed_time": "8:01:22", "remaining_time": "15:11:00"}
|
| 879 |
+
{"current_steps": 4395, "total_steps": 12698, "loss": 0.2767, "lr": 3.3066969191788184e-05, "epoch": 2.4228224917309813, "percentage": 34.61, "elapsed_time": "8:02:10", "remaining_time": "15:10:54"}
|
| 880 |
+
{"current_steps": 4400, "total_steps": 12698, "loss": 0.2783, "lr": 3.304614511400205e-05, "epoch": 2.4255788313120177, "percentage": 34.65, "elapsed_time": "8:03:01", "remaining_time": "15:10:56"}
|
| 881 |
+
{"current_steps": 4405, "total_steps": 12698, "loss": 0.2651, "lr": 3.3025296388230564e-05, "epoch": 2.428335170893054, "percentage": 34.69, "elapsed_time": "8:04:03", "remaining_time": "15:11:17"}
|
| 882 |
+
{"current_steps": 4410, "total_steps": 12698, "loss": 0.2735, "lr": 3.300442305386308e-05, "epoch": 2.4310915104740904, "percentage": 34.73, "elapsed_time": "8:04:45", "remaining_time": "15:11:01"}
|
| 883 |
+
{"current_steps": 4415, "total_steps": 12698, "loss": 0.267, "lr": 3.2983525150335414e-05, "epoch": 2.433847850055127, "percentage": 34.77, "elapsed_time": "8:05:21", "remaining_time": "15:10:35"}
|
| 884 |
+
{"current_steps": 4420, "total_steps": 12698, "loss": 0.2794, "lr": 3.2962602717129834e-05, "epoch": 2.436604189636163, "percentage": 34.81, "elapsed_time": "8:05:50", "remaining_time": "15:09:55"}
|
| 885 |
+
{"current_steps": 4425, "total_steps": 12698, "loss": 0.2701, "lr": 3.294165579377493e-05, "epoch": 2.4393605292171996, "percentage": 34.85, "elapsed_time": "8:06:17", "remaining_time": "15:09:10"}
|
| 886 |
+
{"current_steps": 4430, "total_steps": 12698, "loss": 0.2698, "lr": 3.292068441984558e-05, "epoch": 2.442116868798236, "percentage": 34.89, "elapsed_time": "8:06:44", "remaining_time": "15:08:25"}
|
| 887 |
+
{"current_steps": 4435, "total_steps": 12698, "loss": 0.2852, "lr": 3.2899688634962846e-05, "epoch": 2.4448732083792724, "percentage": 34.93, "elapsed_time": "8:07:09", "remaining_time": "15:07:37"}
|
| 888 |
+
{"current_steps": 4440, "total_steps": 12698, "loss": 0.2778, "lr": 3.287866847879389e-05, "epoch": 2.4476295479603087, "percentage": 34.97, "elapsed_time": "8:07:33", "remaining_time": "15:06:49"}
|
| 889 |
+
{"current_steps": 4445, "total_steps": 12698, "loss": 0.273, "lr": 3.285762399105195e-05, "epoch": 2.450385887541345, "percentage": 35.01, "elapsed_time": "8:08:03", "remaining_time": "15:06:10"}
|
| 890 |
+
{"current_steps": 4450, "total_steps": 12698, "loss": 0.2784, "lr": 3.283655521149623e-05, "epoch": 2.4531422271223815, "percentage": 35.04, "elapsed_time": "8:08:29", "remaining_time": "15:05:23"}
|
| 891 |
+
{"current_steps": 4455, "total_steps": 12698, "loss": 0.2673, "lr": 3.281546217993181e-05, "epoch": 2.455898566703418, "percentage": 35.08, "elapsed_time": "8:08:58", "remaining_time": "15:04:43"}
|
| 892 |
+
{"current_steps": 4460, "total_steps": 12698, "loss": 0.2518, "lr": 3.27943449362096e-05, "epoch": 2.4586549062844543, "percentage": 35.12, "elapsed_time": "8:09:24", "remaining_time": "15:03:59"}
|
| 893 |
+
{"current_steps": 4465, "total_steps": 12698, "loss": 0.2682, "lr": 3.277320352022624e-05, "epoch": 2.4614112458654906, "percentage": 35.16, "elapsed_time": "8:09:50", "remaining_time": "15:03:13"}
|
| 894 |
+
{"current_steps": 4470, "total_steps": 12698, "loss": 0.2755, "lr": 3.275203797192406e-05, "epoch": 2.464167585446527, "percentage": 35.2, "elapsed_time": "8:10:15", "remaining_time": "15:02:24"}
|
| 895 |
+
{"current_steps": 4475, "total_steps": 12698, "loss": 0.265, "lr": 3.2730848331290984e-05, "epoch": 2.4669239250275634, "percentage": 35.24, "elapsed_time": "8:10:42", "remaining_time": "15:01:40"}
|
| 896 |
+
{"current_steps": 4480, "total_steps": 12698, "loss": 0.2675, "lr": 3.270963463836043e-05, "epoch": 2.4696802646086, "percentage": 35.28, "elapsed_time": "8:11:08", "remaining_time": "15:00:56"}
|
| 897 |
+
{"current_steps": 4485, "total_steps": 12698, "loss": 0.2573, "lr": 3.268839693321128e-05, "epoch": 2.472436604189636, "percentage": 35.32, "elapsed_time": "8:11:33", "remaining_time": "15:00:09"}
|
| 898 |
+
{"current_steps": 4490, "total_steps": 12698, "loss": 0.2754, "lr": 3.266713525596776e-05, "epoch": 2.4751929437706726, "percentage": 35.36, "elapsed_time": "8:12:01", "remaining_time": "14:59:27"}
|
| 899 |
+
{"current_steps": 4495, "total_steps": 12698, "loss": 0.2585, "lr": 3.2645849646799406e-05, "epoch": 2.477949283351709, "percentage": 35.4, "elapsed_time": "8:12:28", "remaining_time": "14:58:43"}
|
| 900 |
+
{"current_steps": 4500, "total_steps": 12698, "loss": 0.2629, "lr": 3.262454014592097e-05, "epoch": 2.4807056229327453, "percentage": 35.44, "elapsed_time": "8:12:54", "remaining_time": "14:57:57"}
|
| 901 |
+
{"current_steps": 4505, "total_steps": 12698, "loss": 0.2621, "lr": 3.260320679359232e-05, "epoch": 2.4834619625137817, "percentage": 35.48, "elapsed_time": "8:13:58", "remaining_time": "14:58:22"}
|
| 902 |
+
{"current_steps": 4510, "total_steps": 12698, "loss": 0.2648, "lr": 3.258184963011842e-05, "epoch": 2.486218302094818, "percentage": 35.52, "elapsed_time": "8:14:26", "remaining_time": "14:57:40"}
|
| 903 |
+
{"current_steps": 4515, "total_steps": 12698, "loss": 0.2578, "lr": 3.2560468695849174e-05, "epoch": 2.4889746416758545, "percentage": 35.56, "elapsed_time": "8:14:52", "remaining_time": "14:56:54"}
|
| 904 |
+
{"current_steps": 4520, "total_steps": 12698, "loss": 0.2728, "lr": 3.253906403117945e-05, "epoch": 2.491730981256891, "percentage": 35.6, "elapsed_time": "8:15:17", "remaining_time": "14:56:07"}
|
| 905 |
+
{"current_steps": 4525, "total_steps": 12698, "loss": 0.269, "lr": 3.25176356765489e-05, "epoch": 2.4944873208379272, "percentage": 35.64, "elapsed_time": "8:15:40", "remaining_time": "14:55:16"}
|
| 906 |
+
{"current_steps": 4530, "total_steps": 12698, "loss": 0.2592, "lr": 3.249618367244197e-05, "epoch": 2.4972436604189636, "percentage": 35.67, "elapsed_time": "8:16:08", "remaining_time": "14:54:34"}
|
| 907 |
+
{"current_steps": 4535, "total_steps": 12698, "loss": 0.257, "lr": 3.2474708059387775e-05, "epoch": 2.5, "percentage": 35.71, "elapsed_time": "8:16:35", "remaining_time": "14:53:51"}
|
| 908 |
+
{"current_steps": 4540, "total_steps": 12698, "loss": 0.2676, "lr": 3.245320887796001e-05, "epoch": 2.5027563395810364, "percentage": 35.75, "elapsed_time": "8:17:03", "remaining_time": "14:53:09"}
|
| 909 |
+
{"current_steps": 4545, "total_steps": 12698, "loss": 0.2609, "lr": 3.2431686168776944e-05, "epoch": 2.5055126791620728, "percentage": 35.79, "elapsed_time": "8:17:33", "remaining_time": "14:52:31"}
|
| 910 |
+
{"current_steps": 4550, "total_steps": 12698, "loss": 0.2526, "lr": 3.241013997250126e-05, "epoch": 2.508269018743109, "percentage": 35.83, "elapsed_time": "8:17:58", "remaining_time": "14:51:45"}
|
| 911 |
+
{"current_steps": 4555, "total_steps": 12698, "loss": 0.2718, "lr": 3.2388570329840025e-05, "epoch": 2.5110253583241455, "percentage": 35.87, "elapsed_time": "8:18:23", "remaining_time": "14:50:59"}
|
| 912 |
+
{"current_steps": 4560, "total_steps": 12698, "loss": 0.2599, "lr": 3.236697728154461e-05, "epoch": 2.513781697905182, "percentage": 35.91, "elapsed_time": "8:18:51", "remaining_time": "14:50:18"}
|
| 913 |
+
{"current_steps": 4565, "total_steps": 12698, "loss": 0.2552, "lr": 3.234536086841061e-05, "epoch": 2.5165380374862183, "percentage": 35.95, "elapsed_time": "8:19:22", "remaining_time": "14:49:41"}
|
| 914 |
+
{"current_steps": 4570, "total_steps": 12698, "loss": 0.2476, "lr": 3.232372113127774e-05, "epoch": 2.5192943770672547, "percentage": 35.99, "elapsed_time": "8:19:46", "remaining_time": "14:48:52"}
|
| 915 |
+
{"current_steps": 4575, "total_steps": 12698, "loss": 0.2756, "lr": 3.230205811102979e-05, "epoch": 2.522050716648291, "percentage": 36.03, "elapsed_time": "8:20:13", "remaining_time": "14:48:09"}
|
| 916 |
+
{"current_steps": 4580, "total_steps": 12698, "loss": 0.2528, "lr": 3.228037184859456e-05, "epoch": 2.5248070562293274, "percentage": 36.07, "elapsed_time": "8:20:42", "remaining_time": "14:47:29"}
|
| 917 |
+
{"current_steps": 4585, "total_steps": 12698, "loss": 0.2734, "lr": 3.2258662384943745e-05, "epoch": 2.527563395810364, "percentage": 36.11, "elapsed_time": "8:21:06", "remaining_time": "14:46:41"}
|
| 918 |
+
{"current_steps": 4590, "total_steps": 12698, "loss": 0.2611, "lr": 3.2236929761092865e-05, "epoch": 2.5303197353914, "percentage": 36.15, "elapsed_time": "8:21:33", "remaining_time": "14:45:59"}
|
| 919 |
+
{"current_steps": 4595, "total_steps": 12698, "loss": 0.2689, "lr": 3.221517401810121e-05, "epoch": 2.5330760749724366, "percentage": 36.19, "elapsed_time": "8:22:02", "remaining_time": "14:45:19"}
|
| 920 |
+
{"current_steps": 4600, "total_steps": 12698, "loss": 0.2518, "lr": 3.219339519707173e-05, "epoch": 2.535832414553473, "percentage": 36.23, "elapsed_time": "8:22:29", "remaining_time": "14:44:35"}
|
| 921 |
+
{"current_steps": 4605, "total_steps": 12698, "loss": 0.2732, "lr": 3.217159333915101e-05, "epoch": 2.5385887541345094, "percentage": 36.27, "elapsed_time": "8:22:56", "remaining_time": "14:43:53"}
|
| 922 |
+
{"current_steps": 4610, "total_steps": 12698, "loss": 0.2537, "lr": 3.214976848552913e-05, "epoch": 2.5413450937155457, "percentage": 36.3, "elapsed_time": "8:23:23", "remaining_time": "14:43:10"}
|
| 923 |
+
{"current_steps": 4615, "total_steps": 12698, "loss": 0.2473, "lr": 3.212792067743963e-05, "epoch": 2.544101433296582, "percentage": 36.34, "elapsed_time": "8:23:50", "remaining_time": "14:42:27"}
|
| 924 |
+
{"current_steps": 4620, "total_steps": 12698, "loss": 0.2408, "lr": 3.21060499561594e-05, "epoch": 2.5468577728776185, "percentage": 36.38, "elapsed_time": "8:24:14", "remaining_time": "14:41:40"}
|
| 925 |
+
{"current_steps": 4625, "total_steps": 12698, "loss": 0.271, "lr": 3.208415636300864e-05, "epoch": 2.549614112458655, "percentage": 36.42, "elapsed_time": "8:24:43", "remaining_time": "14:41:00"}
|
| 926 |
+
{"current_steps": 4630, "total_steps": 12698, "loss": 0.2599, "lr": 3.2062239939350756e-05, "epoch": 2.5523704520396913, "percentage": 36.46, "elapsed_time": "8:25:12", "remaining_time": "14:40:21"}
|
| 927 |
+
{"current_steps": 4635, "total_steps": 12698, "loss": 0.2624, "lr": 3.204030072659229e-05, "epoch": 2.5551267916207276, "percentage": 36.5, "elapsed_time": "8:25:46", "remaining_time": "14:39:51"}
|
| 928 |
+
{"current_steps": 4640, "total_steps": 12698, "loss": 0.2583, "lr": 3.201833876618281e-05, "epoch": 2.557883131201764, "percentage": 36.54, "elapsed_time": "8:26:14", "remaining_time": "14:39:08"}
|
| 929 |
+
{"current_steps": 4645, "total_steps": 12698, "loss": 0.2677, "lr": 3.199635409961491e-05, "epoch": 2.5606394707828004, "percentage": 36.58, "elapsed_time": "8:26:42", "remaining_time": "14:38:28"}
|
| 930 |
+
{"current_steps": 4650, "total_steps": 12698, "loss": 0.2623, "lr": 3.197434676842404e-05, "epoch": 2.563395810363837, "percentage": 36.62, "elapsed_time": "8:27:09", "remaining_time": "14:37:46"}
|
| 931 |
+
{"current_steps": 4655, "total_steps": 12698, "loss": 0.2526, "lr": 3.19523168141885e-05, "epoch": 2.566152149944873, "percentage": 36.66, "elapsed_time": "8:27:35", "remaining_time": "14:37:01"}
|
| 932 |
+
{"current_steps": 4660, "total_steps": 12698, "loss": 0.2503, "lr": 3.193026427852932e-05, "epoch": 2.5689084895259096, "percentage": 36.7, "elapsed_time": "8:28:03", "remaining_time": "14:36:21"}
|
| 933 |
+
{"current_steps": 4665, "total_steps": 12698, "loss": 0.2489, "lr": 3.190818920311018e-05, "epoch": 2.571664829106946, "percentage": 36.74, "elapsed_time": "8:28:29", "remaining_time": "14:35:36"}
|
| 934 |
+
{"current_steps": 4670, "total_steps": 12698, "loss": 0.2502, "lr": 3.1886091629637376e-05, "epoch": 2.5744211686879823, "percentage": 36.78, "elapsed_time": "8:28:54", "remaining_time": "14:34:51"}
|
| 935 |
+
{"current_steps": 4675, "total_steps": 12698, "loss": 0.2424, "lr": 3.186397159985967e-05, "epoch": 2.5771775082690187, "percentage": 36.82, "elapsed_time": "8:29:23", "remaining_time": "14:34:11"}
|
| 936 |
+
{"current_steps": 4680, "total_steps": 12698, "loss": 0.2463, "lr": 3.1841829155568284e-05, "epoch": 2.579933847850055, "percentage": 36.86, "elapsed_time": "8:29:48", "remaining_time": "14:33:25"}
|
| 937 |
+
{"current_steps": 4685, "total_steps": 12698, "loss": 0.2473, "lr": 3.181966433859676e-05, "epoch": 2.5826901874310915, "percentage": 36.9, "elapsed_time": "8:30:15", "remaining_time": "14:32:43"}
|
| 938 |
+
{"current_steps": 4690, "total_steps": 12698, "loss": 0.2676, "lr": 3.179747719082094e-05, "epoch": 2.585446527012128, "percentage": 36.93, "elapsed_time": "8:30:40", "remaining_time": "14:31:56"}
|
| 939 |
+
{"current_steps": 4695, "total_steps": 12698, "loss": 0.2598, "lr": 3.1775267754158824e-05, "epoch": 2.5882028665931642, "percentage": 36.97, "elapsed_time": "8:31:06", "remaining_time": "14:31:13"}
|
| 940 |
+
{"current_steps": 4700, "total_steps": 12698, "loss": 0.2556, "lr": 3.1753036070570554e-05, "epoch": 2.5909592061742006, "percentage": 37.01, "elapsed_time": "8:31:31", "remaining_time": "14:30:28"}
|
| 941 |
+
{"current_steps": 4705, "total_steps": 12698, "loss": 0.2518, "lr": 3.1730782182058255e-05, "epoch": 2.593715545755237, "percentage": 37.05, "elapsed_time": "8:31:58", "remaining_time": "14:29:45"}
|
| 942 |
+
{"current_steps": 4710, "total_steps": 12698, "loss": 0.2455, "lr": 3.170850613066607e-05, "epoch": 2.5964718853362734, "percentage": 37.09, "elapsed_time": "8:32:26", "remaining_time": "14:29:05"}
|
| 943 |
+
{"current_steps": 4715, "total_steps": 12698, "loss": 0.2448, "lr": 3.168620795847994e-05, "epoch": 2.5992282249173098, "percentage": 37.13, "elapsed_time": "8:32:56", "remaining_time": "14:28:27"}
|
| 944 |
+
{"current_steps": 4720, "total_steps": 12698, "loss": 0.2485, "lr": 3.1663887707627666e-05, "epoch": 2.601984564498346, "percentage": 37.17, "elapsed_time": "8:33:24", "remaining_time": "14:27:47"}
|
| 945 |
+
{"current_steps": 4725, "total_steps": 12698, "loss": 0.2497, "lr": 3.164154542027872e-05, "epoch": 2.6047409040793825, "percentage": 37.21, "elapsed_time": "8:33:52", "remaining_time": "14:27:06"}
|