Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14b226c7c50675048cb0c2eecd73ceca347cdd605108af0f0b768a50dd8cc465
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da69f9d171f80af167aa76fd30082a9eebee7945161b89c9bab74def273940dd
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:085472deac36cb0c83c59b542e27b61ca618f1675792d2c27ea49ce2c31f1d05
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:533e2975ff9b99c5d981cb5747deaa054880a68f095277bfb443e24d7a13945c
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -645,3 +645,162 @@
|
|
645 |
{"current_steps": 645, "total_steps": 805, "loss": 1.5557, "lr": 9.259279090167994e-06, "epoch": 3.996908809891808, "percentage": 80.12, "elapsed_time": "9:26:18", "remaining_time": "2:20:28"}
|
646 |
{"current_steps": 646, "total_steps": 805, "loss": 0.87, "lr": 9.148514734018917e-06, "epoch": 4.006182380216384, "percentage": 80.25, "elapsed_time": "9:28:32", "remaining_time": "2:19:56"}
|
647 |
{"current_steps": 647, "total_steps": 805, "loss": 0.8649, "lr": 9.038331273364869e-06, "epoch": 4.012364760432766, "percentage": 80.37, "elapsed_time": "9:29:24", "remaining_time": "2:19:03"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
645 |
{"current_steps": 645, "total_steps": 805, "loss": 1.5557, "lr": 9.259279090167994e-06, "epoch": 3.996908809891808, "percentage": 80.12, "elapsed_time": "9:26:18", "remaining_time": "2:20:28"}
|
646 |
{"current_steps": 646, "total_steps": 805, "loss": 0.87, "lr": 9.148514734018917e-06, "epoch": 4.006182380216384, "percentage": 80.25, "elapsed_time": "9:28:32", "remaining_time": "2:19:56"}
|
647 |
{"current_steps": 647, "total_steps": 805, "loss": 0.8649, "lr": 9.038331273364869e-06, "epoch": 4.012364760432766, "percentage": 80.37, "elapsed_time": "9:29:24", "remaining_time": "2:19:03"}
|
648 |
+
{"current_steps": 648, "total_steps": 805, "loss": 0.8577, "lr": 8.928730782824755e-06, "epoch": 4.01854714064915, "percentage": 80.5, "elapsed_time": "9:30:15", "remaining_time": "2:18:09"}
|
649 |
+
{"current_steps": 649, "total_steps": 805, "loss": 0.8571, "lr": 8.819715326040965e-06, "epoch": 4.024729520865534, "percentage": 80.62, "elapsed_time": "9:31:06", "remaining_time": "2:17:16"}
|
650 |
+
{"current_steps": 650, "total_steps": 805, "loss": 0.8609, "lr": 8.711286955640332e-06, "epoch": 4.030911901081916, "percentage": 80.75, "elapsed_time": "9:31:57", "remaining_time": "2:16:23"}
|
651 |
+
{"current_steps": 651, "total_steps": 805, "loss": 0.8566, "lr": 8.603447713195634e-06, "epoch": 4.0370942812983, "percentage": 80.87, "elapsed_time": "9:32:49", "remaining_time": "2:15:30"}
|
652 |
+
{"current_steps": 652, "total_steps": 805, "loss": 0.8608, "lr": 8.496199629187072e-06, "epoch": 4.043276661514684, "percentage": 80.99, "elapsed_time": "9:33:40", "remaining_time": "2:14:37"}
|
653 |
+
{"current_steps": 653, "total_steps": 805, "loss": 0.8675, "lr": 8.389544722964076e-06, "epoch": 4.049459041731066, "percentage": 81.12, "elapsed_time": "9:34:31", "remaining_time": "2:13:44"}
|
654 |
+
{"current_steps": 654, "total_steps": 805, "loss": 0.8689, "lr": 8.283485002707233e-06, "epoch": 4.05564142194745, "percentage": 81.24, "elapsed_time": "9:35:22", "remaining_time": "2:12:50"}
|
655 |
+
{"current_steps": 655, "total_steps": 805, "loss": 0.853, "lr": 8.178022465390549e-06, "epoch": 4.061823802163833, "percentage": 81.37, "elapsed_time": "9:36:14", "remaining_time": "2:11:57"}
|
656 |
+
{"current_steps": 656, "total_steps": 805, "loss": 0.8645, "lr": 8.073159096743799e-06, "epoch": 4.068006182380216, "percentage": 81.49, "elapsed_time": "9:37:09", "remaining_time": "2:11:05"}
|
657 |
+
{"current_steps": 657, "total_steps": 805, "loss": 0.8517, "lr": 7.968896871215147e-06, "epoch": 4.0741885625966, "percentage": 81.61, "elapsed_time": "9:38:15", "remaining_time": "2:10:15"}
|
658 |
+
{"current_steps": 658, "total_steps": 805, "loss": 0.858, "lr": 7.865237751933965e-06, "epoch": 4.080370942812983, "percentage": 81.74, "elapsed_time": "9:39:10", "remaining_time": "2:09:23"}
|
659 |
+
{"current_steps": 659, "total_steps": 805, "loss": 0.8552, "lr": 7.762183690673887e-06, "epoch": 4.086553323029366, "percentage": 81.86, "elapsed_time": "9:40:01", "remaining_time": "2:08:30"}
|
660 |
+
{"current_steps": 660, "total_steps": 805, "loss": 0.8559, "lr": 7.659736627816064e-06, "epoch": 4.09273570324575, "percentage": 81.99, "elapsed_time": "9:40:52", "remaining_time": "2:07:37"}
|
661 |
+
{"current_steps": 661, "total_steps": 805, "loss": 0.8527, "lr": 7.557898492312561e-06, "epoch": 4.098918083462133, "percentage": 82.11, "elapsed_time": "9:41:44", "remaining_time": "2:06:43"}
|
662 |
+
{"current_steps": 662, "total_steps": 805, "loss": 0.8551, "lr": 7.456671201650145e-06, "epoch": 4.105100463678516, "percentage": 82.24, "elapsed_time": "9:42:35", "remaining_time": "2:05:50"}
|
663 |
+
{"current_steps": 663, "total_steps": 805, "loss": 0.8557, "lr": 7.356056661814106e-06, "epoch": 4.1112828438949, "percentage": 82.36, "elapsed_time": "9:43:26", "remaining_time": "2:04:57"}
|
664 |
+
{"current_steps": 664, "total_steps": 805, "loss": 0.8539, "lr": 7.256056767252402e-06, "epoch": 4.117465224111283, "percentage": 82.48, "elapsed_time": "9:44:17", "remaining_time": "2:04:04"}
|
665 |
+
{"current_steps": 665, "total_steps": 805, "loss": 0.853, "lr": 7.156673400839933e-06, "epoch": 4.123647604327666, "percentage": 82.61, "elapsed_time": "9:45:09", "remaining_time": "2:03:11"}
|
666 |
+
{"current_steps": 666, "total_steps": 805, "loss": 0.8464, "lr": 7.057908433843205e-06, "epoch": 4.12982998454405, "percentage": 82.73, "elapsed_time": "9:46:00", "remaining_time": "2:02:18"}
|
667 |
+
{"current_steps": 667, "total_steps": 805, "loss": 0.86, "lr": 6.959763725884956e-06, "epoch": 4.1360123647604325, "percentage": 82.86, "elapsed_time": "9:46:51", "remaining_time": "2:01:25"}
|
668 |
+
{"current_steps": 668, "total_steps": 805, "loss": 0.8559, "lr": 6.862241124909262e-06, "epoch": 4.142194744976816, "percentage": 82.98, "elapsed_time": "9:47:42", "remaining_time": "2:00:32"}
|
669 |
+
{"current_steps": 669, "total_steps": 805, "loss": 0.8547, "lr": 6.765342467146632e-06, "epoch": 4.1483771251932, "percentage": 83.11, "elapsed_time": "9:48:33", "remaining_time": "1:59:38"}
|
670 |
+
{"current_steps": 670, "total_steps": 805, "loss": 0.8563, "lr": 6.66906957707957e-06, "epoch": 4.1545595054095825, "percentage": 83.23, "elapsed_time": "9:49:24", "remaining_time": "1:58:45"}
|
671 |
+
{"current_steps": 671, "total_steps": 805, "loss": 0.8536, "lr": 6.5734242674080705e-06, "epoch": 4.160741885625966, "percentage": 83.35, "elapsed_time": "9:50:20", "remaining_time": "1:57:53"}
|
672 |
+
{"current_steps": 672, "total_steps": 805, "loss": 0.8624, "lr": 6.478408339015603e-06, "epoch": 4.166924265842349, "percentage": 83.48, "elapsed_time": "9:51:27", "remaining_time": "1:57:03"}
|
673 |
+
{"current_steps": 673, "total_steps": 805, "loss": 0.8588, "lr": 6.384023580935155e-06, "epoch": 4.1731066460587325, "percentage": 83.6, "elapsed_time": "9:52:21", "remaining_time": "1:56:11"}
|
674 |
+
{"current_steps": 674, "total_steps": 805, "loss": 0.8497, "lr": 6.290271770315541e-06, "epoch": 4.179289026275116, "percentage": 83.73, "elapsed_time": "9:53:12", "remaining_time": "1:55:17"}
|
675 |
+
{"current_steps": 675, "total_steps": 805, "loss": 0.859, "lr": 6.1971546723879864e-06, "epoch": 4.185471406491499, "percentage": 83.85, "elapsed_time": "9:54:04", "remaining_time": "1:54:24"}
|
676 |
+
{"current_steps": 676, "total_steps": 805, "loss": 0.8649, "lr": 6.104674040432797e-06, "epoch": 4.1916537867078825, "percentage": 83.98, "elapsed_time": "9:54:55", "remaining_time": "1:53:31"}
|
677 |
+
{"current_steps": 677, "total_steps": 805, "loss": 0.8536, "lr": 6.012831615746484e-06, "epoch": 4.197836166924266, "percentage": 84.1, "elapsed_time": "9:55:46", "remaining_time": "1:52:38"}
|
678 |
+
{"current_steps": 678, "total_steps": 805, "loss": 0.8633, "lr": 5.9216291276088435e-06, "epoch": 4.204018547140649, "percentage": 84.22, "elapsed_time": "9:56:37", "remaining_time": "1:51:45"}
|
679 |
+
{"current_steps": 679, "total_steps": 805, "loss": 0.863, "lr": 5.831068293250481e-06, "epoch": 4.210200927357032, "percentage": 84.35, "elapsed_time": "9:57:29", "remaining_time": "1:50:52"}
|
680 |
+
{"current_steps": 680, "total_steps": 805, "loss": 0.8623, "lr": 5.74115081782042e-06, "epoch": 4.216383307573416, "percentage": 84.47, "elapsed_time": "9:58:20", "remaining_time": "1:49:59"}
|
681 |
+
{"current_steps": 681, "total_steps": 805, "loss": 0.8582, "lr": 5.651878394354091e-06, "epoch": 4.222565687789799, "percentage": 84.6, "elapsed_time": "9:59:11", "remaining_time": "1:49:06"}
|
682 |
+
{"current_steps": 682, "total_steps": 805, "loss": 0.8565, "lr": 5.563252703741322e-06, "epoch": 4.228748068006182, "percentage": 84.72, "elapsed_time": "10:00:03", "remaining_time": "1:48:13"}
|
683 |
+
{"current_steps": 683, "total_steps": 805, "loss": 0.8553, "lr": 5.475275414694787e-06, "epoch": 4.234930448222566, "percentage": 84.84, "elapsed_time": "10:00:54", "remaining_time": "1:47:20"}
|
684 |
+
{"current_steps": 684, "total_steps": 805, "loss": 0.8586, "lr": 5.387948183718563e-06, "epoch": 4.241112828438949, "percentage": 84.97, "elapsed_time": "10:01:45", "remaining_time": "1:46:27"}
|
685 |
+
{"current_steps": 685, "total_steps": 805, "loss": 0.8639, "lr": 5.30127265507693e-06, "epoch": 4.247295208655332, "percentage": 85.09, "elapsed_time": "10:02:36", "remaining_time": "1:45:33"}
|
686 |
+
{"current_steps": 686, "total_steps": 805, "loss": 0.845, "lr": 5.215250460763397e-06, "epoch": 4.253477588871716, "percentage": 85.22, "elapsed_time": "10:03:32", "remaining_time": "1:44:41"}
|
687 |
+
{"current_steps": 687, "total_steps": 805, "loss": 0.8509, "lr": 5.129883220470007e-06, "epoch": 4.259659969088099, "percentage": 85.34, "elapsed_time": "10:04:38", "remaining_time": "1:43:51"}
|
688 |
+
{"current_steps": 688, "total_steps": 805, "loss": 0.8522, "lr": 5.045172541556831e-06, "epoch": 4.265842349304482, "percentage": 85.47, "elapsed_time": "10:05:31", "remaining_time": "1:42:58"}
|
689 |
+
{"current_steps": 689, "total_steps": 805, "loss": 0.8647, "lr": 4.961120019021684e-06, "epoch": 4.272024729520865, "percentage": 85.59, "elapsed_time": "10:06:22", "remaining_time": "1:42:05"}
|
690 |
+
{"current_steps": 690, "total_steps": 805, "loss": 0.8586, "lr": 4.877727235470113e-06, "epoch": 4.278207109737249, "percentage": 85.71, "elapsed_time": "10:07:13", "remaining_time": "1:41:12"}
|
691 |
+
{"current_steps": 691, "total_steps": 805, "loss": 0.8606, "lr": 4.794995761085593e-06, "epoch": 4.284389489953632, "percentage": 85.84, "elapsed_time": "10:08:04", "remaining_time": "1:40:19"}
|
692 |
+
{"current_steps": 692, "total_steps": 805, "loss": 0.8561, "lr": 4.712927153599967e-06, "epoch": 4.290571870170015, "percentage": 85.96, "elapsed_time": "10:08:55", "remaining_time": "1:39:26"}
|
693 |
+
{"current_steps": 693, "total_steps": 805, "loss": 0.8526, "lr": 4.631522958264083e-06, "epoch": 4.296754250386399, "percentage": 86.09, "elapsed_time": "10:09:47", "remaining_time": "1:38:33"}
|
694 |
+
{"current_steps": 694, "total_steps": 805, "loss": 0.8556, "lr": 4.550784707818756e-06, "epoch": 4.302936630602782, "percentage": 86.21, "elapsed_time": "10:10:38", "remaining_time": "1:37:40"}
|
695 |
+
{"current_steps": 695, "total_steps": 805, "loss": 0.8616, "lr": 4.47071392246587e-06, "epoch": 4.309119010819165, "percentage": 86.34, "elapsed_time": "10:11:29", "remaining_time": "1:36:46"}
|
696 |
+
{"current_steps": 696, "total_steps": 805, "loss": 0.8595, "lr": 4.3913121098397675e-06, "epoch": 4.315301391035549, "percentage": 86.46, "elapsed_time": "10:12:20", "remaining_time": "1:35:53"}
|
697 |
+
{"current_steps": 697, "total_steps": 805, "loss": 0.8472, "lr": 4.312580764978825e-06, "epoch": 4.321483771251932, "percentage": 86.58, "elapsed_time": "10:13:12", "remaining_time": "1:35:00"}
|
698 |
+
{"current_steps": 698, "total_steps": 805, "loss": 0.8652, "lr": 4.234521370297398e-06, "epoch": 4.327666151468315, "percentage": 86.71, "elapsed_time": "10:14:03", "remaining_time": "1:34:07"}
|
699 |
+
{"current_steps": 699, "total_steps": 805, "loss": 0.862, "lr": 4.157135395557786e-06, "epoch": 4.333848531684699, "percentage": 86.83, "elapsed_time": "10:14:54", "remaining_time": "1:33:14"}
|
700 |
+
{"current_steps": 700, "total_steps": 805, "loss": 0.8626, "lr": 4.080424297842656e-06, "epoch": 4.340030911901082, "percentage": 86.96, "elapsed_time": "10:15:45", "remaining_time": "1:32:21"}
|
701 |
+
{"current_steps": 701, "total_steps": 805, "loss": 0.8599, "lr": 4.004389521527543e-06, "epoch": 4.346213292117465, "percentage": 87.08, "elapsed_time": "10:16:41", "remaining_time": "1:31:29"}
|
702 |
+
{"current_steps": 702, "total_steps": 805, "loss": 0.8643, "lr": 3.929032498253729e-06, "epoch": 4.352395672333849, "percentage": 87.2, "elapsed_time": "10:17:48", "remaining_time": "1:30:38"}
|
703 |
+
{"current_steps": 703, "total_steps": 805, "loss": 0.8684, "lr": 3.8543546469011904e-06, "epoch": 4.358578052550232, "percentage": 87.33, "elapsed_time": "10:18:41", "remaining_time": "1:29:46"}
|
704 |
+
{"current_steps": 704, "total_steps": 805, "loss": 0.8554, "lr": 3.780357373561958e-06, "epoch": 4.364760432766615, "percentage": 87.45, "elapsed_time": "10:19:32", "remaining_time": "1:28:53"}
|
705 |
+
{"current_steps": 705, "total_steps": 805, "loss": 0.8649, "lr": 3.7070420715136133e-06, "epoch": 4.370942812982999, "percentage": 87.58, "elapsed_time": "10:20:24", "remaining_time": "1:28:00"}
|
706 |
+
{"current_steps": 706, "total_steps": 805, "loss": 0.8549, "lr": 3.634410121193059e-06, "epoch": 4.377125193199381, "percentage": 87.7, "elapsed_time": "10:21:15", "remaining_time": "1:27:07"}
|
707 |
+
{"current_steps": 707, "total_steps": 805, "loss": 0.848, "lr": 3.562462890170526e-06, "epoch": 4.383307573415765, "percentage": 87.83, "elapsed_time": "10:22:06", "remaining_time": "1:26:13"}
|
708 |
+
{"current_steps": 708, "total_steps": 805, "loss": 0.8634, "lr": 3.4912017331238057e-06, "epoch": 4.3894899536321486, "percentage": 87.95, "elapsed_time": "10:22:57", "remaining_time": "1:25:20"}
|
709 |
+
{"current_steps": 709, "total_steps": 805, "loss": 0.8595, "lr": 3.420627991812788e-06, "epoch": 4.395672333848531, "percentage": 88.07, "elapsed_time": "10:23:48", "remaining_time": "1:24:27"}
|
710 |
+
{"current_steps": 710, "total_steps": 805, "loss": 0.8526, "lr": 3.3507429950541527e-06, "epoch": 4.401854714064915, "percentage": 88.2, "elapsed_time": "10:24:40", "remaining_time": "1:23:34"}
|
711 |
+
{"current_steps": 711, "total_steps": 805, "loss": 0.8583, "lr": 3.281548058696373e-06, "epoch": 4.4080370942812985, "percentage": 88.32, "elapsed_time": "10:25:31", "remaining_time": "1:22:41"}
|
712 |
+
{"current_steps": 712, "total_steps": 805, "loss": 0.8671, "lr": 3.2130444855949406e-06, "epoch": 4.414219474497681, "percentage": 88.45, "elapsed_time": "10:26:22", "remaining_time": "1:21:48"}
|
713 |
+
{"current_steps": 713, "total_steps": 805, "loss": 0.8616, "lr": 3.145233565587824e-06, "epoch": 4.420401854714065, "percentage": 88.57, "elapsed_time": "10:27:14", "remaining_time": "1:20:56"}
|
714 |
+
{"current_steps": 714, "total_steps": 805, "loss": 0.8566, "lr": 3.078116575471173e-06, "epoch": 4.4265842349304485, "percentage": 88.7, "elapsed_time": "10:28:05", "remaining_time": "1:20:03"}
|
715 |
+
{"current_steps": 715, "total_steps": 805, "loss": 0.8581, "lr": 3.0116947789753028e-06, "epoch": 4.432766615146831, "percentage": 88.82, "elapsed_time": "10:28:57", "remaining_time": "1:19:10"}
|
716 |
+
{"current_steps": 716, "total_steps": 805, "loss": 0.8646, "lr": 2.9459694267408977e-06, "epoch": 4.438948995363215, "percentage": 88.94, "elapsed_time": "10:29:53", "remaining_time": "1:18:17"}
|
717 |
+
{"current_steps": 717, "total_steps": 805, "loss": 0.8636, "lr": 2.8809417562954435e-06, "epoch": 4.4451313755795985, "percentage": 89.07, "elapsed_time": "10:30:59", "remaining_time": "1:17:26"}
|
718 |
+
{"current_steps": 718, "total_steps": 805, "loss": 0.8474, "lr": 2.8166129920299278e-06, "epoch": 4.451313755795981, "percentage": 89.19, "elapsed_time": "10:31:52", "remaining_time": "1:16:33"}
|
719 |
+
{"current_steps": 719, "total_steps": 805, "loss": 0.848, "lr": 2.752984345175809e-06, "epoch": 4.457496136012365, "percentage": 89.32, "elapsed_time": "10:32:43", "remaining_time": "1:15:40"}
|
720 |
+
{"current_steps": 720, "total_steps": 805, "loss": 0.8599, "lr": 2.690057013782195e-06, "epoch": 4.4636785162287484, "percentage": 89.44, "elapsed_time": "10:33:34", "remaining_time": "1:14:47"}
|
721 |
+
{"current_steps": 721, "total_steps": 805, "loss": 0.8585, "lr": 2.6278321826932818e-06, "epoch": 4.469860896445131, "percentage": 89.57, "elapsed_time": "10:34:26", "remaining_time": "1:13:54"}
|
722 |
+
{"current_steps": 722, "total_steps": 805, "loss": 0.8704, "lr": 2.566311023526056e-06, "epoch": 4.476043276661515, "percentage": 89.69, "elapsed_time": "10:35:17", "remaining_time": "1:13:01"}
|
723 |
+
{"current_steps": 723, "total_steps": 805, "loss": 0.8619, "lr": 2.5054946946482208e-06, "epoch": 4.4822256568778975, "percentage": 89.81, "elapsed_time": "10:36:08", "remaining_time": "1:12:08"}
|
724 |
+
{"current_steps": 724, "total_steps": 805, "loss": 0.8498, "lr": 2.445384341156389e-06, "epoch": 4.488408037094281, "percentage": 89.94, "elapsed_time": "10:36:59", "remaining_time": "1:11:15"}
|
725 |
+
{"current_steps": 725, "total_steps": 805, "loss": 0.8567, "lr": 2.3859810948545414e-06, "epoch": 4.494590417310665, "percentage": 90.06, "elapsed_time": "10:37:51", "remaining_time": "1:10:23"}
|
726 |
+
{"current_steps": 726, "total_steps": 805, "loss": 0.8556, "lr": 2.3272860742326798e-06, "epoch": 4.500772797527048, "percentage": 90.19, "elapsed_time": "10:38:42", "remaining_time": "1:09:30"}
|
727 |
+
{"current_steps": 727, "total_steps": 805, "loss": 0.8533, "lr": 2.269300384445812e-06, "epoch": 4.506955177743431, "percentage": 90.31, "elapsed_time": "10:39:33", "remaining_time": "1:08:37"}
|
728 |
+
{"current_steps": 728, "total_steps": 805, "loss": 0.856, "lr": 2.2120251172931082e-06, "epoch": 4.513137557959815, "percentage": 90.43, "elapsed_time": "10:40:24", "remaining_time": "1:07:44"}
|
729 |
+
{"current_steps": 729, "total_steps": 805, "loss": 0.8583, "lr": 2.15546135119733e-06, "epoch": 4.5193199381761975, "percentage": 90.56, "elapsed_time": "10:41:15", "remaining_time": "1:06:51"}
|
730 |
+
{"current_steps": 730, "total_steps": 805, "loss": 0.8522, "lr": 2.0996101511846056e-06, "epoch": 4.525502318392581, "percentage": 90.68, "elapsed_time": "10:42:07", "remaining_time": "1:05:58"}
|
731 |
+
{"current_steps": 731, "total_steps": 805, "loss": 0.8537, "lr": 2.0444725688642685e-06, "epoch": 4.531684698608965, "percentage": 90.81, "elapsed_time": "10:43:03", "remaining_time": "1:05:05"}
|
732 |
+
{"current_steps": 732, "total_steps": 805, "loss": 0.8552, "lr": 1.9900496424091375e-06, "epoch": 4.5378670788253475, "percentage": 90.93, "elapsed_time": "10:44:10", "remaining_time": "1:04:14"}
|
733 |
+
{"current_steps": 733, "total_steps": 805, "loss": 0.8562, "lr": 1.9363423965359195e-06, "epoch": 4.544049459041731, "percentage": 91.06, "elapsed_time": "10:45:03", "remaining_time": "1:03:21"}
|
734 |
+
{"current_steps": 734, "total_steps": 805, "loss": 0.8506, "lr": 1.883351842485972e-06, "epoch": 4.550231839258115, "percentage": 91.18, "elapsed_time": "10:45:55", "remaining_time": "1:02:28"}
|
735 |
+
{"current_steps": 735, "total_steps": 805, "loss": 0.8589, "lr": 1.8310789780061887e-06, "epoch": 4.556414219474497, "percentage": 91.3, "elapsed_time": "10:46:46", "remaining_time": "1:01:35"}
|
736 |
+
{"current_steps": 736, "total_steps": 805, "loss": 0.8568, "lr": 1.7795247873302735e-06, "epoch": 4.562596599690881, "percentage": 91.43, "elapsed_time": "10:47:37", "remaining_time": "1:00:42"}
|
737 |
+
{"current_steps": 737, "total_steps": 805, "loss": 0.8549, "lr": 1.728690241160189e-06, "epoch": 4.568778979907265, "percentage": 91.55, "elapsed_time": "10:48:29", "remaining_time": "0:59:49"}
|
738 |
+
{"current_steps": 738, "total_steps": 805, "loss": 0.8616, "lr": 1.6785762966478715e-06, "epoch": 4.574961360123647, "percentage": 91.68, "elapsed_time": "10:49:20", "remaining_time": "0:58:57"}
|
739 |
+
{"current_steps": 739, "total_steps": 805, "loss": 0.85, "lr": 1.6291838973772068e-06, "epoch": 4.581143740340031, "percentage": 91.8, "elapsed_time": "10:50:11", "remaining_time": "0:58:04"}
|
740 |
+
{"current_steps": 740, "total_steps": 805, "loss": 0.8542, "lr": 1.5805139733462827e-06, "epoch": 4.587326120556414, "percentage": 91.93, "elapsed_time": "10:51:03", "remaining_time": "0:57:11"}
|
741 |
+
{"current_steps": 741, "total_steps": 805, "loss": 0.863, "lr": 1.532567440949868e-06, "epoch": 4.593508500772797, "percentage": 92.05, "elapsed_time": "10:51:54", "remaining_time": "0:56:18"}
|
742 |
+
{"current_steps": 742, "total_steps": 805, "loss": 0.8582, "lr": 1.4853452029621518e-06, "epoch": 4.599690880989181, "percentage": 92.17, "elapsed_time": "10:52:45", "remaining_time": "0:55:25"}
|
743 |
+
{"current_steps": 743, "total_steps": 805, "loss": 0.8666, "lr": 1.4388481485197558e-06, "epoch": 4.605873261205565, "percentage": 92.3, "elapsed_time": "10:53:37", "remaining_time": "0:54:32"}
|
744 |
+
{"current_steps": 744, "total_steps": 805, "loss": 0.8543, "lr": 1.3930771531049847e-06, "epoch": 4.612055641421947, "percentage": 92.42, "elapsed_time": "10:54:28", "remaining_time": "0:53:39"}
|
745 |
+
{"current_steps": 745, "total_steps": 805, "loss": 0.8605, "lr": 1.3480330785293494e-06, "epoch": 4.618238021638331, "percentage": 92.55, "elapsed_time": "10:55:19", "remaining_time": "0:52:46"}
|
746 |
+
{"current_steps": 746, "total_steps": 805, "loss": 0.8602, "lr": 1.3037167729173273e-06, "epoch": 4.624420401854714, "percentage": 92.67, "elapsed_time": "10:56:16", "remaining_time": "0:51:54"}
|
747 |
+
{"current_steps": 747, "total_steps": 805, "loss": 0.8612, "lr": 1.2601290706904102e-06, "epoch": 4.630602782071097, "percentage": 92.8, "elapsed_time": "10:57:22", "remaining_time": "0:51:02"}
|
748 |
+
{"current_steps": 748, "total_steps": 805, "loss": 0.8692, "lr": 1.2172707925513838e-06, "epoch": 4.636785162287481, "percentage": 92.92, "elapsed_time": "10:58:16", "remaining_time": "0:50:09"}
|
749 |
+
{"current_steps": 749, "total_steps": 805, "loss": 0.8739, "lr": 1.1751427454688735e-06, "epoch": 4.642967542503864, "percentage": 93.04, "elapsed_time": "10:59:07", "remaining_time": "0:49:16"}
|
750 |
+
{"current_steps": 750, "total_steps": 805, "loss": 0.8507, "lr": 1.1337457226621518e-06, "epoch": 4.649149922720247, "percentage": 93.17, "elapsed_time": "10:59:59", "remaining_time": "0:48:23"}
|
751 |
+
{"current_steps": 751, "total_steps": 805, "loss": 0.8688, "lr": 1.0930805035862125e-06, "epoch": 4.655332302936631, "percentage": 93.29, "elapsed_time": "11:00:50", "remaining_time": "0:47:31"}
|
752 |
+
{"current_steps": 752, "total_steps": 805, "loss": 0.8576, "lr": 1.0531478539170713e-06, "epoch": 4.661514683153014, "percentage": 93.42, "elapsed_time": "11:01:41", "remaining_time": "0:46:38"}
|
753 |
+
{"current_steps": 753, "total_steps": 805, "loss": 0.8586, "lr": 1.0139485255373826e-06, "epoch": 4.667697063369397, "percentage": 93.54, "elapsed_time": "11:02:33", "remaining_time": "0:45:45"}
|
754 |
+
{"current_steps": 754, "total_steps": 805, "loss": 0.8732, "lr": 9.75483256522236e-07, "epoch": 4.673879443585781, "percentage": 93.66, "elapsed_time": "11:03:24", "remaining_time": "0:44:52"}
|
755 |
+
{"current_steps": 755, "total_steps": 805, "loss": 0.8501, "lr": 9.377527711253198e-07, "epoch": 4.680061823802164, "percentage": 93.79, "elapsed_time": "11:04:15", "remaining_time": "0:43:59"}
|
756 |
+
{"current_steps": 756, "total_steps": 805, "loss": 0.8606, "lr": 9.007577797652245e-07, "epoch": 4.686244204018547, "percentage": 93.91, "elapsed_time": "11:05:07", "remaining_time": "0:43:06"}
|
757 |
+
{"current_steps": 757, "total_steps": 805, "loss": 0.8687, "lr": 8.644989790121072e-07, "epoch": 4.69242658423493, "percentage": 94.04, "elapsed_time": "11:05:58", "remaining_time": "0:42:13"}
|
758 |
+
{"current_steps": 758, "total_steps": 805, "loss": 0.8623, "lr": 8.289770515745599e-07, "epoch": 4.698608964451314, "percentage": 94.16, "elapsed_time": "11:06:49", "remaining_time": "0:41:20"}
|
759 |
+
{"current_steps": 759, "total_steps": 805, "loss": 0.8663, "lr": 7.941926662867528e-07, "epoch": 4.704791344667697, "percentage": 94.29, "elapsed_time": "11:07:41", "remaining_time": "0:40:27"}
|
760 |
+
{"current_steps": 760, "total_steps": 805, "loss": 0.8533, "lr": 7.60146478095849e-07, "epoch": 4.710973724884081, "percentage": 94.41, "elapsed_time": "11:08:32", "remaining_time": "0:39:35"}
|
761 |
+
{"current_steps": 761, "total_steps": 805, "loss": 0.8545, "lr": 7.268391280496589e-07, "epoch": 4.717156105100464, "percentage": 94.53, "elapsed_time": "11:09:28", "remaining_time": "0:38:42"}
|
762 |
+
{"current_steps": 762, "total_steps": 805, "loss": 0.8593, "lr": 6.94271243284601e-07, "epoch": 4.723338485316847, "percentage": 94.66, "elapsed_time": "11:10:35", "remaining_time": "0:37:50"}
|
763 |
+
{"current_steps": 763, "total_steps": 805, "loss": 0.8637, "lr": 6.624434370138532e-07, "epoch": 4.72952086553323, "percentage": 94.78, "elapsed_time": "11:11:28", "remaining_time": "0:36:57"}
|
764 |
+
{"current_steps": 764, "total_steps": 805, "loss": 0.8527, "lr": 6.313563085158425e-07, "epoch": 4.7357032457496135, "percentage": 94.91, "elapsed_time": "11:12:19", "remaining_time": "0:36:04"}
|
765 |
+
{"current_steps": 765, "total_steps": 805, "loss": 0.8512, "lr": 6.010104431229202e-07, "epoch": 4.741885625965997, "percentage": 95.03, "elapsed_time": "11:13:11", "remaining_time": "0:35:11"}
|
766 |
+
{"current_steps": 766, "total_steps": 805, "loss": 0.8535, "lr": 5.714064122103935e-07, "epoch": 4.74806800618238, "percentage": 95.16, "elapsed_time": "11:14:02", "remaining_time": "0:34:19"}
|
767 |
+
{"current_steps": 767, "total_steps": 805, "loss": 0.8563, "lr": 5.425447731857248e-07, "epoch": 4.7542503863987635, "percentage": 95.28, "elapsed_time": "11:14:53", "remaining_time": "0:33:26"}
|
768 |
+
{"current_steps": 768, "total_steps": 805, "loss": 0.8558, "lr": 5.144260694780512e-07, "epoch": 4.760432766615147, "percentage": 95.4, "elapsed_time": "11:15:44", "remaining_time": "0:32:33"}
|
769 |
+
{"current_steps": 769, "total_steps": 805, "loss": 0.8574, "lr": 4.870508305279531e-07, "epoch": 4.76661514683153, "percentage": 95.53, "elapsed_time": "11:16:35", "remaining_time": "0:31:40"}
|
770 |
+
{"current_steps": 770, "total_steps": 805, "loss": 0.8678, "lr": 4.604195717774973e-07, "epoch": 4.7727975270479135, "percentage": 95.65, "elapsed_time": "11:17:26", "remaining_time": "0:30:47"}
|
771 |
+
{"current_steps": 771, "total_steps": 805, "loss": 0.8652, "lr": 4.3453279466049383e-07, "epoch": 4.778979907264297, "percentage": 95.78, "elapsed_time": "11:18:17", "remaining_time": "0:29:54"}
|
772 |
+
{"current_steps": 772, "total_steps": 805, "loss": 0.8489, "lr": 4.0939098659309895e-07, "epoch": 4.78516228748068, "percentage": 95.9, "elapsed_time": "11:19:09", "remaining_time": "0:29:01"}
|
773 |
+
{"current_steps": 773, "total_steps": 805, "loss": 0.87, "lr": 3.849946209646138e-07, "epoch": 4.7913446676970635, "percentage": 96.02, "elapsed_time": "11:20:00", "remaining_time": "0:28:09"}
|
774 |
+
{"current_steps": 774, "total_steps": 805, "loss": 0.861, "lr": 3.6134415712857587e-07, "epoch": 4.797527047913446, "percentage": 96.15, "elapsed_time": "11:20:51", "remaining_time": "0:27:16"}
|
775 |
+
{"current_steps": 775, "total_steps": 805, "loss": 0.8506, "lr": 3.384400403941124e-07, "epoch": 4.80370942812983, "percentage": 96.27, "elapsed_time": "11:21:43", "remaining_time": "0:26:23"}
|
776 |
+
{"current_steps": 776, "total_steps": 805, "loss": 0.8498, "lr": 3.1628270201754743e-07, "epoch": 4.809891808346213, "percentage": 96.4, "elapsed_time": "11:22:40", "remaining_time": "0:25:30"}
|
777 |
+
{"current_steps": 777, "total_steps": 805, "loss": 0.8537, "lr": 2.948725591942925e-07, "epoch": 4.816074188562597, "percentage": 96.52, "elapsed_time": "11:23:46", "remaining_time": "0:24:38"}
|
778 |
+
{"current_steps": 778, "total_steps": 805, "loss": 0.8668, "lr": 2.742100150509819e-07, "epoch": 4.82225656877898, "percentage": 96.65, "elapsed_time": "11:24:39", "remaining_time": "0:23:45"}
|
779 |
+
{"current_steps": 779, "total_steps": 805, "loss": 0.8657, "lr": 2.542954586378921e-07, "epoch": 4.828438948995363, "percentage": 96.77, "elapsed_time": "11:25:30", "remaining_time": "0:22:52"}
|
780 |
+
{"current_steps": 780, "total_steps": 805, "loss": 0.8631, "lr": 2.351292649216097e-07, "epoch": 4.834621329211746, "percentage": 96.89, "elapsed_time": "11:26:21", "remaining_time": "0:21:59"}
|
781 |
+
{"current_steps": 781, "total_steps": 805, "loss": 0.8657, "lr": 2.167117947779751e-07, "epoch": 4.84080370942813, "percentage": 97.02, "elapsed_time": "11:27:13", "remaining_time": "0:21:07"}
|
782 |
+
{"current_steps": 782, "total_steps": 805, "loss": 0.8666, "lr": 1.990433949852788e-07, "epoch": 4.846986089644513, "percentage": 97.14, "elapsed_time": "11:28:04", "remaining_time": "0:20:14"}
|
783 |
+
{"current_steps": 783, "total_steps": 805, "loss": 0.8635, "lr": 1.821243982177423e-07, "epoch": 4.853168469860896, "percentage": 97.27, "elapsed_time": "11:28:55", "remaining_time": "0:19:21"}
|
784 |
+
{"current_steps": 784, "total_steps": 805, "loss": 0.8496, "lr": 1.6595512303925199e-07, "epoch": 4.85935085007728, "percentage": 97.39, "elapsed_time": "11:29:46", "remaining_time": "0:18:28"}
|
785 |
+
{"current_steps": 785, "total_steps": 805, "loss": 0.8764, "lr": 1.5053587389735502e-07, "epoch": 4.865533230293663, "percentage": 97.52, "elapsed_time": "11:30:38", "remaining_time": "0:17:35"}
|
786 |
+
{"current_steps": 786, "total_steps": 805, "loss": 0.8548, "lr": 1.358669411175395e-07, "epoch": 4.871715610510046, "percentage": 97.64, "elapsed_time": "11:31:29", "remaining_time": "0:16:42"}
|
787 |
+
{"current_steps": 787, "total_steps": 805, "loss": 0.8653, "lr": 1.2194860089774995e-07, "epoch": 4.87789799072643, "percentage": 97.76, "elapsed_time": "11:32:20", "remaining_time": "0:15:50"}
|
788 |
+
{"current_steps": 788, "total_steps": 805, "loss": 0.8623, "lr": 1.0878111530320478e-07, "epoch": 4.884080370942813, "percentage": 97.89, "elapsed_time": "11:33:11", "remaining_time": "0:14:57"}
|
789 |
+
{"current_steps": 789, "total_steps": 805, "loss": 0.8614, "lr": 9.636473226144916e-08, "epoch": 4.890262751159196, "percentage": 98.01, "elapsed_time": "11:34:02", "remaining_time": "0:14:04"}
|
790 |
+
{"current_steps": 790, "total_steps": 805, "loss": 0.8647, "lr": 8.469968555769648e-08, "epoch": 4.89644513137558, "percentage": 98.14, "elapsed_time": "11:34:54", "remaining_time": "0:13:11"}
|
791 |
+
{"current_steps": 791, "total_steps": 805, "loss": 0.8482, "lr": 7.37861948304186e-08, "epoch": 4.902627511591962, "percentage": 98.26, "elapsed_time": "11:35:51", "remaining_time": "0:12:18"}
|
792 |
+
{"current_steps": 792, "total_steps": 805, "loss": 0.851, "lr": 6.362446556720691e-08, "epoch": 4.908809891808346, "percentage": 98.39, "elapsed_time": "11:36:58", "remaining_time": "0:11:26"}
|
793 |
+
{"current_steps": 793, "total_steps": 805, "loss": 0.8663, "lr": 5.421468910092209e-08, "epoch": 4.91499227202473, "percentage": 98.51, "elapsed_time": "11:37:50", "remaining_time": "0:10:33"}
|
794 |
+
{"current_steps": 794, "total_steps": 805, "loss": 0.8488, "lr": 4.555704260607474e-08, "epoch": 4.921174652241113, "percentage": 98.63, "elapsed_time": "11:38:42", "remaining_time": "0:09:40"}
|
795 |
+
{"current_steps": 795, "total_steps": 805, "loss": 0.8606, "lr": 3.765168909548589e-08, "epoch": 4.927357032457496, "percentage": 98.76, "elapsed_time": "11:39:33", "remaining_time": "0:08:47"}
|
796 |
+
{"current_steps": 796, "total_steps": 805, "loss": 0.8639, "lr": 3.049877741723606e-08, "epoch": 4.93353941267388, "percentage": 98.88, "elapsed_time": "11:40:24", "remaining_time": "0:07:55"}
|
797 |
+
{"current_steps": 797, "total_steps": 805, "loss": 0.8559, "lr": 2.4098442251849762e-08, "epoch": 4.939721792890262, "percentage": 99.01, "elapsed_time": "11:41:15", "remaining_time": "0:07:02"}
|
798 |
+
{"current_steps": 798, "total_steps": 805, "loss": 0.8421, "lr": 1.8450804109759745e-08, "epoch": 4.945904173106646, "percentage": 99.13, "elapsed_time": "11:42:07", "remaining_time": "0:06:09"}
|
799 |
+
{"current_steps": 799, "total_steps": 805, "loss": 0.8565, "lr": 1.3555969329037688e-08, "epoch": 4.95208655332303, "percentage": 99.25, "elapsed_time": "11:42:58", "remaining_time": "0:05:16"}
|
800 |
+
{"current_steps": 800, "total_steps": 805, "loss": 0.8638, "lr": 9.41403007340025e-09, "epoch": 4.958268933539412, "percentage": 99.38, "elapsed_time": "11:43:50", "remaining_time": "0:04:23"}
|
801 |
+
{"current_steps": 801, "total_steps": 805, "loss": 0.8553, "lr": 6.025064330463792e-09, "epoch": 4.964451313755796, "percentage": 99.5, "elapsed_time": "11:44:41", "remaining_time": "0:03:31"}
|
802 |
+
{"current_steps": 802, "total_steps": 805, "loss": 0.8633, "lr": 3.3891359102877773e-09, "epoch": 4.97063369397218, "percentage": 99.63, "elapsed_time": "11:45:32", "remaining_time": "0:02:38"}
|
803 |
+
{"current_steps": 803, "total_steps": 805, "loss": 0.8764, "lr": 1.506294444153511e-09, "epoch": 4.976816074188562, "percentage": 99.75, "elapsed_time": "11:46:24", "remaining_time": "0:01:45"}
|
804 |
+
{"current_steps": 804, "total_steps": 805, "loss": 0.8589, "lr": 3.7657538364932467e-10, "epoch": 4.982998454404946, "percentage": 99.88, "elapsed_time": "11:47:15", "remaining_time": "0:00:52"}
|
805 |
+
{"current_steps": 805, "total_steps": 805, "loss": 0.8693, "lr": 0.0, "epoch": 4.9891808346213296, "percentage": 100.0, "elapsed_time": "11:48:07", "remaining_time": "0:00:00"}
|
806 |
+
{"current_steps": 805, "total_steps": 805, "epoch": 4.9891808346213296, "percentage": 100.0, "elapsed_time": "11:49:37", "remaining_time": "0:00:00"}
|