sedrickkeh commited on
Commit
a6f37bf
·
verified ·
1 Parent(s): b0dbcb2

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f2847db22199909f646da9598708ba8a76fca89963331733640a896c01fbdaa
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14b226c7c50675048cb0c2eecd73ceca347cdd605108af0f0b768a50dd8cc465
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78120afa70a3ba8c9d1ae5147f81ce5b27ba5d87edfb5db259f9ec8b30581096
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da69f9d171f80af167aa76fd30082a9eebee7945161b89c9bab74def273940dd
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d4cb7412ebe98a1ee942e05fd6ca6b203ab00227bbca66de73d4314b59917f0
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:085472deac36cb0c83c59b542e27b61ca618f1675792d2c27ea49ce2c31f1d05
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6720f03e4311ee6116ffb1d26a365add8ca6cf2939801f7634c94900f58c7104
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:533e2975ff9b99c5d981cb5747deaa054880a68f095277bfb443e24d7a13945c
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -645,3 +645,162 @@
645
  {"current_steps": 645, "total_steps": 805, "loss": 1.5557, "lr": 9.259279090167994e-06, "epoch": 3.996908809891808, "percentage": 80.12, "elapsed_time": "9:26:18", "remaining_time": "2:20:28"}
646
  {"current_steps": 646, "total_steps": 805, "loss": 0.87, "lr": 9.148514734018917e-06, "epoch": 4.006182380216384, "percentage": 80.25, "elapsed_time": "9:28:32", "remaining_time": "2:19:56"}
647
  {"current_steps": 647, "total_steps": 805, "loss": 0.8649, "lr": 9.038331273364869e-06, "epoch": 4.012364760432766, "percentage": 80.37, "elapsed_time": "9:29:24", "remaining_time": "2:19:03"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
645
  {"current_steps": 645, "total_steps": 805, "loss": 1.5557, "lr": 9.259279090167994e-06, "epoch": 3.996908809891808, "percentage": 80.12, "elapsed_time": "9:26:18", "remaining_time": "2:20:28"}
646
  {"current_steps": 646, "total_steps": 805, "loss": 0.87, "lr": 9.148514734018917e-06, "epoch": 4.006182380216384, "percentage": 80.25, "elapsed_time": "9:28:32", "remaining_time": "2:19:56"}
647
  {"current_steps": 647, "total_steps": 805, "loss": 0.8649, "lr": 9.038331273364869e-06, "epoch": 4.012364760432766, "percentage": 80.37, "elapsed_time": "9:29:24", "remaining_time": "2:19:03"}
648
+ {"current_steps": 648, "total_steps": 805, "loss": 0.8577, "lr": 8.928730782824755e-06, "epoch": 4.01854714064915, "percentage": 80.5, "elapsed_time": "9:30:15", "remaining_time": "2:18:09"}
649
+ {"current_steps": 649, "total_steps": 805, "loss": 0.8571, "lr": 8.819715326040965e-06, "epoch": 4.024729520865534, "percentage": 80.62, "elapsed_time": "9:31:06", "remaining_time": "2:17:16"}
650
+ {"current_steps": 650, "total_steps": 805, "loss": 0.8609, "lr": 8.711286955640332e-06, "epoch": 4.030911901081916, "percentage": 80.75, "elapsed_time": "9:31:57", "remaining_time": "2:16:23"}
651
+ {"current_steps": 651, "total_steps": 805, "loss": 0.8566, "lr": 8.603447713195634e-06, "epoch": 4.0370942812983, "percentage": 80.87, "elapsed_time": "9:32:49", "remaining_time": "2:15:30"}
652
+ {"current_steps": 652, "total_steps": 805, "loss": 0.8608, "lr": 8.496199629187072e-06, "epoch": 4.043276661514684, "percentage": 80.99, "elapsed_time": "9:33:40", "remaining_time": "2:14:37"}
653
+ {"current_steps": 653, "total_steps": 805, "loss": 0.8675, "lr": 8.389544722964076e-06, "epoch": 4.049459041731066, "percentage": 81.12, "elapsed_time": "9:34:31", "remaining_time": "2:13:44"}
654
+ {"current_steps": 654, "total_steps": 805, "loss": 0.8689, "lr": 8.283485002707233e-06, "epoch": 4.05564142194745, "percentage": 81.24, "elapsed_time": "9:35:22", "remaining_time": "2:12:50"}
655
+ {"current_steps": 655, "total_steps": 805, "loss": 0.853, "lr": 8.178022465390549e-06, "epoch": 4.061823802163833, "percentage": 81.37, "elapsed_time": "9:36:14", "remaining_time": "2:11:57"}
656
+ {"current_steps": 656, "total_steps": 805, "loss": 0.8645, "lr": 8.073159096743799e-06, "epoch": 4.068006182380216, "percentage": 81.49, "elapsed_time": "9:37:09", "remaining_time": "2:11:05"}
657
+ {"current_steps": 657, "total_steps": 805, "loss": 0.8517, "lr": 7.968896871215147e-06, "epoch": 4.0741885625966, "percentage": 81.61, "elapsed_time": "9:38:15", "remaining_time": "2:10:15"}
658
+ {"current_steps": 658, "total_steps": 805, "loss": 0.858, "lr": 7.865237751933965e-06, "epoch": 4.080370942812983, "percentage": 81.74, "elapsed_time": "9:39:10", "remaining_time": "2:09:23"}
659
+ {"current_steps": 659, "total_steps": 805, "loss": 0.8552, "lr": 7.762183690673887e-06, "epoch": 4.086553323029366, "percentage": 81.86, "elapsed_time": "9:40:01", "remaining_time": "2:08:30"}
660
+ {"current_steps": 660, "total_steps": 805, "loss": 0.8559, "lr": 7.659736627816064e-06, "epoch": 4.09273570324575, "percentage": 81.99, "elapsed_time": "9:40:52", "remaining_time": "2:07:37"}
661
+ {"current_steps": 661, "total_steps": 805, "loss": 0.8527, "lr": 7.557898492312561e-06, "epoch": 4.098918083462133, "percentage": 82.11, "elapsed_time": "9:41:44", "remaining_time": "2:06:43"}
662
+ {"current_steps": 662, "total_steps": 805, "loss": 0.8551, "lr": 7.456671201650145e-06, "epoch": 4.105100463678516, "percentage": 82.24, "elapsed_time": "9:42:35", "remaining_time": "2:05:50"}
663
+ {"current_steps": 663, "total_steps": 805, "loss": 0.8557, "lr": 7.356056661814106e-06, "epoch": 4.1112828438949, "percentage": 82.36, "elapsed_time": "9:43:26", "remaining_time": "2:04:57"}
664
+ {"current_steps": 664, "total_steps": 805, "loss": 0.8539, "lr": 7.256056767252402e-06, "epoch": 4.117465224111283, "percentage": 82.48, "elapsed_time": "9:44:17", "remaining_time": "2:04:04"}
665
+ {"current_steps": 665, "total_steps": 805, "loss": 0.853, "lr": 7.156673400839933e-06, "epoch": 4.123647604327666, "percentage": 82.61, "elapsed_time": "9:45:09", "remaining_time": "2:03:11"}
666
+ {"current_steps": 666, "total_steps": 805, "loss": 0.8464, "lr": 7.057908433843205e-06, "epoch": 4.12982998454405, "percentage": 82.73, "elapsed_time": "9:46:00", "remaining_time": "2:02:18"}
667
+ {"current_steps": 667, "total_steps": 805, "loss": 0.86, "lr": 6.959763725884956e-06, "epoch": 4.1360123647604325, "percentage": 82.86, "elapsed_time": "9:46:51", "remaining_time": "2:01:25"}
668
+ {"current_steps": 668, "total_steps": 805, "loss": 0.8559, "lr": 6.862241124909262e-06, "epoch": 4.142194744976816, "percentage": 82.98, "elapsed_time": "9:47:42", "remaining_time": "2:00:32"}
669
+ {"current_steps": 669, "total_steps": 805, "loss": 0.8547, "lr": 6.765342467146632e-06, "epoch": 4.1483771251932, "percentage": 83.11, "elapsed_time": "9:48:33", "remaining_time": "1:59:38"}
670
+ {"current_steps": 670, "total_steps": 805, "loss": 0.8563, "lr": 6.66906957707957e-06, "epoch": 4.1545595054095825, "percentage": 83.23, "elapsed_time": "9:49:24", "remaining_time": "1:58:45"}
671
+ {"current_steps": 671, "total_steps": 805, "loss": 0.8536, "lr": 6.5734242674080705e-06, "epoch": 4.160741885625966, "percentage": 83.35, "elapsed_time": "9:50:20", "remaining_time": "1:57:53"}
672
+ {"current_steps": 672, "total_steps": 805, "loss": 0.8624, "lr": 6.478408339015603e-06, "epoch": 4.166924265842349, "percentage": 83.48, "elapsed_time": "9:51:27", "remaining_time": "1:57:03"}
673
+ {"current_steps": 673, "total_steps": 805, "loss": 0.8588, "lr": 6.384023580935155e-06, "epoch": 4.1731066460587325, "percentage": 83.6, "elapsed_time": "9:52:21", "remaining_time": "1:56:11"}
674
+ {"current_steps": 674, "total_steps": 805, "loss": 0.8497, "lr": 6.290271770315541e-06, "epoch": 4.179289026275116, "percentage": 83.73, "elapsed_time": "9:53:12", "remaining_time": "1:55:17"}
675
+ {"current_steps": 675, "total_steps": 805, "loss": 0.859, "lr": 6.1971546723879864e-06, "epoch": 4.185471406491499, "percentage": 83.85, "elapsed_time": "9:54:04", "remaining_time": "1:54:24"}
676
+ {"current_steps": 676, "total_steps": 805, "loss": 0.8649, "lr": 6.104674040432797e-06, "epoch": 4.1916537867078825, "percentage": 83.98, "elapsed_time": "9:54:55", "remaining_time": "1:53:31"}
677
+ {"current_steps": 677, "total_steps": 805, "loss": 0.8536, "lr": 6.012831615746484e-06, "epoch": 4.197836166924266, "percentage": 84.1, "elapsed_time": "9:55:46", "remaining_time": "1:52:38"}
678
+ {"current_steps": 678, "total_steps": 805, "loss": 0.8633, "lr": 5.9216291276088435e-06, "epoch": 4.204018547140649, "percentage": 84.22, "elapsed_time": "9:56:37", "remaining_time": "1:51:45"}
679
+ {"current_steps": 679, "total_steps": 805, "loss": 0.863, "lr": 5.831068293250481e-06, "epoch": 4.210200927357032, "percentage": 84.35, "elapsed_time": "9:57:29", "remaining_time": "1:50:52"}
680
+ {"current_steps": 680, "total_steps": 805, "loss": 0.8623, "lr": 5.74115081782042e-06, "epoch": 4.216383307573416, "percentage": 84.47, "elapsed_time": "9:58:20", "remaining_time": "1:49:59"}
681
+ {"current_steps": 681, "total_steps": 805, "loss": 0.8582, "lr": 5.651878394354091e-06, "epoch": 4.222565687789799, "percentage": 84.6, "elapsed_time": "9:59:11", "remaining_time": "1:49:06"}
682
+ {"current_steps": 682, "total_steps": 805, "loss": 0.8565, "lr": 5.563252703741322e-06, "epoch": 4.228748068006182, "percentage": 84.72, "elapsed_time": "10:00:03", "remaining_time": "1:48:13"}
683
+ {"current_steps": 683, "total_steps": 805, "loss": 0.8553, "lr": 5.475275414694787e-06, "epoch": 4.234930448222566, "percentage": 84.84, "elapsed_time": "10:00:54", "remaining_time": "1:47:20"}
684
+ {"current_steps": 684, "total_steps": 805, "loss": 0.8586, "lr": 5.387948183718563e-06, "epoch": 4.241112828438949, "percentage": 84.97, "elapsed_time": "10:01:45", "remaining_time": "1:46:27"}
685
+ {"current_steps": 685, "total_steps": 805, "loss": 0.8639, "lr": 5.30127265507693e-06, "epoch": 4.247295208655332, "percentage": 85.09, "elapsed_time": "10:02:36", "remaining_time": "1:45:33"}
686
+ {"current_steps": 686, "total_steps": 805, "loss": 0.845, "lr": 5.215250460763397e-06, "epoch": 4.253477588871716, "percentage": 85.22, "elapsed_time": "10:03:32", "remaining_time": "1:44:41"}
687
+ {"current_steps": 687, "total_steps": 805, "loss": 0.8509, "lr": 5.129883220470007e-06, "epoch": 4.259659969088099, "percentage": 85.34, "elapsed_time": "10:04:38", "remaining_time": "1:43:51"}
688
+ {"current_steps": 688, "total_steps": 805, "loss": 0.8522, "lr": 5.045172541556831e-06, "epoch": 4.265842349304482, "percentage": 85.47, "elapsed_time": "10:05:31", "remaining_time": "1:42:58"}
689
+ {"current_steps": 689, "total_steps": 805, "loss": 0.8647, "lr": 4.961120019021684e-06, "epoch": 4.272024729520865, "percentage": 85.59, "elapsed_time": "10:06:22", "remaining_time": "1:42:05"}
690
+ {"current_steps": 690, "total_steps": 805, "loss": 0.8586, "lr": 4.877727235470113e-06, "epoch": 4.278207109737249, "percentage": 85.71, "elapsed_time": "10:07:13", "remaining_time": "1:41:12"}
691
+ {"current_steps": 691, "total_steps": 805, "loss": 0.8606, "lr": 4.794995761085593e-06, "epoch": 4.284389489953632, "percentage": 85.84, "elapsed_time": "10:08:04", "remaining_time": "1:40:19"}
692
+ {"current_steps": 692, "total_steps": 805, "loss": 0.8561, "lr": 4.712927153599967e-06, "epoch": 4.290571870170015, "percentage": 85.96, "elapsed_time": "10:08:55", "remaining_time": "1:39:26"}
693
+ {"current_steps": 693, "total_steps": 805, "loss": 0.8526, "lr": 4.631522958264083e-06, "epoch": 4.296754250386399, "percentage": 86.09, "elapsed_time": "10:09:47", "remaining_time": "1:38:33"}
694
+ {"current_steps": 694, "total_steps": 805, "loss": 0.8556, "lr": 4.550784707818756e-06, "epoch": 4.302936630602782, "percentage": 86.21, "elapsed_time": "10:10:38", "remaining_time": "1:37:40"}
695
+ {"current_steps": 695, "total_steps": 805, "loss": 0.8616, "lr": 4.47071392246587e-06, "epoch": 4.309119010819165, "percentage": 86.34, "elapsed_time": "10:11:29", "remaining_time": "1:36:46"}
696
+ {"current_steps": 696, "total_steps": 805, "loss": 0.8595, "lr": 4.3913121098397675e-06, "epoch": 4.315301391035549, "percentage": 86.46, "elapsed_time": "10:12:20", "remaining_time": "1:35:53"}
697
+ {"current_steps": 697, "total_steps": 805, "loss": 0.8472, "lr": 4.312580764978825e-06, "epoch": 4.321483771251932, "percentage": 86.58, "elapsed_time": "10:13:12", "remaining_time": "1:35:00"}
698
+ {"current_steps": 698, "total_steps": 805, "loss": 0.8652, "lr": 4.234521370297398e-06, "epoch": 4.327666151468315, "percentage": 86.71, "elapsed_time": "10:14:03", "remaining_time": "1:34:07"}
699
+ {"current_steps": 699, "total_steps": 805, "loss": 0.862, "lr": 4.157135395557786e-06, "epoch": 4.333848531684699, "percentage": 86.83, "elapsed_time": "10:14:54", "remaining_time": "1:33:14"}
700
+ {"current_steps": 700, "total_steps": 805, "loss": 0.8626, "lr": 4.080424297842656e-06, "epoch": 4.340030911901082, "percentage": 86.96, "elapsed_time": "10:15:45", "remaining_time": "1:32:21"}
701
+ {"current_steps": 701, "total_steps": 805, "loss": 0.8599, "lr": 4.004389521527543e-06, "epoch": 4.346213292117465, "percentage": 87.08, "elapsed_time": "10:16:41", "remaining_time": "1:31:29"}
702
+ {"current_steps": 702, "total_steps": 805, "loss": 0.8643, "lr": 3.929032498253729e-06, "epoch": 4.352395672333849, "percentage": 87.2, "elapsed_time": "10:17:48", "remaining_time": "1:30:38"}
703
+ {"current_steps": 703, "total_steps": 805, "loss": 0.8684, "lr": 3.8543546469011904e-06, "epoch": 4.358578052550232, "percentage": 87.33, "elapsed_time": "10:18:41", "remaining_time": "1:29:46"}
704
+ {"current_steps": 704, "total_steps": 805, "loss": 0.8554, "lr": 3.780357373561958e-06, "epoch": 4.364760432766615, "percentage": 87.45, "elapsed_time": "10:19:32", "remaining_time": "1:28:53"}
705
+ {"current_steps": 705, "total_steps": 805, "loss": 0.8649, "lr": 3.7070420715136133e-06, "epoch": 4.370942812982999, "percentage": 87.58, "elapsed_time": "10:20:24", "remaining_time": "1:28:00"}
706
+ {"current_steps": 706, "total_steps": 805, "loss": 0.8549, "lr": 3.634410121193059e-06, "epoch": 4.377125193199381, "percentage": 87.7, "elapsed_time": "10:21:15", "remaining_time": "1:27:07"}
707
+ {"current_steps": 707, "total_steps": 805, "loss": 0.848, "lr": 3.562462890170526e-06, "epoch": 4.383307573415765, "percentage": 87.83, "elapsed_time": "10:22:06", "remaining_time": "1:26:13"}
708
+ {"current_steps": 708, "total_steps": 805, "loss": 0.8634, "lr": 3.4912017331238057e-06, "epoch": 4.3894899536321486, "percentage": 87.95, "elapsed_time": "10:22:57", "remaining_time": "1:25:20"}
709
+ {"current_steps": 709, "total_steps": 805, "loss": 0.8595, "lr": 3.420627991812788e-06, "epoch": 4.395672333848531, "percentage": 88.07, "elapsed_time": "10:23:48", "remaining_time": "1:24:27"}
710
+ {"current_steps": 710, "total_steps": 805, "loss": 0.8526, "lr": 3.3507429950541527e-06, "epoch": 4.401854714064915, "percentage": 88.2, "elapsed_time": "10:24:40", "remaining_time": "1:23:34"}
711
+ {"current_steps": 711, "total_steps": 805, "loss": 0.8583, "lr": 3.281548058696373e-06, "epoch": 4.4080370942812985, "percentage": 88.32, "elapsed_time": "10:25:31", "remaining_time": "1:22:41"}
712
+ {"current_steps": 712, "total_steps": 805, "loss": 0.8671, "lr": 3.2130444855949406e-06, "epoch": 4.414219474497681, "percentage": 88.45, "elapsed_time": "10:26:22", "remaining_time": "1:21:48"}
713
+ {"current_steps": 713, "total_steps": 805, "loss": 0.8616, "lr": 3.145233565587824e-06, "epoch": 4.420401854714065, "percentage": 88.57, "elapsed_time": "10:27:14", "remaining_time": "1:20:56"}
714
+ {"current_steps": 714, "total_steps": 805, "loss": 0.8566, "lr": 3.078116575471173e-06, "epoch": 4.4265842349304485, "percentage": 88.7, "elapsed_time": "10:28:05", "remaining_time": "1:20:03"}
715
+ {"current_steps": 715, "total_steps": 805, "loss": 0.8581, "lr": 3.0116947789753028e-06, "epoch": 4.432766615146831, "percentage": 88.82, "elapsed_time": "10:28:57", "remaining_time": "1:19:10"}
716
+ {"current_steps": 716, "total_steps": 805, "loss": 0.8646, "lr": 2.9459694267408977e-06, "epoch": 4.438948995363215, "percentage": 88.94, "elapsed_time": "10:29:53", "remaining_time": "1:18:17"}
717
+ {"current_steps": 717, "total_steps": 805, "loss": 0.8636, "lr": 2.8809417562954435e-06, "epoch": 4.4451313755795985, "percentage": 89.07, "elapsed_time": "10:30:59", "remaining_time": "1:17:26"}
718
+ {"current_steps": 718, "total_steps": 805, "loss": 0.8474, "lr": 2.8166129920299278e-06, "epoch": 4.451313755795981, "percentage": 89.19, "elapsed_time": "10:31:52", "remaining_time": "1:16:33"}
719
+ {"current_steps": 719, "total_steps": 805, "loss": 0.848, "lr": 2.752984345175809e-06, "epoch": 4.457496136012365, "percentage": 89.32, "elapsed_time": "10:32:43", "remaining_time": "1:15:40"}
720
+ {"current_steps": 720, "total_steps": 805, "loss": 0.8599, "lr": 2.690057013782195e-06, "epoch": 4.4636785162287484, "percentage": 89.44, "elapsed_time": "10:33:34", "remaining_time": "1:14:47"}
721
+ {"current_steps": 721, "total_steps": 805, "loss": 0.8585, "lr": 2.6278321826932818e-06, "epoch": 4.469860896445131, "percentage": 89.57, "elapsed_time": "10:34:26", "remaining_time": "1:13:54"}
722
+ {"current_steps": 722, "total_steps": 805, "loss": 0.8704, "lr": 2.566311023526056e-06, "epoch": 4.476043276661515, "percentage": 89.69, "elapsed_time": "10:35:17", "remaining_time": "1:13:01"}
723
+ {"current_steps": 723, "total_steps": 805, "loss": 0.8619, "lr": 2.5054946946482208e-06, "epoch": 4.4822256568778975, "percentage": 89.81, "elapsed_time": "10:36:08", "remaining_time": "1:12:08"}
724
+ {"current_steps": 724, "total_steps": 805, "loss": 0.8498, "lr": 2.445384341156389e-06, "epoch": 4.488408037094281, "percentage": 89.94, "elapsed_time": "10:36:59", "remaining_time": "1:11:15"}
725
+ {"current_steps": 725, "total_steps": 805, "loss": 0.8567, "lr": 2.3859810948545414e-06, "epoch": 4.494590417310665, "percentage": 90.06, "elapsed_time": "10:37:51", "remaining_time": "1:10:23"}
726
+ {"current_steps": 726, "total_steps": 805, "loss": 0.8556, "lr": 2.3272860742326798e-06, "epoch": 4.500772797527048, "percentage": 90.19, "elapsed_time": "10:38:42", "remaining_time": "1:09:30"}
727
+ {"current_steps": 727, "total_steps": 805, "loss": 0.8533, "lr": 2.269300384445812e-06, "epoch": 4.506955177743431, "percentage": 90.31, "elapsed_time": "10:39:33", "remaining_time": "1:08:37"}
728
+ {"current_steps": 728, "total_steps": 805, "loss": 0.856, "lr": 2.2120251172931082e-06, "epoch": 4.513137557959815, "percentage": 90.43, "elapsed_time": "10:40:24", "remaining_time": "1:07:44"}
729
+ {"current_steps": 729, "total_steps": 805, "loss": 0.8583, "lr": 2.15546135119733e-06, "epoch": 4.5193199381761975, "percentage": 90.56, "elapsed_time": "10:41:15", "remaining_time": "1:06:51"}
730
+ {"current_steps": 730, "total_steps": 805, "loss": 0.8522, "lr": 2.0996101511846056e-06, "epoch": 4.525502318392581, "percentage": 90.68, "elapsed_time": "10:42:07", "remaining_time": "1:05:58"}
731
+ {"current_steps": 731, "total_steps": 805, "loss": 0.8537, "lr": 2.0444725688642685e-06, "epoch": 4.531684698608965, "percentage": 90.81, "elapsed_time": "10:43:03", "remaining_time": "1:05:05"}
732
+ {"current_steps": 732, "total_steps": 805, "loss": 0.8552, "lr": 1.9900496424091375e-06, "epoch": 4.5378670788253475, "percentage": 90.93, "elapsed_time": "10:44:10", "remaining_time": "1:04:14"}
733
+ {"current_steps": 733, "total_steps": 805, "loss": 0.8562, "lr": 1.9363423965359195e-06, "epoch": 4.544049459041731, "percentage": 91.06, "elapsed_time": "10:45:03", "remaining_time": "1:03:21"}
734
+ {"current_steps": 734, "total_steps": 805, "loss": 0.8506, "lr": 1.883351842485972e-06, "epoch": 4.550231839258115, "percentage": 91.18, "elapsed_time": "10:45:55", "remaining_time": "1:02:28"}
735
+ {"current_steps": 735, "total_steps": 805, "loss": 0.8589, "lr": 1.8310789780061887e-06, "epoch": 4.556414219474497, "percentage": 91.3, "elapsed_time": "10:46:46", "remaining_time": "1:01:35"}
736
+ {"current_steps": 736, "total_steps": 805, "loss": 0.8568, "lr": 1.7795247873302735e-06, "epoch": 4.562596599690881, "percentage": 91.43, "elapsed_time": "10:47:37", "remaining_time": "1:00:42"}
737
+ {"current_steps": 737, "total_steps": 805, "loss": 0.8549, "lr": 1.728690241160189e-06, "epoch": 4.568778979907265, "percentage": 91.55, "elapsed_time": "10:48:29", "remaining_time": "0:59:49"}
738
+ {"current_steps": 738, "total_steps": 805, "loss": 0.8616, "lr": 1.6785762966478715e-06, "epoch": 4.574961360123647, "percentage": 91.68, "elapsed_time": "10:49:20", "remaining_time": "0:58:57"}
739
+ {"current_steps": 739, "total_steps": 805, "loss": 0.85, "lr": 1.6291838973772068e-06, "epoch": 4.581143740340031, "percentage": 91.8, "elapsed_time": "10:50:11", "remaining_time": "0:58:04"}
740
+ {"current_steps": 740, "total_steps": 805, "loss": 0.8542, "lr": 1.5805139733462827e-06, "epoch": 4.587326120556414, "percentage": 91.93, "elapsed_time": "10:51:03", "remaining_time": "0:57:11"}
741
+ {"current_steps": 741, "total_steps": 805, "loss": 0.863, "lr": 1.532567440949868e-06, "epoch": 4.593508500772797, "percentage": 92.05, "elapsed_time": "10:51:54", "remaining_time": "0:56:18"}
742
+ {"current_steps": 742, "total_steps": 805, "loss": 0.8582, "lr": 1.4853452029621518e-06, "epoch": 4.599690880989181, "percentage": 92.17, "elapsed_time": "10:52:45", "remaining_time": "0:55:25"}
743
+ {"current_steps": 743, "total_steps": 805, "loss": 0.8666, "lr": 1.4388481485197558e-06, "epoch": 4.605873261205565, "percentage": 92.3, "elapsed_time": "10:53:37", "remaining_time": "0:54:32"}
744
+ {"current_steps": 744, "total_steps": 805, "loss": 0.8543, "lr": 1.3930771531049847e-06, "epoch": 4.612055641421947, "percentage": 92.42, "elapsed_time": "10:54:28", "remaining_time": "0:53:39"}
745
+ {"current_steps": 745, "total_steps": 805, "loss": 0.8605, "lr": 1.3480330785293494e-06, "epoch": 4.618238021638331, "percentage": 92.55, "elapsed_time": "10:55:19", "remaining_time": "0:52:46"}
746
+ {"current_steps": 746, "total_steps": 805, "loss": 0.8602, "lr": 1.3037167729173273e-06, "epoch": 4.624420401854714, "percentage": 92.67, "elapsed_time": "10:56:16", "remaining_time": "0:51:54"}
747
+ {"current_steps": 747, "total_steps": 805, "loss": 0.8612, "lr": 1.2601290706904102e-06, "epoch": 4.630602782071097, "percentage": 92.8, "elapsed_time": "10:57:22", "remaining_time": "0:51:02"}
748
+ {"current_steps": 748, "total_steps": 805, "loss": 0.8692, "lr": 1.2172707925513838e-06, "epoch": 4.636785162287481, "percentage": 92.92, "elapsed_time": "10:58:16", "remaining_time": "0:50:09"}
749
+ {"current_steps": 749, "total_steps": 805, "loss": 0.8739, "lr": 1.1751427454688735e-06, "epoch": 4.642967542503864, "percentage": 93.04, "elapsed_time": "10:59:07", "remaining_time": "0:49:16"}
750
+ {"current_steps": 750, "total_steps": 805, "loss": 0.8507, "lr": 1.1337457226621518e-06, "epoch": 4.649149922720247, "percentage": 93.17, "elapsed_time": "10:59:59", "remaining_time": "0:48:23"}
751
+ {"current_steps": 751, "total_steps": 805, "loss": 0.8688, "lr": 1.0930805035862125e-06, "epoch": 4.655332302936631, "percentage": 93.29, "elapsed_time": "11:00:50", "remaining_time": "0:47:31"}
752
+ {"current_steps": 752, "total_steps": 805, "loss": 0.8576, "lr": 1.0531478539170713e-06, "epoch": 4.661514683153014, "percentage": 93.42, "elapsed_time": "11:01:41", "remaining_time": "0:46:38"}
753
+ {"current_steps": 753, "total_steps": 805, "loss": 0.8586, "lr": 1.0139485255373826e-06, "epoch": 4.667697063369397, "percentage": 93.54, "elapsed_time": "11:02:33", "remaining_time": "0:45:45"}
754
+ {"current_steps": 754, "total_steps": 805, "loss": 0.8732, "lr": 9.75483256522236e-07, "epoch": 4.673879443585781, "percentage": 93.66, "elapsed_time": "11:03:24", "remaining_time": "0:44:52"}
755
+ {"current_steps": 755, "total_steps": 805, "loss": 0.8501, "lr": 9.377527711253198e-07, "epoch": 4.680061823802164, "percentage": 93.79, "elapsed_time": "11:04:15", "remaining_time": "0:43:59"}
756
+ {"current_steps": 756, "total_steps": 805, "loss": 0.8606, "lr": 9.007577797652245e-07, "epoch": 4.686244204018547, "percentage": 93.91, "elapsed_time": "11:05:07", "remaining_time": "0:43:06"}
757
+ {"current_steps": 757, "total_steps": 805, "loss": 0.8687, "lr": 8.644989790121072e-07, "epoch": 4.69242658423493, "percentage": 94.04, "elapsed_time": "11:05:58", "remaining_time": "0:42:13"}
758
+ {"current_steps": 758, "total_steps": 805, "loss": 0.8623, "lr": 8.289770515745599e-07, "epoch": 4.698608964451314, "percentage": 94.16, "elapsed_time": "11:06:49", "remaining_time": "0:41:20"}
759
+ {"current_steps": 759, "total_steps": 805, "loss": 0.8663, "lr": 7.941926662867528e-07, "epoch": 4.704791344667697, "percentage": 94.29, "elapsed_time": "11:07:41", "remaining_time": "0:40:27"}
760
+ {"current_steps": 760, "total_steps": 805, "loss": 0.8533, "lr": 7.60146478095849e-07, "epoch": 4.710973724884081, "percentage": 94.41, "elapsed_time": "11:08:32", "remaining_time": "0:39:35"}
761
+ {"current_steps": 761, "total_steps": 805, "loss": 0.8545, "lr": 7.268391280496589e-07, "epoch": 4.717156105100464, "percentage": 94.53, "elapsed_time": "11:09:28", "remaining_time": "0:38:42"}
762
+ {"current_steps": 762, "total_steps": 805, "loss": 0.8593, "lr": 6.94271243284601e-07, "epoch": 4.723338485316847, "percentage": 94.66, "elapsed_time": "11:10:35", "remaining_time": "0:37:50"}
763
+ {"current_steps": 763, "total_steps": 805, "loss": 0.8637, "lr": 6.624434370138532e-07, "epoch": 4.72952086553323, "percentage": 94.78, "elapsed_time": "11:11:28", "remaining_time": "0:36:57"}
764
+ {"current_steps": 764, "total_steps": 805, "loss": 0.8527, "lr": 6.313563085158425e-07, "epoch": 4.7357032457496135, "percentage": 94.91, "elapsed_time": "11:12:19", "remaining_time": "0:36:04"}
765
+ {"current_steps": 765, "total_steps": 805, "loss": 0.8512, "lr": 6.010104431229202e-07, "epoch": 4.741885625965997, "percentage": 95.03, "elapsed_time": "11:13:11", "remaining_time": "0:35:11"}
766
+ {"current_steps": 766, "total_steps": 805, "loss": 0.8535, "lr": 5.714064122103935e-07, "epoch": 4.74806800618238, "percentage": 95.16, "elapsed_time": "11:14:02", "remaining_time": "0:34:19"}
767
+ {"current_steps": 767, "total_steps": 805, "loss": 0.8563, "lr": 5.425447731857248e-07, "epoch": 4.7542503863987635, "percentage": 95.28, "elapsed_time": "11:14:53", "remaining_time": "0:33:26"}
768
+ {"current_steps": 768, "total_steps": 805, "loss": 0.8558, "lr": 5.144260694780512e-07, "epoch": 4.760432766615147, "percentage": 95.4, "elapsed_time": "11:15:44", "remaining_time": "0:32:33"}
769
+ {"current_steps": 769, "total_steps": 805, "loss": 0.8574, "lr": 4.870508305279531e-07, "epoch": 4.76661514683153, "percentage": 95.53, "elapsed_time": "11:16:35", "remaining_time": "0:31:40"}
770
+ {"current_steps": 770, "total_steps": 805, "loss": 0.8678, "lr": 4.604195717774973e-07, "epoch": 4.7727975270479135, "percentage": 95.65, "elapsed_time": "11:17:26", "remaining_time": "0:30:47"}
771
+ {"current_steps": 771, "total_steps": 805, "loss": 0.8652, "lr": 4.3453279466049383e-07, "epoch": 4.778979907264297, "percentage": 95.78, "elapsed_time": "11:18:17", "remaining_time": "0:29:54"}
772
+ {"current_steps": 772, "total_steps": 805, "loss": 0.8489, "lr": 4.0939098659309895e-07, "epoch": 4.78516228748068, "percentage": 95.9, "elapsed_time": "11:19:09", "remaining_time": "0:29:01"}
773
+ {"current_steps": 773, "total_steps": 805, "loss": 0.87, "lr": 3.849946209646138e-07, "epoch": 4.7913446676970635, "percentage": 96.02, "elapsed_time": "11:20:00", "remaining_time": "0:28:09"}
774
+ {"current_steps": 774, "total_steps": 805, "loss": 0.861, "lr": 3.6134415712857587e-07, "epoch": 4.797527047913446, "percentage": 96.15, "elapsed_time": "11:20:51", "remaining_time": "0:27:16"}
775
+ {"current_steps": 775, "total_steps": 805, "loss": 0.8506, "lr": 3.384400403941124e-07, "epoch": 4.80370942812983, "percentage": 96.27, "elapsed_time": "11:21:43", "remaining_time": "0:26:23"}
776
+ {"current_steps": 776, "total_steps": 805, "loss": 0.8498, "lr": 3.1628270201754743e-07, "epoch": 4.809891808346213, "percentage": 96.4, "elapsed_time": "11:22:40", "remaining_time": "0:25:30"}
777
+ {"current_steps": 777, "total_steps": 805, "loss": 0.8537, "lr": 2.948725591942925e-07, "epoch": 4.816074188562597, "percentage": 96.52, "elapsed_time": "11:23:46", "remaining_time": "0:24:38"}
778
+ {"current_steps": 778, "total_steps": 805, "loss": 0.8668, "lr": 2.742100150509819e-07, "epoch": 4.82225656877898, "percentage": 96.65, "elapsed_time": "11:24:39", "remaining_time": "0:23:45"}
779
+ {"current_steps": 779, "total_steps": 805, "loss": 0.8657, "lr": 2.542954586378921e-07, "epoch": 4.828438948995363, "percentage": 96.77, "elapsed_time": "11:25:30", "remaining_time": "0:22:52"}
780
+ {"current_steps": 780, "total_steps": 805, "loss": 0.8631, "lr": 2.351292649216097e-07, "epoch": 4.834621329211746, "percentage": 96.89, "elapsed_time": "11:26:21", "remaining_time": "0:21:59"}
781
+ {"current_steps": 781, "total_steps": 805, "loss": 0.8657, "lr": 2.167117947779751e-07, "epoch": 4.84080370942813, "percentage": 97.02, "elapsed_time": "11:27:13", "remaining_time": "0:21:07"}
782
+ {"current_steps": 782, "total_steps": 805, "loss": 0.8666, "lr": 1.990433949852788e-07, "epoch": 4.846986089644513, "percentage": 97.14, "elapsed_time": "11:28:04", "remaining_time": "0:20:14"}
783
+ {"current_steps": 783, "total_steps": 805, "loss": 0.8635, "lr": 1.821243982177423e-07, "epoch": 4.853168469860896, "percentage": 97.27, "elapsed_time": "11:28:55", "remaining_time": "0:19:21"}
784
+ {"current_steps": 784, "total_steps": 805, "loss": 0.8496, "lr": 1.6595512303925199e-07, "epoch": 4.85935085007728, "percentage": 97.39, "elapsed_time": "11:29:46", "remaining_time": "0:18:28"}
785
+ {"current_steps": 785, "total_steps": 805, "loss": 0.8764, "lr": 1.5053587389735502e-07, "epoch": 4.865533230293663, "percentage": 97.52, "elapsed_time": "11:30:38", "remaining_time": "0:17:35"}
786
+ {"current_steps": 786, "total_steps": 805, "loss": 0.8548, "lr": 1.358669411175395e-07, "epoch": 4.871715610510046, "percentage": 97.64, "elapsed_time": "11:31:29", "remaining_time": "0:16:42"}
787
+ {"current_steps": 787, "total_steps": 805, "loss": 0.8653, "lr": 1.2194860089774995e-07, "epoch": 4.87789799072643, "percentage": 97.76, "elapsed_time": "11:32:20", "remaining_time": "0:15:50"}
788
+ {"current_steps": 788, "total_steps": 805, "loss": 0.8623, "lr": 1.0878111530320478e-07, "epoch": 4.884080370942813, "percentage": 97.89, "elapsed_time": "11:33:11", "remaining_time": "0:14:57"}
789
+ {"current_steps": 789, "total_steps": 805, "loss": 0.8614, "lr": 9.636473226144916e-08, "epoch": 4.890262751159196, "percentage": 98.01, "elapsed_time": "11:34:02", "remaining_time": "0:14:04"}
790
+ {"current_steps": 790, "total_steps": 805, "loss": 0.8647, "lr": 8.469968555769648e-08, "epoch": 4.89644513137558, "percentage": 98.14, "elapsed_time": "11:34:54", "remaining_time": "0:13:11"}
791
+ {"current_steps": 791, "total_steps": 805, "loss": 0.8482, "lr": 7.37861948304186e-08, "epoch": 4.902627511591962, "percentage": 98.26, "elapsed_time": "11:35:51", "remaining_time": "0:12:18"}
792
+ {"current_steps": 792, "total_steps": 805, "loss": 0.851, "lr": 6.362446556720691e-08, "epoch": 4.908809891808346, "percentage": 98.39, "elapsed_time": "11:36:58", "remaining_time": "0:11:26"}
793
+ {"current_steps": 793, "total_steps": 805, "loss": 0.8663, "lr": 5.421468910092209e-08, "epoch": 4.91499227202473, "percentage": 98.51, "elapsed_time": "11:37:50", "remaining_time": "0:10:33"}
794
+ {"current_steps": 794, "total_steps": 805, "loss": 0.8488, "lr": 4.555704260607474e-08, "epoch": 4.921174652241113, "percentage": 98.63, "elapsed_time": "11:38:42", "remaining_time": "0:09:40"}
795
+ {"current_steps": 795, "total_steps": 805, "loss": 0.8606, "lr": 3.765168909548589e-08, "epoch": 4.927357032457496, "percentage": 98.76, "elapsed_time": "11:39:33", "remaining_time": "0:08:47"}
796
+ {"current_steps": 796, "total_steps": 805, "loss": 0.8639, "lr": 3.049877741723606e-08, "epoch": 4.93353941267388, "percentage": 98.88, "elapsed_time": "11:40:24", "remaining_time": "0:07:55"}
797
+ {"current_steps": 797, "total_steps": 805, "loss": 0.8559, "lr": 2.4098442251849762e-08, "epoch": 4.939721792890262, "percentage": 99.01, "elapsed_time": "11:41:15", "remaining_time": "0:07:02"}
798
+ {"current_steps": 798, "total_steps": 805, "loss": 0.8421, "lr": 1.8450804109759745e-08, "epoch": 4.945904173106646, "percentage": 99.13, "elapsed_time": "11:42:07", "remaining_time": "0:06:09"}
799
+ {"current_steps": 799, "total_steps": 805, "loss": 0.8565, "lr": 1.3555969329037688e-08, "epoch": 4.95208655332303, "percentage": 99.25, "elapsed_time": "11:42:58", "remaining_time": "0:05:16"}
800
+ {"current_steps": 800, "total_steps": 805, "loss": 0.8638, "lr": 9.41403007340025e-09, "epoch": 4.958268933539412, "percentage": 99.38, "elapsed_time": "11:43:50", "remaining_time": "0:04:23"}
801
+ {"current_steps": 801, "total_steps": 805, "loss": 0.8553, "lr": 6.025064330463792e-09, "epoch": 4.964451313755796, "percentage": 99.5, "elapsed_time": "11:44:41", "remaining_time": "0:03:31"}
802
+ {"current_steps": 802, "total_steps": 805, "loss": 0.8633, "lr": 3.3891359102877773e-09, "epoch": 4.97063369397218, "percentage": 99.63, "elapsed_time": "11:45:32", "remaining_time": "0:02:38"}
803
+ {"current_steps": 803, "total_steps": 805, "loss": 0.8764, "lr": 1.506294444153511e-09, "epoch": 4.976816074188562, "percentage": 99.75, "elapsed_time": "11:46:24", "remaining_time": "0:01:45"}
804
+ {"current_steps": 804, "total_steps": 805, "loss": 0.8589, "lr": 3.7657538364932467e-10, "epoch": 4.982998454404946, "percentage": 99.88, "elapsed_time": "11:47:15", "remaining_time": "0:00:52"}
805
+ {"current_steps": 805, "total_steps": 805, "loss": 0.8693, "lr": 0.0, "epoch": 4.9891808346213296, "percentage": 100.0, "elapsed_time": "11:48:07", "remaining_time": "0:00:00"}
806
+ {"current_steps": 805, "total_steps": 805, "epoch": 4.9891808346213296, "percentage": 100.0, "elapsed_time": "11:49:37", "remaining_time": "0:00:00"}