Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e9591658ee43e4ffd112d9b68ec8286a91030372dabb5b772026464603ac1cb5
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13a623c1ffada540ad2467af9fbf641579a4bb56e6fc65569926ab28ea7a8be6
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ee3e383047de4040ee0197385e9548480640f76f40b2d0993415c854dd1a6d2
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:636f2050d218444939996c82c8726cf3e8ab3eb9c44598a7221d876c4c853691
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -1028,3 +1028,247 @@
|
|
| 1028 |
{"current_steps": 785, "total_steps": 1215, "loss": 0.2833, "lr": 1.3427372239824478e-05, "epoch": 3.2271325796505654, "percentage": 64.61, "elapsed_time": "5:05:34", "remaining_time": "2:47:23"}
|
| 1029 |
{"current_steps": 786, "total_steps": 1215, "loss": 0.2815, "lr": 1.3373106634813395e-05, "epoch": 3.2312435765673175, "percentage": 64.69, "elapsed_time": "5:05:57", "remaining_time": "2:46:59"}
|
| 1030 |
{"current_steps": 787, "total_steps": 1215, "loss": 0.2737, "lr": 1.3318895777908989e-05, "epoch": 3.23535457348407, "percentage": 64.77, "elapsed_time": "5:06:20", "remaining_time": "2:46:35"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1028 |
{"current_steps": 785, "total_steps": 1215, "loss": 0.2833, "lr": 1.3427372239824478e-05, "epoch": 3.2271325796505654, "percentage": 64.61, "elapsed_time": "5:05:34", "remaining_time": "2:47:23"}
|
| 1029 |
{"current_steps": 786, "total_steps": 1215, "loss": 0.2815, "lr": 1.3373106634813395e-05, "epoch": 3.2312435765673175, "percentage": 64.69, "elapsed_time": "5:05:57", "remaining_time": "2:46:59"}
|
| 1030 |
{"current_steps": 787, "total_steps": 1215, "loss": 0.2737, "lr": 1.3318895777908989e-05, "epoch": 3.23535457348407, "percentage": 64.77, "elapsed_time": "5:06:20", "remaining_time": "2:46:35"}
|
| 1031 |
+
{"current_steps": 788, "total_steps": 1215, "loss": 0.2784, "lr": 1.3264740116974477e-05, "epoch": 3.239465570400822, "percentage": 64.86, "elapsed_time": "5:06:44", "remaining_time": "2:46:12"}
|
| 1032 |
+
{"current_steps": 789, "total_steps": 1215, "loss": 0.2677, "lr": 1.3210640099417071e-05, "epoch": 3.2435765673175747, "percentage": 64.94, "elapsed_time": "5:07:06", "remaining_time": "2:45:49"}
|
| 1033 |
+
{"current_steps": 790, "total_steps": 1215, "loss": 0.2843, "lr": 1.3156596172184291e-05, "epoch": 3.247687564234327, "percentage": 65.02, "elapsed_time": "5:07:30", "remaining_time": "2:45:25"}
|
| 1034 |
+
{"current_steps": 791, "total_steps": 1215, "loss": 0.2783, "lr": 1.3102608781760262e-05, "epoch": 3.2517985611510793, "percentage": 65.1, "elapsed_time": "5:07:53", "remaining_time": "2:45:02"}
|
| 1035 |
+
{"current_steps": 792, "total_steps": 1215, "loss": 0.2764, "lr": 1.3048678374162033e-05, "epoch": 3.2559095580678314, "percentage": 65.19, "elapsed_time": "5:08:16", "remaining_time": "2:44:38"}
|
| 1036 |
+
{"current_steps": 793, "total_steps": 1215, "loss": 0.2783, "lr": 1.2994805394935883e-05, "epoch": 3.2600205549845835, "percentage": 65.27, "elapsed_time": "5:08:39", "remaining_time": "2:44:15"}
|
| 1037 |
+
{"current_steps": 794, "total_steps": 1215, "loss": 0.2818, "lr": 1.2940990289153654e-05, "epoch": 3.264131551901336, "percentage": 65.35, "elapsed_time": "5:09:01", "remaining_time": "2:43:50"}
|
| 1038 |
+
{"current_steps": 795, "total_steps": 1215, "loss": 0.2715, "lr": 1.2887233501409062e-05, "epoch": 3.2682425488180886, "percentage": 65.43, "elapsed_time": "5:09:24", "remaining_time": "2:43:27"}
|
| 1039 |
+
{"current_steps": 796, "total_steps": 1215, "loss": 0.2815, "lr": 1.283353547581403e-05, "epoch": 3.2723535457348407, "percentage": 65.51, "elapsed_time": "5:09:47", "remaining_time": "2:43:04"}
|
| 1040 |
+
{"current_steps": 797, "total_steps": 1215, "loss": 0.2649, "lr": 1.2779896655995012e-05, "epoch": 3.276464542651593, "percentage": 65.6, "elapsed_time": "5:10:11", "remaining_time": "2:42:41"}
|
| 1041 |
+
{"current_steps": 798, "total_steps": 1215, "loss": 0.2857, "lr": 1.2726317485089345e-05, "epoch": 3.2805755395683454, "percentage": 65.68, "elapsed_time": "5:10:34", "remaining_time": "2:42:17"}
|
| 1042 |
+
{"current_steps": 799, "total_steps": 1215, "loss": 0.2744, "lr": 1.2672798405741565e-05, "epoch": 3.2846865364850975, "percentage": 65.76, "elapsed_time": "5:10:58", "remaining_time": "2:41:54"}
|
| 1043 |
+
{"current_steps": 800, "total_steps": 1215, "loss": 0.2714, "lr": 1.261933986009976e-05, "epoch": 3.28879753340185, "percentage": 65.84, "elapsed_time": "5:11:20", "remaining_time": "2:41:30"}
|
| 1044 |
+
{"current_steps": 801, "total_steps": 1215, "loss": 0.2821, "lr": 1.2565942289811926e-05, "epoch": 3.292908530318602, "percentage": 65.93, "elapsed_time": "5:11:43", "remaining_time": "2:41:07"}
|
| 1045 |
+
{"current_steps": 802, "total_steps": 1215, "loss": 0.2684, "lr": 1.2512606136022316e-05, "epoch": 3.2970195272353546, "percentage": 66.01, "elapsed_time": "5:12:08", "remaining_time": "2:40:44"}
|
| 1046 |
+
{"current_steps": 803, "total_steps": 1215, "loss": 0.28, "lr": 1.245933183936778e-05, "epoch": 3.3011305241521067, "percentage": 66.09, "elapsed_time": "5:12:31", "remaining_time": "2:40:20"}
|
| 1047 |
+
{"current_steps": 804, "total_steps": 1215, "loss": 0.2791, "lr": 1.2406119839974137e-05, "epoch": 3.3052415210688593, "percentage": 66.17, "elapsed_time": "5:12:54", "remaining_time": "2:39:57"}
|
| 1048 |
+
{"current_steps": 805, "total_steps": 1215, "loss": 0.282, "lr": 1.2352970577452536e-05, "epoch": 3.3093525179856114, "percentage": 66.26, "elapsed_time": "5:13:17", "remaining_time": "2:39:34"}
|
| 1049 |
+
{"current_steps": 806, "total_steps": 1215, "loss": 0.2705, "lr": 1.2299884490895829e-05, "epoch": 3.313463514902364, "percentage": 66.34, "elapsed_time": "5:13:40", "remaining_time": "2:39:10"}
|
| 1050 |
+
{"current_steps": 807, "total_steps": 1215, "loss": 0.2675, "lr": 1.2246862018874937e-05, "epoch": 3.317574511819116, "percentage": 66.42, "elapsed_time": "5:14:04", "remaining_time": "2:38:47"}
|
| 1051 |
+
{"current_steps": 808, "total_steps": 1215, "loss": 0.2867, "lr": 1.2193903599435229e-05, "epoch": 3.3216855087358685, "percentage": 66.5, "elapsed_time": "5:14:27", "remaining_time": "2:38:23"}
|
| 1052 |
+
{"current_steps": 809, "total_steps": 1215, "loss": 0.263, "lr": 1.2141009670092905e-05, "epoch": 3.3257965056526206, "percentage": 66.58, "elapsed_time": "5:14:50", "remaining_time": "2:38:00"}
|
| 1053 |
+
{"current_steps": 810, "total_steps": 1215, "loss": 0.285, "lr": 1.2088180667831378e-05, "epoch": 3.329907502569373, "percentage": 66.67, "elapsed_time": "5:15:14", "remaining_time": "2:37:37"}
|
| 1054 |
+
{"current_steps": 811, "total_steps": 1215, "loss": 0.2794, "lr": 1.2035417029097669e-05, "epoch": 3.3340184994861253, "percentage": 66.75, "elapsed_time": "5:15:37", "remaining_time": "2:37:13"}
|
| 1055 |
+
{"current_steps": 812, "total_steps": 1215, "loss": 0.2661, "lr": 1.198271918979879e-05, "epoch": 3.338129496402878, "percentage": 66.83, "elapsed_time": "5:16:00", "remaining_time": "2:36:50"}
|
| 1056 |
+
{"current_steps": 813, "total_steps": 1215, "loss": 0.2691, "lr": 1.1930087585298163e-05, "epoch": 3.34224049331963, "percentage": 66.91, "elapsed_time": "5:16:23", "remaining_time": "2:36:26"}
|
| 1057 |
+
{"current_steps": 814, "total_steps": 1215, "loss": 0.2777, "lr": 1.1877522650412002e-05, "epoch": 3.3463514902363825, "percentage": 67.0, "elapsed_time": "5:16:47", "remaining_time": "2:36:03"}
|
| 1058 |
+
{"current_steps": 815, "total_steps": 1215, "loss": 0.2829, "lr": 1.1825024819405728e-05, "epoch": 3.3504624871531345, "percentage": 67.08, "elapsed_time": "5:17:11", "remaining_time": "2:35:40"}
|
| 1059 |
+
{"current_steps": 816, "total_steps": 1215, "loss": 0.2883, "lr": 1.177259452599039e-05, "epoch": 3.354573484069887, "percentage": 67.16, "elapsed_time": "5:17:35", "remaining_time": "2:35:17"}
|
| 1060 |
+
{"current_steps": 817, "total_steps": 1215, "loss": 0.2703, "lr": 1.1720232203319072e-05, "epoch": 3.358684480986639, "percentage": 67.24, "elapsed_time": "5:17:58", "remaining_time": "2:34:54"}
|
| 1061 |
+
{"current_steps": 818, "total_steps": 1215, "loss": 0.2818, "lr": 1.1667938283983318e-05, "epoch": 3.3627954779033917, "percentage": 67.33, "elapsed_time": "5:18:21", "remaining_time": "2:34:30"}
|
| 1062 |
+
{"current_steps": 819, "total_steps": 1215, "loss": 0.2894, "lr": 1.1615713200009555e-05, "epoch": 3.366906474820144, "percentage": 67.41, "elapsed_time": "5:18:44", "remaining_time": "2:34:06"}
|
| 1063 |
+
{"current_steps": 820, "total_steps": 1215, "loss": 0.2765, "lr": 1.1563557382855527e-05, "epoch": 3.3710174717368964, "percentage": 67.49, "elapsed_time": "5:19:07", "remaining_time": "2:33:43"}
|
| 1064 |
+
{"current_steps": 821, "total_steps": 1215, "loss": 0.2783, "lr": 1.1511471263406727e-05, "epoch": 3.3751284686536485, "percentage": 67.57, "elapsed_time": "5:19:31", "remaining_time": "2:33:20"}
|
| 1065 |
+
{"current_steps": 822, "total_steps": 1215, "loss": 0.2826, "lr": 1.1459455271972855e-05, "epoch": 3.379239465570401, "percentage": 67.65, "elapsed_time": "5:19:54", "remaining_time": "2:32:56"}
|
| 1066 |
+
{"current_steps": 823, "total_steps": 1215, "loss": 0.2702, "lr": 1.1407509838284234e-05, "epoch": 3.383350462487153, "percentage": 67.74, "elapsed_time": "5:20:16", "remaining_time": "2:32:32"}
|
| 1067 |
+
{"current_steps": 824, "total_steps": 1215, "loss": 0.2816, "lr": 1.1355635391488273e-05, "epoch": 3.3874614594039056, "percentage": 67.82, "elapsed_time": "5:20:39", "remaining_time": "2:32:09"}
|
| 1068 |
+
{"current_steps": 825, "total_steps": 1215, "loss": 0.2807, "lr": 1.130383236014593e-05, "epoch": 3.3915724563206577, "percentage": 67.9, "elapsed_time": "5:21:01", "remaining_time": "2:31:45"}
|
| 1069 |
+
{"current_steps": 826, "total_steps": 1215, "loss": 0.2812, "lr": 1.1252101172228161e-05, "epoch": 3.3956834532374103, "percentage": 67.98, "elapsed_time": "5:21:26", "remaining_time": "2:31:22"}
|
| 1070 |
+
{"current_steps": 827, "total_steps": 1215, "loss": 0.2781, "lr": 1.1200442255112382e-05, "epoch": 3.3997944501541624, "percentage": 68.07, "elapsed_time": "5:21:49", "remaining_time": "2:30:59"}
|
| 1071 |
+
{"current_steps": 828, "total_steps": 1215, "loss": 0.2793, "lr": 1.1148856035578954e-05, "epoch": 3.4039054470709145, "percentage": 68.15, "elapsed_time": "5:22:12", "remaining_time": "2:30:36"}
|
| 1072 |
+
{"current_steps": 829, "total_steps": 1215, "loss": 0.2826, "lr": 1.1097342939807639e-05, "epoch": 3.408016443987667, "percentage": 68.23, "elapsed_time": "5:22:36", "remaining_time": "2:30:12"}
|
| 1073 |
+
{"current_steps": 830, "total_steps": 1215, "loss": 0.2678, "lr": 1.1045903393374088e-05, "epoch": 3.4121274409044196, "percentage": 68.31, "elapsed_time": "5:22:59", "remaining_time": "2:29:49"}
|
| 1074 |
+
{"current_steps": 831, "total_steps": 1215, "loss": 0.2768, "lr": 1.0994537821246322e-05, "epoch": 3.4162384378211716, "percentage": 68.4, "elapsed_time": "5:23:22", "remaining_time": "2:29:25"}
|
| 1075 |
+
{"current_steps": 832, "total_steps": 1215, "loss": 0.2822, "lr": 1.0943246647781231e-05, "epoch": 3.4203494347379237, "percentage": 68.48, "elapsed_time": "5:23:43", "remaining_time": "2:29:01"}
|
| 1076 |
+
{"current_steps": 833, "total_steps": 1215, "loss": 0.274, "lr": 1.0892030296721053e-05, "epoch": 3.4244604316546763, "percentage": 68.56, "elapsed_time": "5:24:08", "remaining_time": "2:28:38"}
|
| 1077 |
+
{"current_steps": 834, "total_steps": 1215, "loss": 0.2815, "lr": 1.0840889191189881e-05, "epoch": 3.4285714285714284, "percentage": 68.64, "elapsed_time": "5:24:31", "remaining_time": "2:28:15"}
|
| 1078 |
+
{"current_steps": 835, "total_steps": 1215, "loss": 0.265, "lr": 1.0789823753690165e-05, "epoch": 3.432682425488181, "percentage": 68.72, "elapsed_time": "5:24:54", "remaining_time": "2:27:51"}
|
| 1079 |
+
{"current_steps": 836, "total_steps": 1215, "loss": 0.2819, "lr": 1.073883440609923e-05, "epoch": 3.436793422404933, "percentage": 68.81, "elapsed_time": "5:25:16", "remaining_time": "2:27:28"}
|
| 1080 |
+
{"current_steps": 837, "total_steps": 1215, "loss": 0.2743, "lr": 1.0687921569665778e-05, "epoch": 3.4409044193216856, "percentage": 68.89, "elapsed_time": "5:25:40", "remaining_time": "2:27:04"}
|
| 1081 |
+
{"current_steps": 838, "total_steps": 1215, "loss": 0.2757, "lr": 1.0637085665006416e-05, "epoch": 3.4450154162384377, "percentage": 68.97, "elapsed_time": "5:26:03", "remaining_time": "2:26:41"}
|
| 1082 |
+
{"current_steps": 839, "total_steps": 1215, "loss": 0.2867, "lr": 1.058632711210218e-05, "epoch": 3.44912641315519, "percentage": 69.05, "elapsed_time": "5:26:26", "remaining_time": "2:26:17"}
|
| 1083 |
+
{"current_steps": 840, "total_steps": 1215, "loss": 0.2775, "lr": 1.0535646330295064e-05, "epoch": 3.4532374100719423, "percentage": 69.14, "elapsed_time": "5:26:48", "remaining_time": "2:25:53"}
|
| 1084 |
+
{"current_steps": 841, "total_steps": 1215, "loss": 0.2772, "lr": 1.0485043738284543e-05, "epoch": 3.457348406988695, "percentage": 69.22, "elapsed_time": "5:27:11", "remaining_time": "2:25:30"}
|
| 1085 |
+
{"current_steps": 842, "total_steps": 1215, "loss": 0.2883, "lr": 1.0434519754124155e-05, "epoch": 3.461459403905447, "percentage": 69.3, "elapsed_time": "5:27:34", "remaining_time": "2:25:07"}
|
| 1086 |
+
{"current_steps": 843, "total_steps": 1215, "loss": 0.2729, "lr": 1.0384074795217995e-05, "epoch": 3.4655704008221995, "percentage": 69.38, "elapsed_time": "5:27:57", "remaining_time": "2:24:43"}
|
| 1087 |
+
{"current_steps": 844, "total_steps": 1215, "loss": 0.2794, "lr": 1.0333709278317295e-05, "epoch": 3.4696813977389516, "percentage": 69.47, "elapsed_time": "5:28:20", "remaining_time": "2:24:19"}
|
| 1088 |
+
{"current_steps": 845, "total_steps": 1215, "loss": 0.2831, "lr": 1.0283423619516984e-05, "epoch": 3.473792394655704, "percentage": 69.55, "elapsed_time": "5:28:44", "remaining_time": "2:23:56"}
|
| 1089 |
+
{"current_steps": 846, "total_steps": 1215, "loss": 0.2798, "lr": 1.0233218234252233e-05, "epoch": 3.477903391572456, "percentage": 69.63, "elapsed_time": "5:29:07", "remaining_time": "2:23:33"}
|
| 1090 |
+
{"current_steps": 847, "total_steps": 1215, "loss": 0.2834, "lr": 1.0183093537295038e-05, "epoch": 3.4820143884892087, "percentage": 69.71, "elapsed_time": "5:29:30", "remaining_time": "2:23:09"}
|
| 1091 |
+
{"current_steps": 848, "total_steps": 1215, "loss": 0.2815, "lr": 1.0133049942750794e-05, "epoch": 3.486125385405961, "percentage": 69.79, "elapsed_time": "5:29:52", "remaining_time": "2:22:45"}
|
| 1092 |
+
{"current_steps": 849, "total_steps": 1215, "loss": 0.2782, "lr": 1.0083087864054862e-05, "epoch": 3.4902363823227134, "percentage": 69.88, "elapsed_time": "5:30:15", "remaining_time": "2:22:22"}
|
| 1093 |
+
{"current_steps": 850, "total_steps": 1215, "loss": 0.2668, "lr": 1.0033207713969152e-05, "epoch": 3.4943473792394655, "percentage": 69.96, "elapsed_time": "5:30:38", "remaining_time": "2:21:58"}
|
| 1094 |
+
{"current_steps": 851, "total_steps": 1215, "loss": 0.2771, "lr": 9.983409904578732e-06, "epoch": 3.498458376156218, "percentage": 70.04, "elapsed_time": "5:31:00", "remaining_time": "2:21:34"}
|
| 1095 |
+
{"current_steps": 852, "total_steps": 1215, "loss": 0.2769, "lr": 9.93369484728841e-06, "epoch": 3.50256937307297, "percentage": 70.12, "elapsed_time": "5:31:22", "remaining_time": "2:21:10"}
|
| 1096 |
+
{"current_steps": 853, "total_steps": 1215, "loss": 0.2809, "lr": 9.884062952819336e-06, "epoch": 3.5066803699897227, "percentage": 70.21, "elapsed_time": "5:31:45", "remaining_time": "2:20:47"}
|
| 1097 |
+
{"current_steps": 854, "total_steps": 1215, "loss": 0.2826, "lr": 9.834514631205607e-06, "epoch": 3.5107913669064748, "percentage": 70.29, "elapsed_time": "5:32:09", "remaining_time": "2:20:24"}
|
| 1098 |
+
{"current_steps": 855, "total_steps": 1215, "loss": 0.27, "lr": 9.785050291790886e-06, "epoch": 3.5149023638232273, "percentage": 70.37, "elapsed_time": "5:32:33", "remaining_time": "2:20:01"}
|
| 1099 |
+
{"current_steps": 856, "total_steps": 1215, "loss": 0.2759, "lr": 9.735670343225015e-06, "epoch": 3.5190133607399794, "percentage": 70.45, "elapsed_time": "5:32:55", "remaining_time": "2:19:37"}
|
| 1100 |
+
{"current_steps": 857, "total_steps": 1215, "loss": 0.2842, "lr": 9.68637519346064e-06, "epoch": 3.523124357656732, "percentage": 70.53, "elapsed_time": "5:33:18", "remaining_time": "2:19:14"}
|
| 1101 |
+
{"current_steps": 858, "total_steps": 1215, "loss": 0.2677, "lr": 9.637165249749847e-06, "epoch": 3.527235354573484, "percentage": 70.62, "elapsed_time": "5:33:39", "remaining_time": "2:18:49"}
|
| 1102 |
+
{"current_steps": 859, "total_steps": 1215, "loss": 0.2819, "lr": 9.588040918640784e-06, "epoch": 3.531346351490236, "percentage": 70.7, "elapsed_time": "5:34:03", "remaining_time": "2:18:26"}
|
| 1103 |
+
{"current_steps": 860, "total_steps": 1215, "loss": 0.2762, "lr": 9.539002605974315e-06, "epoch": 3.5354573484069887, "percentage": 70.78, "elapsed_time": "5:34:25", "remaining_time": "2:18:02"}
|
| 1104 |
+
{"current_steps": 861, "total_steps": 1215, "loss": 0.2761, "lr": 9.490050716880652e-06, "epoch": 3.539568345323741, "percentage": 70.86, "elapsed_time": "5:34:48", "remaining_time": "2:17:39"}
|
| 1105 |
+
{"current_steps": 862, "total_steps": 1215, "loss": 0.2836, "lr": 9.441185655776044e-06, "epoch": 3.5436793422404933, "percentage": 70.95, "elapsed_time": "5:35:11", "remaining_time": "2:17:15"}
|
| 1106 |
+
{"current_steps": 863, "total_steps": 1215, "loss": 0.2797, "lr": 9.392407826359386e-06, "epoch": 3.5477903391572454, "percentage": 71.03, "elapsed_time": "5:35:34", "remaining_time": "2:16:52"}
|
| 1107 |
+
{"current_steps": 864, "total_steps": 1215, "loss": 0.2805, "lr": 9.343717631608913e-06, "epoch": 3.551901336073998, "percentage": 71.11, "elapsed_time": "5:35:57", "remaining_time": "2:16:28"}
|
| 1108 |
+
{"current_steps": 865, "total_steps": 1215, "loss": 0.2737, "lr": 9.295115473778871e-06, "epoch": 3.5560123329907505, "percentage": 71.19, "elapsed_time": "5:36:19", "remaining_time": "2:16:04"}
|
| 1109 |
+
{"current_steps": 866, "total_steps": 1215, "loss": 0.2775, "lr": 9.246601754396184e-06, "epoch": 3.5601233299075026, "percentage": 71.28, "elapsed_time": "5:36:42", "remaining_time": "2:15:41"}
|
| 1110 |
+
{"current_steps": 867, "total_steps": 1215, "loss": 0.2801, "lr": 9.198176874257147e-06, "epoch": 3.5642343268242547, "percentage": 71.36, "elapsed_time": "5:37:05", "remaining_time": "2:15:18"}
|
| 1111 |
+
{"current_steps": 868, "total_steps": 1215, "loss": 0.2903, "lr": 9.149841233424102e-06, "epoch": 3.568345323741007, "percentage": 71.44, "elapsed_time": "5:37:27", "remaining_time": "2:14:54"}
|
| 1112 |
+
{"current_steps": 869, "total_steps": 1215, "loss": 0.2714, "lr": 9.101595231222142e-06, "epoch": 3.5724563206577598, "percentage": 71.52, "elapsed_time": "5:37:50", "remaining_time": "2:14:30"}
|
| 1113 |
+
{"current_steps": 870, "total_steps": 1215, "loss": 0.2747, "lr": 9.053439266235817e-06, "epoch": 3.576567317574512, "percentage": 71.6, "elapsed_time": "5:38:13", "remaining_time": "2:14:07"}
|
| 1114 |
+
{"current_steps": 871, "total_steps": 1215, "loss": 0.2866, "lr": 9.005373736305827e-06, "epoch": 3.580678314491264, "percentage": 71.69, "elapsed_time": "5:38:37", "remaining_time": "2:13:44"}
|
| 1115 |
+
{"current_steps": 872, "total_steps": 1215, "loss": 0.2768, "lr": 8.957399038525742e-06, "epoch": 3.5847893114080165, "percentage": 71.77, "elapsed_time": "5:39:00", "remaining_time": "2:13:20"}
|
| 1116 |
+
{"current_steps": 873, "total_steps": 1215, "loss": 0.2805, "lr": 8.909515569238727e-06, "epoch": 3.588900308324769, "percentage": 71.85, "elapsed_time": "5:39:22", "remaining_time": "2:12:57"}
|
| 1117 |
+
{"current_steps": 874, "total_steps": 1215, "loss": 0.281, "lr": 8.861723724034256e-06, "epoch": 3.593011305241521, "percentage": 71.93, "elapsed_time": "5:39:45", "remaining_time": "2:12:33"}
|
| 1118 |
+
{"current_steps": 875, "total_steps": 1215, "loss": 0.2722, "lr": 8.814023897744861e-06, "epoch": 3.597122302158273, "percentage": 72.02, "elapsed_time": "5:40:08", "remaining_time": "2:12:09"}
|
| 1119 |
+
{"current_steps": 876, "total_steps": 1215, "loss": 0.288, "lr": 8.766416484442845e-06, "epoch": 3.6012332990750258, "percentage": 72.1, "elapsed_time": "5:40:31", "remaining_time": "2:11:46"}
|
| 1120 |
+
{"current_steps": 877, "total_steps": 1215, "loss": 0.2833, "lr": 8.71890187743705e-06, "epoch": 3.605344295991778, "percentage": 72.18, "elapsed_time": "5:40:55", "remaining_time": "2:11:23"}
|
| 1121 |
+
{"current_steps": 878, "total_steps": 1215, "loss": 0.2815, "lr": 8.6714804692696e-06, "epoch": 3.6094552929085304, "percentage": 72.26, "elapsed_time": "5:41:18", "remaining_time": "2:11:00"}
|
| 1122 |
+
{"current_steps": 879, "total_steps": 1215, "loss": 0.2796, "lr": 8.624152651712647e-06, "epoch": 3.6135662898252825, "percentage": 72.35, "elapsed_time": "5:41:41", "remaining_time": "2:10:36"}
|
| 1123 |
+
{"current_steps": 880, "total_steps": 1215, "loss": 0.276, "lr": 8.576918815765155e-06, "epoch": 3.617677286742035, "percentage": 72.43, "elapsed_time": "5:42:03", "remaining_time": "2:10:12"}
|
| 1124 |
+
{"current_steps": 881, "total_steps": 1215, "loss": 0.2793, "lr": 8.52977935164965e-06, "epoch": 3.621788283658787, "percentage": 72.51, "elapsed_time": "5:42:26", "remaining_time": "2:09:49"}
|
| 1125 |
+
{"current_steps": 882, "total_steps": 1215, "loss": 0.2828, "lr": 8.482734648808998e-06, "epoch": 3.6258992805755397, "percentage": 72.59, "elapsed_time": "5:42:49", "remaining_time": "2:09:26"}
|
| 1126 |
+
{"current_steps": 883, "total_steps": 1215, "loss": 0.2767, "lr": 8.435785095903226e-06, "epoch": 3.6300102774922918, "percentage": 72.67, "elapsed_time": "5:43:10", "remaining_time": "2:09:01"}
|
| 1127 |
+
{"current_steps": 884, "total_steps": 1215, "loss": 0.277, "lr": 8.388931080806244e-06, "epoch": 3.6341212744090443, "percentage": 72.76, "elapsed_time": "5:43:34", "remaining_time": "2:08:38"}
|
| 1128 |
+
{"current_steps": 885, "total_steps": 1215, "loss": 0.2743, "lr": 8.342172990602692e-06, "epoch": 3.6382322713257964, "percentage": 72.84, "elapsed_time": "5:43:56", "remaining_time": "2:08:14"}
|
| 1129 |
+
{"current_steps": 886, "total_steps": 1215, "loss": 0.2684, "lr": 8.295511211584726e-06, "epoch": 3.642343268242549, "percentage": 72.92, "elapsed_time": "5:44:19", "remaining_time": "2:07:51"}
|
| 1130 |
+
{"current_steps": 887, "total_steps": 1215, "loss": 0.2762, "lr": 8.248946129248821e-06, "epoch": 3.646454265159301, "percentage": 73.0, "elapsed_time": "5:44:42", "remaining_time": "2:07:28"}
|
| 1131 |
+
{"current_steps": 888, "total_steps": 1215, "loss": 0.279, "lr": 8.202478128292594e-06, "epoch": 3.6505652620760536, "percentage": 73.09, "elapsed_time": "5:45:06", "remaining_time": "2:07:04"}
|
| 1132 |
+
{"current_steps": 889, "total_steps": 1215, "loss": 0.2743, "lr": 8.15610759261163e-06, "epoch": 3.6546762589928057, "percentage": 73.17, "elapsed_time": "5:45:28", "remaining_time": "2:06:41"}
|
| 1133 |
+
{"current_steps": 890, "total_steps": 1215, "loss": 0.2687, "lr": 8.109834905296296e-06, "epoch": 3.6587872559095582, "percentage": 73.25, "elapsed_time": "5:45:50", "remaining_time": "2:06:17"}
|
| 1134 |
+
{"current_steps": 891, "total_steps": 1215, "loss": 0.2776, "lr": 8.06366044862859e-06, "epoch": 3.6628982528263103, "percentage": 73.33, "elapsed_time": "5:46:13", "remaining_time": "2:05:53"}
|
| 1135 |
+
{"current_steps": 892, "total_steps": 1215, "loss": 0.2801, "lr": 8.017584604078974e-06, "epoch": 3.667009249743063, "percentage": 73.42, "elapsed_time": "5:46:37", "remaining_time": "2:05:30"}
|
| 1136 |
+
{"current_steps": 893, "total_steps": 1215, "loss": 0.28, "lr": 7.971607752303226e-06, "epoch": 3.671120246659815, "percentage": 73.5, "elapsed_time": "5:47:00", "remaining_time": "2:05:07"}
|
| 1137 |
+
{"current_steps": 894, "total_steps": 1215, "loss": 0.2712, "lr": 7.925730273139294e-06, "epoch": 3.675231243576567, "percentage": 73.58, "elapsed_time": "5:47:22", "remaining_time": "2:04:43"}
|
| 1138 |
+
{"current_steps": 895, "total_steps": 1215, "loss": 0.2926, "lr": 7.879952545604163e-06, "epoch": 3.6793422404933196, "percentage": 73.66, "elapsed_time": "5:47:45", "remaining_time": "2:04:20"}
|
| 1139 |
+
{"current_steps": 896, "total_steps": 1215, "loss": 0.2798, "lr": 7.834274947890715e-06, "epoch": 3.683453237410072, "percentage": 73.74, "elapsed_time": "5:48:08", "remaining_time": "2:03:56"}
|
| 1140 |
+
{"current_steps": 897, "total_steps": 1215, "loss": 0.2694, "lr": 7.78869785736461e-06, "epoch": 3.6875642343268242, "percentage": 73.83, "elapsed_time": "5:48:30", "remaining_time": "2:03:32"}
|
| 1141 |
+
{"current_steps": 898, "total_steps": 1215, "loss": 0.2667, "lr": 7.74322165056117e-06, "epoch": 3.6916752312435763, "percentage": 73.91, "elapsed_time": "5:48:53", "remaining_time": "2:03:09"}
|
| 1142 |
+
{"current_steps": 899, "total_steps": 1215, "loss": 0.2784, "lr": 7.697846703182262e-06, "epoch": 3.695786228160329, "percentage": 73.99, "elapsed_time": "5:49:16", "remaining_time": "2:02:46"}
|
| 1143 |
+
{"current_steps": 900, "total_steps": 1215, "loss": 0.285, "lr": 7.652573390093199e-06, "epoch": 3.6998972250770814, "percentage": 74.07, "elapsed_time": "5:49:39", "remaining_time": "2:02:22"}
|
| 1144 |
+
{"current_steps": 901, "total_steps": 1215, "loss": 0.2759, "lr": 7.607402085319644e-06, "epoch": 3.7040082219938335, "percentage": 74.16, "elapsed_time": "5:50:02", "remaining_time": "2:01:59"}
|
| 1145 |
+
{"current_steps": 902, "total_steps": 1215, "loss": 0.2775, "lr": 7.562333162044508e-06, "epoch": 3.7081192189105856, "percentage": 74.24, "elapsed_time": "5:50:25", "remaining_time": "2:01:35"}
|
| 1146 |
+
{"current_steps": 903, "total_steps": 1215, "loss": 0.2767, "lr": 7.517366992604902e-06, "epoch": 3.712230215827338, "percentage": 74.32, "elapsed_time": "5:50:48", "remaining_time": "2:01:12"}
|
| 1147 |
+
{"current_steps": 904, "total_steps": 1215, "loss": 0.2874, "lr": 7.4725039484890094e-06, "epoch": 3.7163412127440907, "percentage": 74.4, "elapsed_time": "5:51:12", "remaining_time": "2:00:49"}
|
| 1148 |
+
{"current_steps": 905, "total_steps": 1215, "loss": 0.2789, "lr": 7.427744400333053e-06, "epoch": 3.720452209660843, "percentage": 74.49, "elapsed_time": "5:51:35", "remaining_time": "2:00:25"}
|
| 1149 |
+
{"current_steps": 906, "total_steps": 1215, "loss": 0.2748, "lr": 7.383088717918223e-06, "epoch": 3.724563206577595, "percentage": 74.57, "elapsed_time": "5:51:58", "remaining_time": "2:00:02"}
|
| 1150 |
+
{"current_steps": 907, "total_steps": 1215, "loss": 0.277, "lr": 7.338537270167625e-06, "epoch": 3.7286742034943474, "percentage": 74.65, "elapsed_time": "5:52:21", "remaining_time": "1:59:39"}
|
| 1151 |
+
{"current_steps": 908, "total_steps": 1215, "loss": 0.273, "lr": 7.294090425143225e-06, "epoch": 3.7327852004111, "percentage": 74.73, "elapsed_time": "5:52:41", "remaining_time": "1:59:14"}
|
| 1152 |
+
{"current_steps": 909, "total_steps": 1215, "loss": 0.2806, "lr": 7.249748550042817e-06, "epoch": 3.736896197327852, "percentage": 74.81, "elapsed_time": "5:53:04", "remaining_time": "1:58:51"}
|
| 1153 |
+
{"current_steps": 910, "total_steps": 1215, "loss": 0.2705, "lr": 7.20551201119698e-06, "epoch": 3.741007194244604, "percentage": 74.9, "elapsed_time": "5:53:26", "remaining_time": "1:58:27"}
|
| 1154 |
+
{"current_steps": 911, "total_steps": 1215, "loss": 0.2829, "lr": 7.161381174066065e-06, "epoch": 3.7451181911613567, "percentage": 74.98, "elapsed_time": "5:53:50", "remaining_time": "1:58:04"}
|
| 1155 |
+
{"current_steps": 912, "total_steps": 1215, "loss": 0.2813, "lr": 7.117356403237161e-06, "epoch": 3.749229188078109, "percentage": 75.06, "elapsed_time": "5:54:13", "remaining_time": "1:57:41"}
|
| 1156 |
+
{"current_steps": 913, "total_steps": 1215, "loss": 0.2782, "lr": 7.073438062421094e-06, "epoch": 3.7533401849948613, "percentage": 75.14, "elapsed_time": "5:54:36", "remaining_time": "1:57:17"}
|
| 1157 |
+
{"current_steps": 914, "total_steps": 1215, "loss": 0.27, "lr": 7.029626514449414e-06, "epoch": 3.7574511819116134, "percentage": 75.23, "elapsed_time": "5:54:59", "remaining_time": "1:56:54"}
|
| 1158 |
+
{"current_steps": 915, "total_steps": 1215, "loss": 0.2728, "lr": 6.985922121271409e-06, "epoch": 3.761562178828366, "percentage": 75.31, "elapsed_time": "5:55:22", "remaining_time": "1:56:30"}
|
| 1159 |
+
{"current_steps": 916, "total_steps": 1215, "loss": 0.2824, "lr": 6.942325243951098e-06, "epoch": 3.765673175745118, "percentage": 75.39, "elapsed_time": "5:55:44", "remaining_time": "1:56:07"}
|
| 1160 |
+
{"current_steps": 917, "total_steps": 1215, "loss": 0.282, "lr": 6.898836242664262e-06, "epoch": 3.7697841726618706, "percentage": 75.47, "elapsed_time": "5:56:07", "remaining_time": "1:55:43"}
|
| 1161 |
+
{"current_steps": 918, "total_steps": 1215, "loss": 0.2706, "lr": 6.855455476695465e-06, "epoch": 3.7738951695786227, "percentage": 75.56, "elapsed_time": "5:56:28", "remaining_time": "1:55:19"}
|
| 1162 |
+
{"current_steps": 919, "total_steps": 1215, "loss": 0.2801, "lr": 6.812183304435083e-06, "epoch": 3.7780061664953752, "percentage": 75.64, "elapsed_time": "5:56:52", "remaining_time": "1:54:56"}
|
| 1163 |
+
{"current_steps": 920, "total_steps": 1215, "loss": 0.2721, "lr": 6.769020083376341e-06, "epoch": 3.7821171634121273, "percentage": 75.72, "elapsed_time": "5:57:15", "remaining_time": "1:54:33"}
|
| 1164 |
+
{"current_steps": 921, "total_steps": 1215, "loss": 0.2686, "lr": 6.725966170112368e-06, "epoch": 3.78622816032888, "percentage": 75.8, "elapsed_time": "5:57:37", "remaining_time": "1:54:09"}
|
| 1165 |
+
{"current_steps": 922, "total_steps": 1215, "loss": 0.2721, "lr": 6.6830219203332415e-06, "epoch": 3.790339157245632, "percentage": 75.88, "elapsed_time": "5:57:58", "remaining_time": "1:53:45"}
|
| 1166 |
+
{"current_steps": 923, "total_steps": 1215, "loss": 0.2792, "lr": 6.640187688823065e-06, "epoch": 3.7944501541623845, "percentage": 75.97, "elapsed_time": "5:58:21", "remaining_time": "1:53:22"}
|
| 1167 |
+
{"current_steps": 924, "total_steps": 1215, "loss": 0.2799, "lr": 6.597463829457014e-06, "epoch": 3.7985611510791366, "percentage": 76.05, "elapsed_time": "5:58:44", "remaining_time": "1:52:58"}
|
| 1168 |
+
{"current_steps": 925, "total_steps": 1215, "loss": 0.2695, "lr": 6.554850695198427e-06, "epoch": 3.802672147995889, "percentage": 76.13, "elapsed_time": "5:59:06", "remaining_time": "1:52:35"}
|
| 1169 |
+
{"current_steps": 926, "total_steps": 1215, "loss": 0.2858, "lr": 6.512348638095887e-06, "epoch": 3.8067831449126412, "percentage": 76.21, "elapsed_time": "5:59:29", "remaining_time": "1:52:11"}
|
| 1170 |
+
{"current_steps": 927, "total_steps": 1215, "loss": 0.2681, "lr": 6.469958009280315e-06, "epoch": 3.810894141829394, "percentage": 76.3, "elapsed_time": "5:59:52", "remaining_time": "1:51:48"}
|
| 1171 |
+
{"current_steps": 928, "total_steps": 1215, "loss": 0.2852, "lr": 6.4276791589620595e-06, "epoch": 3.815005138746146, "percentage": 76.38, "elapsed_time": "6:00:15", "remaining_time": "1:51:25"}
|
| 1172 |
+
{"current_steps": 929, "total_steps": 1215, "loss": 0.2864, "lr": 6.385512436428021e-06, "epoch": 3.819116135662898, "percentage": 76.46, "elapsed_time": "6:00:37", "remaining_time": "1:51:01"}
|
| 1173 |
+
{"current_steps": 930, "total_steps": 1215, "loss": 0.2727, "lr": 6.343458190038747e-06, "epoch": 3.8232271325796505, "percentage": 76.54, "elapsed_time": "6:01:01", "remaining_time": "1:50:38"}
|
| 1174 |
+
{"current_steps": 931, "total_steps": 1215, "loss": 0.2739, "lr": 6.301516767225568e-06, "epoch": 3.827338129496403, "percentage": 76.63, "elapsed_time": "6:01:24", "remaining_time": "1:50:14"}
|
| 1175 |
+
{"current_steps": 932, "total_steps": 1215, "loss": 0.2758, "lr": 6.259688514487718e-06, "epoch": 3.831449126413155, "percentage": 76.71, "elapsed_time": "6:01:48", "remaining_time": "1:49:51"}
|
| 1176 |
+
{"current_steps": 933, "total_steps": 1215, "loss": 0.2761, "lr": 6.217973777389483e-06, "epoch": 3.8355601233299073, "percentage": 76.79, "elapsed_time": "6:02:11", "remaining_time": "1:49:28"}
|
| 1177 |
+
{"current_steps": 934, "total_steps": 1215, "loss": 0.2829, "lr": 6.1763729005573284e-06, "epoch": 3.83967112024666, "percentage": 76.87, "elapsed_time": "6:02:34", "remaining_time": "1:49:04"}
|
| 1178 |
+
{"current_steps": 935, "total_steps": 1215, "loss": 0.2922, "lr": 6.134886227677073e-06, "epoch": 3.8437821171634123, "percentage": 76.95, "elapsed_time": "6:02:57", "remaining_time": "1:48:41"}
|
| 1179 |
+
{"current_steps": 936, "total_steps": 1215, "loss": 0.2763, "lr": 6.093514101491034e-06, "epoch": 3.8478931140801644, "percentage": 77.04, "elapsed_time": "6:03:20", "remaining_time": "1:48:18"}
|
| 1180 |
+
{"current_steps": 937, "total_steps": 1215, "loss": 0.2711, "lr": 6.052256863795198e-06, "epoch": 3.8520041109969165, "percentage": 77.12, "elapsed_time": "6:03:44", "remaining_time": "1:47:55"}
|
| 1181 |
+
{"current_steps": 938, "total_steps": 1215, "loss": 0.2799, "lr": 6.0111148554364084e-06, "epoch": 3.856115107913669, "percentage": 77.2, "elapsed_time": "6:04:06", "remaining_time": "1:47:31"}
|
| 1182 |
+
{"current_steps": 939, "total_steps": 1215, "loss": 0.2689, "lr": 5.970088416309532e-06, "epoch": 3.8602261048304216, "percentage": 77.28, "elapsed_time": "6:04:29", "remaining_time": "1:47:08"}
|
| 1183 |
+
{"current_steps": 940, "total_steps": 1215, "loss": 0.279, "lr": 5.929177885354665e-06, "epoch": 3.8643371017471737, "percentage": 77.37, "elapsed_time": "6:04:51", "remaining_time": "1:46:44"}
|
| 1184 |
+
{"current_steps": 941, "total_steps": 1215, "loss": 0.2769, "lr": 5.888383600554326e-06, "epoch": 3.868448098663926, "percentage": 77.45, "elapsed_time": "6:05:14", "remaining_time": "1:46:21"}
|
| 1185 |
+
{"current_steps": 942, "total_steps": 1215, "loss": 0.2902, "lr": 5.8477058989306605e-06, "epoch": 3.8725590955806783, "percentage": 77.53, "elapsed_time": "6:05:37", "remaining_time": "1:45:57"}
|
| 1186 |
+
{"current_steps": 943, "total_steps": 1215, "loss": 0.2772, "lr": 5.807145116542678e-06, "epoch": 3.876670092497431, "percentage": 77.61, "elapsed_time": "6:06:00", "remaining_time": "1:45:34"}
|
| 1187 |
+
{"current_steps": 944, "total_steps": 1215, "loss": 0.2766, "lr": 5.766701588483443e-06, "epoch": 3.880781089414183, "percentage": 77.7, "elapsed_time": "6:06:24", "remaining_time": "1:45:11"}
|
| 1188 |
+
{"current_steps": 945, "total_steps": 1215, "loss": 0.2711, "lr": 5.726375648877329e-06, "epoch": 3.884892086330935, "percentage": 77.78, "elapsed_time": "6:06:47", "remaining_time": "1:44:47"}
|
| 1189 |
+
{"current_steps": 946, "total_steps": 1215, "loss": 0.2637, "lr": 5.68616763087725e-06, "epoch": 3.8890030832476876, "percentage": 77.86, "elapsed_time": "6:07:08", "remaining_time": "1:44:24"}
|
| 1190 |
+
{"current_steps": 947, "total_steps": 1215, "loss": 0.2728, "lr": 5.646077866661912e-06, "epoch": 3.8931140801644397, "percentage": 77.94, "elapsed_time": "6:07:32", "remaining_time": "1:44:00"}
|
| 1191 |
+
{"current_steps": 948, "total_steps": 1215, "loss": 0.277, "lr": 5.606106687433066e-06, "epoch": 3.8972250770811923, "percentage": 78.02, "elapsed_time": "6:07:55", "remaining_time": "1:43:37"}
|
| 1192 |
+
{"current_steps": 949, "total_steps": 1215, "loss": 0.2852, "lr": 5.5662544234127735e-06, "epoch": 3.9013360739979444, "percentage": 78.11, "elapsed_time": "6:08:18", "remaining_time": "1:43:14"}
|
| 1193 |
+
{"current_steps": 950, "total_steps": 1215, "loss": 0.2724, "lr": 5.526521403840677e-06, "epoch": 3.905447070914697, "percentage": 78.19, "elapsed_time": "6:08:41", "remaining_time": "1:42:50"}
|
| 1194 |
+
{"current_steps": 951, "total_steps": 1215, "loss": 0.2654, "lr": 5.486907956971277e-06, "epoch": 3.909558067831449, "percentage": 78.27, "elapsed_time": "6:09:03", "remaining_time": "1:42:26"}
|
| 1195 |
+
{"current_steps": 952, "total_steps": 1215, "loss": 0.28, "lr": 5.447414410071232e-06, "epoch": 3.9136690647482015, "percentage": 78.35, "elapsed_time": "6:09:24", "remaining_time": "1:42:03"}
|
| 1196 |
+
{"current_steps": 953, "total_steps": 1215, "loss": 0.2809, "lr": 5.40804108941664e-06, "epoch": 3.9177800616649536, "percentage": 78.44, "elapsed_time": "6:09:48", "remaining_time": "1:41:39"}
|
| 1197 |
+
{"current_steps": 954, "total_steps": 1215, "loss": 0.2753, "lr": 5.36878832029035e-06, "epoch": 3.921891058581706, "percentage": 78.52, "elapsed_time": "6:10:11", "remaining_time": "1:41:16"}
|
| 1198 |
+
{"current_steps": 955, "total_steps": 1215, "loss": 0.2844, "lr": 5.329656426979275e-06, "epoch": 3.9260020554984583, "percentage": 78.6, "elapsed_time": "6:10:35", "remaining_time": "1:40:53"}
|
| 1199 |
+
{"current_steps": 956, "total_steps": 1215, "loss": 0.2776, "lr": 5.290645732771711e-06, "epoch": 3.930113052415211, "percentage": 78.68, "elapsed_time": "6:10:59", "remaining_time": "1:40:30"}
|
| 1200 |
+
{"current_steps": 957, "total_steps": 1215, "loss": 0.2752, "lr": 5.251756559954668e-06, "epoch": 3.934224049331963, "percentage": 78.77, "elapsed_time": "6:11:21", "remaining_time": "1:40:07"}
|
| 1201 |
+
{"current_steps": 958, "total_steps": 1215, "loss": 0.2703, "lr": 5.212989229811209e-06, "epoch": 3.9383350462487154, "percentage": 78.85, "elapsed_time": "6:11:45", "remaining_time": "1:39:43"}
|
| 1202 |
+
{"current_steps": 959, "total_steps": 1215, "loss": 0.2817, "lr": 5.174344062617789e-06, "epoch": 3.9424460431654675, "percentage": 78.93, "elapsed_time": "6:12:07", "remaining_time": "1:39:20"}
|
| 1203 |
+
{"current_steps": 960, "total_steps": 1215, "loss": 0.2787, "lr": 5.135821377641616e-06, "epoch": 3.94655704008222, "percentage": 79.01, "elapsed_time": "6:12:30", "remaining_time": "1:38:56"}
|
| 1204 |
+
{"current_steps": 961, "total_steps": 1215, "loss": 0.2766, "lr": 5.097421493138008e-06, "epoch": 3.950668036998972, "percentage": 79.09, "elapsed_time": "6:12:53", "remaining_time": "1:38:33"}
|
| 1205 |
+
{"current_steps": 962, "total_steps": 1215, "loss": 0.2728, "lr": 5.059144726347765e-06, "epoch": 3.9547790339157247, "percentage": 79.18, "elapsed_time": "6:13:16", "remaining_time": "1:38:10"}
|
| 1206 |
+
{"current_steps": 963, "total_steps": 1215, "loss": 0.2867, "lr": 5.020991393494558e-06, "epoch": 3.958890030832477, "percentage": 79.26, "elapsed_time": "6:13:39", "remaining_time": "1:37:46"}
|
| 1207 |
+
{"current_steps": 964, "total_steps": 1215, "loss": 0.2675, "lr": 4.9829618097823055e-06, "epoch": 3.963001027749229, "percentage": 79.34, "elapsed_time": "6:14:03", "remaining_time": "1:37:23"}
|
| 1208 |
+
{"current_steps": 965, "total_steps": 1215, "loss": 0.2765, "lr": 4.945056289392565e-06, "epoch": 3.9671120246659815, "percentage": 79.42, "elapsed_time": "6:14:26", "remaining_time": "1:37:00"}
|
| 1209 |
+
{"current_steps": 966, "total_steps": 1215, "loss": 0.2731, "lr": 4.907275145481947e-06, "epoch": 3.971223021582734, "percentage": 79.51, "elapsed_time": "6:14:49", "remaining_time": "1:36:37"}
|
| 1210 |
+
{"current_steps": 967, "total_steps": 1215, "loss": 0.2817, "lr": 4.8696186901795275e-06, "epoch": 3.975334018499486, "percentage": 79.59, "elapsed_time": "6:15:13", "remaining_time": "1:36:13"}
|
| 1211 |
+
{"current_steps": 968, "total_steps": 1215, "loss": 0.2783, "lr": 4.832087234584266e-06, "epoch": 3.979445015416238, "percentage": 79.67, "elapsed_time": "6:15:36", "remaining_time": "1:35:50"}
|
| 1212 |
+
{"current_steps": 969, "total_steps": 1215, "loss": 0.2744, "lr": 4.794681088762438e-06, "epoch": 3.9835560123329907, "percentage": 79.75, "elapsed_time": "6:15:59", "remaining_time": "1:35:27"}
|
| 1213 |
+
{"current_steps": 970, "total_steps": 1215, "loss": 0.2762, "lr": 4.757400561745069e-06, "epoch": 3.9876670092497433, "percentage": 79.84, "elapsed_time": "6:16:21", "remaining_time": "1:35:03"}
|
| 1214 |
+
{"current_steps": 971, "total_steps": 1215, "loss": 0.2949, "lr": 4.720245961525387e-06, "epoch": 3.9917780061664954, "percentage": 79.92, "elapsed_time": "6:16:45", "remaining_time": "1:34:40"}
|
| 1215 |
+
{"current_steps": 972, "total_steps": 1215, "loss": 0.2746, "lr": 4.683217595056275e-06, "epoch": 3.9958890030832475, "percentage": 80.0, "elapsed_time": "6:17:08", "remaining_time": "1:34:17"}
|
| 1216 |
+
{"current_steps": 973, "total_steps": 1215, "loss": 0.2868, "lr": 4.646315768247731e-06, "epoch": 4.0, "percentage": 80.08, "elapsed_time": "6:17:31", "remaining_time": "1:33:53"}
|
| 1217 |
+
{"current_steps": 974, "total_steps": 1215, "loss": 0.2379, "lr": 4.609540785964348e-06, "epoch": 4.0041109969167525, "percentage": 80.16, "elapsed_time": "6:19:33", "remaining_time": "1:33:54"}
|
| 1218 |
+
{"current_steps": 975, "total_steps": 1215, "loss": 0.2495, "lr": 4.572892952022796e-06, "epoch": 4.008221993833504, "percentage": 80.25, "elapsed_time": "6:19:56", "remaining_time": "1:33:31"}
|
| 1219 |
+
{"current_steps": 976, "total_steps": 1215, "loss": 0.2434, "lr": 4.5363725691893045e-06, "epoch": 4.012332990750257, "percentage": 80.33, "elapsed_time": "6:20:20", "remaining_time": "1:33:08"}
|
| 1220 |
+
{"current_steps": 977, "total_steps": 1215, "loss": 0.2413, "lr": 4.499979939177164e-06, "epoch": 4.016443987667009, "percentage": 80.41, "elapsed_time": "6:20:43", "remaining_time": "1:32:44"}
|
| 1221 |
+
{"current_steps": 978, "total_steps": 1215, "loss": 0.2415, "lr": 4.463715362644239e-06, "epoch": 4.020554984583762, "percentage": 80.49, "elapsed_time": "6:21:07", "remaining_time": "1:32:21"}
|
| 1222 |
+
{"current_steps": 979, "total_steps": 1215, "loss": 0.2353, "lr": 4.427579139190474e-06, "epoch": 4.0246659815005135, "percentage": 80.58, "elapsed_time": "6:21:29", "remaining_time": "1:31:57"}
|
| 1223 |
+
{"current_steps": 980, "total_steps": 1215, "loss": 0.244, "lr": 4.391571567355428e-06, "epoch": 4.028776978417266, "percentage": 80.66, "elapsed_time": "6:21:52", "remaining_time": "1:31:34"}
|
| 1224 |
+
{"current_steps": 981, "total_steps": 1215, "loss": 0.2446, "lr": 4.355692944615806e-06, "epoch": 4.0328879753340185, "percentage": 80.74, "elapsed_time": "6:22:15", "remaining_time": "1:31:10"}
|
| 1225 |
+
{"current_steps": 982, "total_steps": 1215, "loss": 0.2446, "lr": 4.319943567382991e-06, "epoch": 4.036998972250771, "percentage": 80.82, "elapsed_time": "6:22:38", "remaining_time": "1:30:47"}
|
| 1226 |
+
{"current_steps": 983, "total_steps": 1215, "loss": 0.2383, "lr": 4.28432373100061e-06, "epoch": 4.041109969167523, "percentage": 80.91, "elapsed_time": "6:23:00", "remaining_time": "1:30:23"}
|
| 1227 |
+
{"current_steps": 984, "total_steps": 1215, "loss": 0.2335, "lr": 4.248833729742095e-06, "epoch": 4.045220966084275, "percentage": 80.99, "elapsed_time": "6:23:23", "remaining_time": "1:30:00"}
|
| 1228 |
+
{"current_steps": 985, "total_steps": 1215, "loss": 0.2388, "lr": 4.2134738568082325e-06, "epoch": 4.049331963001028, "percentage": 81.07, "elapsed_time": "6:23:46", "remaining_time": "1:29:36"}
|
| 1229 |
+
{"current_steps": 986, "total_steps": 1215, "loss": 0.2386, "lr": 4.1782444043247565e-06, "epoch": 4.05344295991778, "percentage": 81.15, "elapsed_time": "6:24:09", "remaining_time": "1:29:13"}
|
| 1230 |
+
{"current_steps": 987, "total_steps": 1215, "loss": 0.2447, "lr": 4.143145663339932e-06, "epoch": 4.057553956834532, "percentage": 81.23, "elapsed_time": "6:24:31", "remaining_time": "1:28:49"}
|
| 1231 |
+
{"current_steps": 988, "total_steps": 1215, "loss": 0.2426, "lr": 4.108177923822154e-06, "epoch": 4.061664953751285, "percentage": 81.32, "elapsed_time": "6:24:55", "remaining_time": "1:28:26"}
|
| 1232 |
+
{"current_steps": 989, "total_steps": 1215, "loss": 0.2482, "lr": 4.073341474657544e-06, "epoch": 4.065775950668037, "percentage": 81.4, "elapsed_time": "6:25:18", "remaining_time": "1:28:02"}
|
| 1233 |
+
{"current_steps": 990, "total_steps": 1215, "loss": 0.2389, "lr": 4.03863660364757e-06, "epoch": 4.06988694758479, "percentage": 81.48, "elapsed_time": "6:25:41", "remaining_time": "1:27:39"}
|
| 1234 |
+
{"current_steps": 991, "total_steps": 1215, "loss": 0.2337, "lr": 4.004063597506664e-06, "epoch": 4.073997944501541, "percentage": 81.56, "elapsed_time": "6:26:04", "remaining_time": "1:27:15"}
|
| 1235 |
+
{"current_steps": 992, "total_steps": 1215, "loss": 0.2477, "lr": 3.969622741859862e-06, "epoch": 4.078108941418294, "percentage": 81.65, "elapsed_time": "6:26:27", "remaining_time": "1:26:52"}
|
| 1236 |
+
{"current_steps": 993, "total_steps": 1215, "loss": 0.2405, "lr": 3.935314321240433e-06, "epoch": 4.082219938335046, "percentage": 81.73, "elapsed_time": "6:26:50", "remaining_time": "1:26:29"}
|
| 1237 |
+
{"current_steps": 994, "total_steps": 1215, "loss": 0.2394, "lr": 3.90113861908753e-06, "epoch": 4.086330935251799, "percentage": 81.81, "elapsed_time": "6:27:13", "remaining_time": "1:26:05"}
|
| 1238 |
+
{"current_steps": 995, "total_steps": 1215, "loss": 0.2326, "lr": 3.867095917743862e-06, "epoch": 4.090441932168551, "percentage": 81.89, "elapsed_time": "6:27:35", "remaining_time": "1:25:42"}
|
| 1239 |
+
{"current_steps": 996, "total_steps": 1215, "loss": 0.2362, "lr": 3.8331864984533404e-06, "epoch": 4.094552929085303, "percentage": 81.98, "elapsed_time": "6:27:57", "remaining_time": "1:25:18"}
|
| 1240 |
+
{"current_steps": 997, "total_steps": 1215, "loss": 0.2462, "lr": 3.799410641358776e-06, "epoch": 4.098663926002056, "percentage": 82.06, "elapsed_time": "6:28:20", "remaining_time": "1:24:54"}
|
| 1241 |
+
{"current_steps": 998, "total_steps": 1215, "loss": 0.2404, "lr": 3.7657686254995483e-06, "epoch": 4.102774922918808, "percentage": 82.14, "elapsed_time": "6:28:42", "remaining_time": "1:24:31"}
|
| 1242 |
+
{"current_steps": 999, "total_steps": 1215, "loss": 0.2398, "lr": 3.7322607288093117e-06, "epoch": 4.10688591983556, "percentage": 82.22, "elapsed_time": "6:29:05", "remaining_time": "1:24:07"}
|
| 1243 |
+
{"current_steps": 1000, "total_steps": 1215, "loss": 0.2363, "lr": 3.6988872281136855e-06, "epoch": 4.110996916752312, "percentage": 82.3, "elapsed_time": "6:29:27", "remaining_time": "1:23:44"}
|
| 1244 |
+
{"current_steps": 1001, "total_steps": 1215, "loss": 0.2318, "lr": 3.66564839912799e-06, "epoch": 4.115107913669065, "percentage": 82.39, "elapsed_time": "6:29:51", "remaining_time": "1:23:20"}
|
| 1245 |
+
{"current_steps": 1002, "total_steps": 1215, "loss": 0.2359, "lr": 3.632544516454941e-06, "epoch": 4.1192189105858175, "percentage": 82.47, "elapsed_time": "6:30:15", "remaining_time": "1:22:57"}
|
| 1246 |
+
{"current_steps": 1003, "total_steps": 1215, "loss": 0.2316, "lr": 3.5995758535823997e-06, "epoch": 4.123329907502569, "percentage": 82.55, "elapsed_time": "6:30:38", "remaining_time": "1:22:34"}
|
| 1247 |
+
{"current_steps": 1004, "total_steps": 1215, "loss": 0.2608, "lr": 3.566742682881119e-06, "epoch": 4.127440904419322, "percentage": 82.63, "elapsed_time": "6:31:00", "remaining_time": "1:22:10"}
|
| 1248 |
+
{"current_steps": 1005, "total_steps": 1215, "loss": 0.242, "lr": 3.534045275602467e-06, "epoch": 4.131551901336074, "percentage": 82.72, "elapsed_time": "6:31:22", "remaining_time": "1:21:46"}
|
| 1249 |
+
{"current_steps": 1006, "total_steps": 1215, "loss": 0.244, "lr": 3.501483901876208e-06, "epoch": 4.135662898252827, "percentage": 82.8, "elapsed_time": "6:31:44", "remaining_time": "1:21:23"}
|
| 1250 |
+
{"current_steps": 1007, "total_steps": 1215, "loss": 0.2324, "lr": 3.469058830708263e-06, "epoch": 4.139773895169578, "percentage": 82.88, "elapsed_time": "6:32:07", "remaining_time": "1:20:59"}
|
| 1251 |
+
{"current_steps": 1008, "total_steps": 1215, "loss": 0.2481, "lr": 3.436770329978494e-06, "epoch": 4.143884892086331, "percentage": 82.96, "elapsed_time": "6:32:30", "remaining_time": "1:20:36"}
|
| 1252 |
+
{"current_steps": 1009, "total_steps": 1215, "loss": 0.2432, "lr": 3.4046186664384795e-06, "epoch": 4.1479958890030835, "percentage": 83.05, "elapsed_time": "6:32:53", "remaining_time": "1:20:12"}
|
| 1253 |
+
{"current_steps": 1010, "total_steps": 1215, "loss": 0.2386, "lr": 3.3726041057093186e-06, "epoch": 4.152106885919835, "percentage": 83.13, "elapsed_time": "6:33:15", "remaining_time": "1:19:49"}
|
| 1254 |
+
{"current_steps": 1011, "total_steps": 1215, "loss": 0.2487, "lr": 3.3407269122794373e-06, "epoch": 4.156217882836588, "percentage": 83.21, "elapsed_time": "6:33:39", "remaining_time": "1:19:25"}
|
| 1255 |
+
{"current_steps": 1012, "total_steps": 1215, "loss": 0.234, "lr": 3.3089873495023995e-06, "epoch": 4.16032887975334, "percentage": 83.29, "elapsed_time": "6:34:01", "remaining_time": "1:19:02"}
|
| 1256 |
+
{"current_steps": 1013, "total_steps": 1215, "loss": 0.2339, "lr": 3.2773856795947336e-06, "epoch": 4.164439876670093, "percentage": 83.37, "elapsed_time": "6:34:24", "remaining_time": "1:18:38"}
|
| 1257 |
+
{"current_steps": 1014, "total_steps": 1215, "loss": 0.2379, "lr": 3.2459221636337633e-06, "epoch": 4.168550873586844, "percentage": 83.46, "elapsed_time": "6:34:46", "remaining_time": "1:18:15"}
|
| 1258 |
+
{"current_steps": 1015, "total_steps": 1215, "loss": 0.2292, "lr": 3.214597061555458e-06, "epoch": 4.172661870503597, "percentage": 83.54, "elapsed_time": "6:35:09", "remaining_time": "1:17:51"}
|
| 1259 |
+
{"current_steps": 1016, "total_steps": 1215, "loss": 0.2371, "lr": 3.1834106321522727e-06, "epoch": 4.1767728674203495, "percentage": 83.62, "elapsed_time": "6:35:32", "remaining_time": "1:17:28"}
|
| 1260 |
+
{"current_steps": 1017, "total_steps": 1215, "loss": 0.2433, "lr": 3.152363133071024e-06, "epoch": 4.180883864337102, "percentage": 83.7, "elapsed_time": "6:35:56", "remaining_time": "1:17:05"}
|
| 1261 |
+
{"current_steps": 1018, "total_steps": 1215, "loss": 0.2373, "lr": 3.12145482081075e-06, "epoch": 4.184994861253854, "percentage": 83.79, "elapsed_time": "6:36:19", "remaining_time": "1:16:41"}
|
| 1262 |
+
{"current_steps": 1019, "total_steps": 1215, "loss": 0.2425, "lr": 3.0906859507206044e-06, "epoch": 4.189105858170606, "percentage": 83.87, "elapsed_time": "6:36:42", "remaining_time": "1:16:18"}
|
| 1263 |
+
{"current_steps": 1020, "total_steps": 1215, "loss": 0.2388, "lr": 3.0600567769977286e-06, "epoch": 4.193216855087359, "percentage": 83.95, "elapsed_time": "6:37:05", "remaining_time": "1:15:54"}
|
| 1264 |
+
{"current_steps": 1021, "total_steps": 1215, "loss": 0.2327, "lr": 3.0295675526851686e-06, "epoch": 4.197327852004111, "percentage": 84.03, "elapsed_time": "6:37:26", "remaining_time": "1:15:31"}
|
| 1265 |
+
{"current_steps": 1022, "total_steps": 1215, "loss": 0.2494, "lr": 2.9992185296697763e-06, "epoch": 4.201438848920863, "percentage": 84.12, "elapsed_time": "6:37:50", "remaining_time": "1:15:07"}
|
| 1266 |
+
{"current_steps": 1023, "total_steps": 1215, "loss": 0.2431, "lr": 2.9690099586801223e-06, "epoch": 4.2055498458376155, "percentage": 84.2, "elapsed_time": "6:38:14", "remaining_time": "1:14:44"}
|
| 1267 |
+
{"current_steps": 1024, "total_steps": 1215, "loss": 0.2243, "lr": 2.938942089284453e-06, "epoch": 4.209660842754368, "percentage": 84.28, "elapsed_time": "6:38:36", "remaining_time": "1:14:20"}
|
| 1268 |
+
{"current_steps": 1025, "total_steps": 1215, "loss": 0.2361, "lr": 2.909015169888587e-06, "epoch": 4.213771839671121, "percentage": 84.36, "elapsed_time": "6:38:59", "remaining_time": "1:13:57"}
|
| 1269 |
+
{"current_steps": 1026, "total_steps": 1215, "loss": 0.2438, "lr": 2.879229447733893e-06, "epoch": 4.217882836587872, "percentage": 84.44, "elapsed_time": "6:39:22", "remaining_time": "1:13:34"}
|
| 1270 |
+
{"current_steps": 1027, "total_steps": 1215, "loss": 0.2372, "lr": 2.849585168895237e-06, "epoch": 4.221993833504625, "percentage": 84.53, "elapsed_time": "6:39:46", "remaining_time": "1:13:10"}
|
| 1271 |
+
{"current_steps": 1028, "total_steps": 1215, "loss": 0.2389, "lr": 2.8200825782789466e-06, "epoch": 4.226104830421377, "percentage": 84.61, "elapsed_time": "6:40:09", "remaining_time": "1:12:47"}
|
| 1272 |
+
{"current_steps": 1029, "total_steps": 1215, "loss": 0.2299, "lr": 2.790721919620798e-06, "epoch": 4.23021582733813, "percentage": 84.69, "elapsed_time": "6:40:32", "remaining_time": "1:12:24"}
|
| 1273 |
+
{"current_steps": 1030, "total_steps": 1215, "loss": 0.2346, "lr": 2.7615034354839942e-06, "epoch": 4.2343268242548815, "percentage": 84.77, "elapsed_time": "6:40:54", "remaining_time": "1:12:00"}
|
| 1274 |
+
{"current_steps": 1031, "total_steps": 1215, "loss": 0.2337, "lr": 2.7324273672571577e-06, "epoch": 4.238437821171634, "percentage": 84.86, "elapsed_time": "6:41:18", "remaining_time": "1:11:37"}
|