Training in progress, epoch 1
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +184 -0
- training_args.bin +1 -1
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c28f7d616133401fa097e96bb93608bc9c821a761c54e5851bdf3c2ebb5d2c0
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e6a5350c9ffd6c2c60990c003833a7509d71eca0a87c1afb3759f49d4919207
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa0fbae6565c6fe5e0c3dfbb8cdea9ae8462320cdcd363e94cc8db5b49cd1233
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96fa2b434d8b8e75863470ff4aaf86e3540056bf0f4706b1df21f807f9033739
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -899,3 +899,187 @@
|
|
| 899 |
{"current_steps": 404, "total_steps": 1230, "loss": 0.3535, "lr": 3.3970539735870996e-05, "epoch": 1.6379746835443036, "percentage": 32.85, "elapsed_time": "9:40:11", "remaining_time": "19:46:13"}
|
| 900 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.2471, "lr": 2.980274210295326e-05, "epoch": 2.012151898734177, "percentage": 40.33, "elapsed_time": "11:52:10", "remaining_time": "17:33:54"}
|
| 901 |
{"current_steps": 405, "total_steps": 1230, "loss": 0.3353, "lr": 3.392986794874714e-05, "epoch": 1.6420253164556962, "percentage": 32.93, "elapsed_time": "9:41:25", "remaining_time": "19:44:22"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 899 |
{"current_steps": 404, "total_steps": 1230, "loss": 0.3535, "lr": 3.3970539735870996e-05, "epoch": 1.6379746835443036, "percentage": 32.85, "elapsed_time": "9:40:11", "remaining_time": "19:46:13"}
|
| 900 |
{"current_steps": 496, "total_steps": 1230, "loss": 0.2471, "lr": 2.980274210295326e-05, "epoch": 2.012151898734177, "percentage": 40.33, "elapsed_time": "11:52:10", "remaining_time": "17:33:54"}
|
| 901 |
{"current_steps": 405, "total_steps": 1230, "loss": 0.3353, "lr": 3.392986794874714e-05, "epoch": 1.6420253164556962, "percentage": 32.93, "elapsed_time": "9:41:25", "remaining_time": "19:44:22"}
|
| 902 |
+
{"current_steps": 497, "total_steps": 1230, "loss": 0.238, "lr": 2.9753229259313578e-05, "epoch": 2.0162025316455696, "percentage": 40.41, "elapsed_time": "11:53:39", "remaining_time": "17:32:32"}
|
| 903 |
+
{"current_steps": 406, "total_steps": 1230, "loss": 0.3471, "lr": 3.388908397238184e-05, "epoch": 1.6460759493670887, "percentage": 33.01, "elapsed_time": "9:42:46", "remaining_time": "19:42:45"}
|
| 904 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.24, "lr": 2.9703637864506274e-05, "epoch": 2.020253164556962, "percentage": 40.49, "elapsed_time": "11:54:53", "remaining_time": "17:30:48"}
|
| 905 |
+
{"current_steps": 407, "total_steps": 1230, "loss": 0.3343, "lr": 3.384818813524362e-05, "epoch": 1.650126582278481, "percentage": 33.09, "elapsed_time": "9:44:05", "remaining_time": "19:41:06"}
|
| 906 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.2597, "lr": 2.965396831793362e-05, "epoch": 2.0243037974683546, "percentage": 40.57, "elapsed_time": "11:56:36", "remaining_time": "17:29:46"}
|
| 907 |
+
{"current_steps": 408, "total_steps": 1230, "loss": 0.3497, "lr": 3.380718076670195e-05, "epoch": 1.6541772151898733, "percentage": 33.17, "elapsed_time": "9:45:38", "remaining_time": "19:39:53"}
|
| 908 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.2342, "lr": 2.9604221019627316e-05, "epoch": 2.0283544303797467, "percentage": 40.65, "elapsed_time": "11:58:02", "remaining_time": "17:28:20"}
|
| 909 |
+
{"current_steps": 409, "total_steps": 1230, "loss": 0.3512, "lr": 3.376606219702454e-05, "epoch": 1.6582278481012658, "percentage": 33.25, "elapsed_time": "9:46:55", "remaining_time": "19:38:09"}
|
| 910 |
+
{"current_steps": 410, "total_steps": 1230, "loss": 0.3333, "lr": 3.372483275737468e-05, "epoch": 1.6622784810126583, "percentage": 33.33, "elapsed_time": "9:48:09", "remaining_time": "19:36:18"}
|
| 911 |
+
{"current_steps": 501, "total_steps": 1230, "loss": 0.2568, "lr": 2.955439637024526e-05, "epoch": 2.0324050632911392, "percentage": 40.73, "elapsed_time": "11:59:24", "remaining_time": "17:26:48"}
|
| 912 |
+
{"current_steps": 502, "total_steps": 1230, "loss": 0.2616, "lr": 2.9504494771068334e-05, "epoch": 2.0364556962025318, "percentage": 40.81, "elapsed_time": "12:00:44", "remaining_time": "17:25:13"}
|
| 913 |
+
{"current_steps": 411, "total_steps": 1230, "loss": 0.3387, "lr": 3.368349277980861e-05, "epoch": 1.6663291139240506, "percentage": 33.41, "elapsed_time": "9:49:46", "remaining_time": "19:35:14"}
|
| 914 |
+
{"current_steps": 503, "total_steps": 1230, "loss": 0.2345, "lr": 2.9454516623997156e-05, "epoch": 2.0405063291139243, "percentage": 40.89, "elapsed_time": "12:02:04", "remaining_time": "17:23:37"}
|
| 915 |
+
{"current_steps": 412, "total_steps": 1230, "loss": 0.3445, "lr": 3.3642042597272844e-05, "epoch": 1.6703797468354429, "percentage": 33.5, "elapsed_time": "9:51:04", "remaining_time": "19:33:33"}
|
| 916 |
+
{"current_steps": 504, "total_steps": 1230, "loss": 0.2349, "lr": 2.9404462331548847e-05, "epoch": 2.0445569620253163, "percentage": 40.98, "elapsed_time": "12:03:19", "remaining_time": "17:21:55"}
|
| 917 |
+
{"current_steps": 413, "total_steps": 1230, "loss": 0.3215, "lr": 3.360048254360144e-05, "epoch": 1.6744303797468354, "percentage": 33.58, "elapsed_time": "9:52:24", "remaining_time": "19:31:54"}
|
| 918 |
+
{"current_steps": 505, "total_steps": 1230, "loss": 0.26, "lr": 2.93543322968538e-05, "epoch": 2.048607594936709, "percentage": 41.06, "elapsed_time": "12:04:51", "remaining_time": "17:20:38"}
|
| 919 |
+
{"current_steps": 414, "total_steps": 1230, "loss": 0.3425, "lr": 3.355881295351336e-05, "epoch": 1.678481012658228, "percentage": 33.66, "elapsed_time": "9:53:50", "remaining_time": "19:30:28"}
|
| 920 |
+
{"current_steps": 415, "total_steps": 1230, "loss": 0.3318, "lr": 3.351703416260975e-05, "epoch": 1.6825316455696202, "percentage": 33.74, "elapsed_time": "9:55:13", "remaining_time": "19:28:56"}
|
| 921 |
+
{"current_steps": 506, "total_steps": 1230, "loss": 0.2407, "lr": 2.9304126923652428e-05, "epoch": 2.0526582278481014, "percentage": 41.14, "elapsed_time": "12:06:36", "remaining_time": "17:19:39"}
|
| 922 |
+
{"current_steps": 416, "total_steps": 1230, "loss": 0.3405, "lr": 3.347514650737126e-05, "epoch": 1.6865822784810125, "percentage": 33.82, "elapsed_time": "9:56:38", "remaining_time": "19:27:27"}
|
| 923 |
+
{"current_steps": 507, "total_steps": 1230, "loss": 0.2789, "lr": 2.9253846616291896e-05, "epoch": 2.056708860759494, "percentage": 41.22, "elapsed_time": "12:08:03", "remaining_time": "17:18:14"}
|
| 924 |
+
{"current_steps": 417, "total_steps": 1230, "loss": 0.3529, "lr": 3.3433150325155295e-05, "epoch": 1.690632911392405, "percentage": 33.9, "elapsed_time": "9:57:55", "remaining_time": "19:25:43"}
|
| 925 |
+
{"current_steps": 508, "total_steps": 1230, "loss": 0.241, "lr": 2.9203491779722896e-05, "epoch": 2.060759493670886, "percentage": 41.3, "elapsed_time": "12:09:16", "remaining_time": "17:16:29"}
|
| 926 |
+
{"current_steps": 509, "total_steps": 1230, "loss": 0.254, "lr": 2.9153062819496357e-05, "epoch": 2.0648101265822785, "percentage": 41.38, "elapsed_time": "12:10:26", "remaining_time": "17:14:40"}
|
| 927 |
+
{"current_steps": 418, "total_steps": 1230, "loss": 0.3632, "lr": 3.339104595419334e-05, "epoch": 1.6946835443037975, "percentage": 33.98, "elapsed_time": "9:59:19", "remaining_time": "19:24:13"}
|
| 928 |
+
{"current_steps": 510, "total_steps": 1230, "loss": 0.2397, "lr": 2.9102560141760178e-05, "epoch": 2.068860759493671, "percentage": 41.46, "elapsed_time": "12:11:42", "remaining_time": "17:12:59"}
|
| 929 |
+
{"current_steps": 419, "total_steps": 1230, "loss": 0.3522, "lr": 3.3348833733588204e-05, "epoch": 1.6987341772151898, "percentage": 34.07, "elapsed_time": "10:00:50", "remaining_time": "19:22:58"}
|
| 930 |
+
{"current_steps": 511, "total_steps": 1230, "loss": 0.2572, "lr": 2.9051984153256004e-05, "epoch": 2.0729113924050635, "percentage": 41.54, "elapsed_time": "12:13:11", "remaining_time": "17:11:37"}
|
| 931 |
+
{"current_steps": 420, "total_steps": 1230, "loss": 0.3305, "lr": 3.3306514003311305e-05, "epoch": 1.7027848101265821, "percentage": 34.15, "elapsed_time": "10:02:24", "remaining_time": "19:21:46"}
|
| 932 |
+
{"current_steps": 512, "total_steps": 1230, "loss": 0.2628, "lr": 2.900133526131588e-05, "epoch": 2.0769620253164556, "percentage": 41.63, "elapsed_time": "12:14:33", "remaining_time": "17:10:05"}
|
| 933 |
+
{"current_steps": 421, "total_steps": 1230, "loss": 0.3516, "lr": 3.326408710419996e-05, "epoch": 1.7068354430379746, "percentage": 34.23, "elapsed_time": "10:03:36", "remaining_time": "19:19:53"}
|
| 934 |
+
{"current_steps": 422, "total_steps": 1230, "loss": 0.344, "lr": 3.322155337795454e-05, "epoch": 1.7108860759493671, "percentage": 34.31, "elapsed_time": "10:05:03", "remaining_time": "19:18:30"}
|
| 935 |
+
{"current_steps": 513, "total_steps": 1230, "loss": 0.2559, "lr": 2.8950613873859025e-05, "epoch": 2.081012658227848, "percentage": 41.71, "elapsed_time": "12:16:13", "remaining_time": "17:08:59"}
|
| 936 |
+
{"current_steps": 423, "total_steps": 1230, "loss": 0.3429, "lr": 3.317891316713587e-05, "epoch": 1.7149367088607594, "percentage": 34.39, "elapsed_time": "10:06:36", "remaining_time": "19:17:16"}
|
| 937 |
+
{"current_steps": 514, "total_steps": 1230, "loss": 0.2456, "lr": 2.8899820399388515e-05, "epoch": 2.0850632911392406, "percentage": 41.79, "elapsed_time": "12:17:46", "remaining_time": "17:07:43"}
|
| 938 |
+
{"current_steps": 424, "total_steps": 1230, "loss": 0.3387, "lr": 3.313616681516231e-05, "epoch": 1.7189873417721517, "percentage": 34.47, "elapsed_time": "10:08:01", "remaining_time": "19:15:48"}
|
| 939 |
+
{"current_steps": 515, "total_steps": 1230, "loss": 0.2487, "lr": 2.8848955246988012e-05, "epoch": 2.089113924050633, "percentage": 41.87, "elapsed_time": "12:19:23", "remaining_time": "17:06:32"}
|
| 940 |
+
{"current_steps": 425, "total_steps": 1230, "loss": 0.3447, "lr": 3.309331466630713e-05, "epoch": 1.7230379746835442, "percentage": 34.55, "elapsed_time": "10:09:27", "remaining_time": "19:14:22"}
|
| 941 |
+
{"current_steps": 516, "total_steps": 1230, "loss": 0.2345, "lr": 2.879801882631847e-05, "epoch": 2.093164556962025, "percentage": 41.95, "elapsed_time": "12:20:42", "remaining_time": "17:04:55"}
|
| 942 |
+
{"current_steps": 426, "total_steps": 1230, "loss": 0.332, "lr": 3.305035706569563e-05, "epoch": 1.7270886075949368, "percentage": 34.63, "elapsed_time": "10:10:43", "remaining_time": "19:12:37"}
|
| 943 |
+
{"current_steps": 517, "total_steps": 1230, "loss": 0.231, "lr": 2.8747011547614808e-05, "epoch": 2.0972151898734177, "percentage": 42.03, "elapsed_time": "12:21:54", "remaining_time": "17:03:10"}
|
| 944 |
+
{"current_steps": 427, "total_steps": 1230, "loss": 0.3259, "lr": 3.3007294359302433e-05, "epoch": 1.7311392405063293, "percentage": 34.72, "elapsed_time": "10:12:06", "remaining_time": "19:11:06"}
|
| 945 |
+
{"current_steps": 518, "total_steps": 1230, "loss": 0.2557, "lr": 2.8695933821682635e-05, "epoch": 2.1012658227848102, "percentage": 42.11, "elapsed_time": "12:23:30", "remaining_time": "17:01:57"}
|
| 946 |
+
{"current_steps": 428, "total_steps": 1230, "loss": 0.3263, "lr": 3.296412689394864e-05, "epoch": 1.7351898734177216, "percentage": 34.8, "elapsed_time": "10:13:19", "remaining_time": "19:09:16"}
|
| 947 |
+
{"current_steps": 519, "total_steps": 1230, "loss": 0.2393, "lr": 2.864478605989494e-05, "epoch": 2.1053164556962027, "percentage": 42.2, "elapsed_time": "12:24:30", "remaining_time": "16:59:55"}
|
| 948 |
+
{"current_steps": 520, "total_steps": 1230, "loss": 0.2538, "lr": 2.8593568674188765e-05, "epoch": 2.109367088607595, "percentage": 42.28, "elapsed_time": "12:25:50", "remaining_time": "16:58:21"}
|
| 949 |
+
{"current_steps": 429, "total_steps": 1230, "loss": 0.3439, "lr": 3.292085501729909e-05, "epoch": 1.7392405063291139, "percentage": 34.88, "elapsed_time": "10:15:00", "remaining_time": "19:08:17"}
|
| 950 |
+
{"current_steps": 521, "total_steps": 1230, "loss": 0.2301, "lr": 2.8542282077061892e-05, "epoch": 2.1134177215189873, "percentage": 42.36, "elapsed_time": "12:27:07", "remaining_time": "16:56:43"}
|
| 951 |
+
{"current_steps": 430, "total_steps": 1230, "loss": 0.3287, "lr": 3.2877479077859534e-05, "epoch": 1.7432911392405064, "percentage": 34.96, "elapsed_time": "10:16:05", "remaining_time": "19:06:13"}
|
| 952 |
+
{"current_steps": 522, "total_steps": 1230, "loss": 0.2343, "lr": 2.8490926681569523e-05, "epoch": 2.11746835443038, "percentage": 42.44, "elapsed_time": "12:28:24", "remaining_time": "16:55:05"}
|
| 953 |
+
{"current_steps": 431, "total_steps": 1230, "loss": 0.338, "lr": 3.283399942497381e-05, "epoch": 1.747341772151899, "percentage": 35.04, "elapsed_time": "10:17:41", "remaining_time": "19:05:04"}
|
| 954 |
+
{"current_steps": 523, "total_steps": 1230, "loss": 0.2353, "lr": 2.8439502901320956e-05, "epoch": 2.1215189873417724, "percentage": 42.52, "elapsed_time": "12:29:44", "remaining_time": "16:53:31"}
|
| 955 |
+
{"current_steps": 432, "total_steps": 1230, "loss": 0.3405, "lr": 3.279041640882108e-05, "epoch": 1.7513924050632912, "percentage": 35.12, "elapsed_time": "10:19:09", "remaining_time": "19:03:43"}
|
| 956 |
+
{"current_steps": 524, "total_steps": 1230, "loss": 0.2498, "lr": 2.8388011150476237e-05, "epoch": 2.1255696202531644, "percentage": 42.6, "elapsed_time": "12:31:20", "remaining_time": "16:52:18"}
|
| 957 |
+
{"current_steps": 433, "total_steps": 1230, "loss": 0.3378, "lr": 3.2746730380412964e-05, "epoch": 1.7554430379746835, "percentage": 35.2, "elapsed_time": "10:20:39", "remaining_time": "19:02:25"}
|
| 958 |
+
{"current_steps": 525, "total_steps": 1230, "loss": 0.2469, "lr": 2.8336451843742866e-05, "epoch": 2.129620253164557, "percentage": 42.68, "elapsed_time": "12:32:42", "remaining_time": "16:50:46"}
|
| 959 |
+
{"current_steps": 434, "total_steps": 1230, "loss": 0.3362, "lr": 3.2702941691590726e-05, "epoch": 1.759493670886076, "percentage": 35.28, "elapsed_time": "10:22:00", "remaining_time": "19:00:50"}
|
| 960 |
+
{"current_steps": 435, "total_steps": 1230, "loss": 0.3423, "lr": 3.265905069502244e-05, "epoch": 1.7635443037974685, "percentage": 35.37, "elapsed_time": "10:23:15", "remaining_time": "18:59:03"}
|
| 961 |
+
{"current_steps": 526, "total_steps": 1230, "loss": 0.2619, "lr": 2.8284825396372387e-05, "epoch": 2.1336708860759495, "percentage": 42.76, "elapsed_time": "12:34:34", "remaining_time": "16:49:56"}
|
| 962 |
+
{"current_steps": 436, "total_steps": 1230, "loss": 0.3525, "lr": 3.261505774420016e-05, "epoch": 1.7675949367088608, "percentage": 35.45, "elapsed_time": "10:24:43", "remaining_time": "18:57:41"}
|
| 963 |
+
{"current_steps": 527, "total_steps": 1230, "loss": 0.2611, "lr": 2.8233132224157132e-05, "epoch": 2.137721518987342, "percentage": 42.85, "elapsed_time": "12:35:57", "remaining_time": "16:48:24"}
|
| 964 |
+
{"current_steps": 528, "total_steps": 1230, "loss": 0.2462, "lr": 2.8181372743426805e-05, "epoch": 2.141772151898734, "percentage": 42.93, "elapsed_time": "12:37:09", "remaining_time": "16:46:40"}
|
| 965 |
+
{"current_steps": 437, "total_steps": 1230, "loss": 0.3393, "lr": 3.257096319343707e-05, "epoch": 1.771645569620253, "percentage": 35.53, "elapsed_time": "10:26:13", "remaining_time": "18:56:22"}
|
| 966 |
+
{"current_steps": 529, "total_steps": 1230, "loss": 0.2554, "lr": 2.8129547371045128e-05, "epoch": 2.1458227848101266, "percentage": 43.01, "elapsed_time": "12:38:26", "remaining_time": "16:45:02"}
|
| 967 |
+
{"current_steps": 438, "total_steps": 1230, "loss": 0.3373, "lr": 3.2526767397864614e-05, "epoch": 1.7756962025316456, "percentage": 35.61, "elapsed_time": "10:27:25", "remaining_time": "18:54:31"}
|
| 968 |
+
{"current_steps": 530, "total_steps": 1230, "loss": 0.2575, "lr": 2.8077656524406534e-05, "epoch": 2.149873417721519, "percentage": 43.09, "elapsed_time": "12:39:49", "remaining_time": "16:43:32"}
|
| 969 |
+
{"current_steps": 439, "total_steps": 1230, "loss": 0.3282, "lr": 3.248247071342966e-05, "epoch": 1.7797468354430381, "percentage": 35.69, "elapsed_time": "10:28:42", "remaining_time": "18:52:48"}
|
| 970 |
+
{"current_steps": 440, "total_steps": 1230, "loss": 0.3371, "lr": 3.243807349689161e-05, "epoch": 1.7837974683544304, "percentage": 35.77, "elapsed_time": "10:30:09", "remaining_time": "18:51:25"}
|
| 971 |
+
{"current_steps": 531, "total_steps": 1230, "loss": 0.2513, "lr": 2.802570062143278e-05, "epoch": 2.1539240506329116, "percentage": 43.17, "elapsed_time": "12:41:19", "remaining_time": "16:42:11"}
|
| 972 |
+
{"current_steps": 532, "total_steps": 1230, "loss": 0.2279, "lr": 2.7973680080569555e-05, "epoch": 2.1579746835443037, "percentage": 43.25, "elapsed_time": "12:42:31", "remaining_time": "16:40:26"}
|
| 973 |
+
{"current_steps": 441, "total_steps": 1230, "loss": 0.3569, "lr": 3.2393576105819544e-05, "epoch": 1.7878481012658227, "percentage": 35.85, "elapsed_time": "10:31:32", "remaining_time": "18:49:54"}
|
| 974 |
+
{"current_steps": 533, "total_steps": 1230, "loss": 0.2369, "lr": 2.792159532078314e-05, "epoch": 2.162025316455696, "percentage": 43.33, "elapsed_time": "12:43:43", "remaining_time": "16:38:42"}
|
| 975 |
+
{"current_steps": 442, "total_steps": 1230, "loss": 0.3287, "lr": 3.2348978898589333e-05, "epoch": 1.7918987341772152, "percentage": 35.93, "elapsed_time": "10:32:48", "remaining_time": "18:48:11"}
|
| 976 |
+
{"current_steps": 534, "total_steps": 1230, "loss": 0.2375, "lr": 2.7869446761557033e-05, "epoch": 2.1660759493670887, "percentage": 43.41, "elapsed_time": "12:44:45", "remaining_time": "16:36:46"}
|
| 977 |
+
{"current_steps": 443, "total_steps": 1230, "loss": 0.3336, "lr": 3.230428223438075e-05, "epoch": 1.7959493670886078, "percentage": 36.02, "elapsed_time": "10:34:05", "remaining_time": "18:46:29"}
|
| 978 |
+
{"current_steps": 535, "total_steps": 1230, "loss": 0.2475, "lr": 2.781723482288857e-05, "epoch": 2.170126582278481, "percentage": 43.5, "elapsed_time": "12:46:00", "remaining_time": "16:35:06"}
|
| 979 |
+
{"current_steps": 444, "total_steps": 1230, "loss": 0.3715, "lr": 3.225948647317459e-05, "epoch": 1.8, "percentage": 36.1, "elapsed_time": "10:35:41", "remaining_time": "18:45:21"}
|
| 980 |
+
{"current_steps": 536, "total_steps": 1230, "loss": 0.2655, "lr": 2.7764959925285517e-05, "epoch": 2.1741772151898733, "percentage": 43.58, "elapsed_time": "12:47:13", "remaining_time": "16:33:22"}
|
| 981 |
+
{"current_steps": 445, "total_steps": 1230, "loss": 0.3352, "lr": 3.2214591975749745e-05, "epoch": 1.8040506329113923, "percentage": 36.18, "elapsed_time": "10:37:12", "remaining_time": "18:44:03"}
|
| 982 |
+
{"current_steps": 537, "total_steps": 1230, "loss": 0.2565, "lr": 2.771262248976272e-05, "epoch": 2.178227848101266, "percentage": 43.66, "elapsed_time": "12:48:30", "remaining_time": "16:31:45"}
|
| 983 |
+
{"current_steps": 446, "total_steps": 1230, "loss": 0.355, "lr": 3.216959910368034e-05, "epoch": 1.8081012658227849, "percentage": 36.26, "elapsed_time": "10:38:36", "remaining_time": "18:42:33"}
|
| 984 |
+
{"current_steps": 538, "total_steps": 1230, "loss": 0.2595, "lr": 2.7660222937838677e-05, "epoch": 2.1822784810126583, "percentage": 43.74, "elapsed_time": "12:49:55", "remaining_time": "16:30:18"}
|
| 985 |
+
{"current_steps": 447, "total_steps": 1230, "loss": 0.3326, "lr": 3.212450821933277e-05, "epoch": 1.8121518987341774, "percentage": 36.34, "elapsed_time": "10:39:32", "remaining_time": "18:40:15"}
|
| 986 |
+
{"current_steps": 539, "total_steps": 1230, "loss": 0.2415, "lr": 2.7607761691532186e-05, "epoch": 2.186329113924051, "percentage": 43.82, "elapsed_time": "12:51:07", "remaining_time": "16:28:35"}
|
| 987 |
+
{"current_steps": 448, "total_steps": 1230, "loss": 0.3498, "lr": 3.207931968586281e-05, "epoch": 1.8162025316455697, "percentage": 36.42, "elapsed_time": "10:40:51", "remaining_time": "18:38:37"}
|
| 988 |
+
{"current_steps": 540, "total_steps": 1230, "loss": 0.2382, "lr": 2.7555239173358916e-05, "epoch": 2.190379746835443, "percentage": 43.9, "elapsed_time": "12:52:28", "remaining_time": "16:27:03"}
|
| 989 |
+
{"current_steps": 449, "total_steps": 1230, "loss": 0.3327, "lr": 3.203403386721272e-05, "epoch": 1.820253164556962, "percentage": 36.5, "elapsed_time": "10:42:19", "remaining_time": "18:37:16"}
|
| 990 |
+
{"current_steps": 541, "total_steps": 1230, "loss": 0.2588, "lr": 2.7502655806328e-05, "epoch": 2.1944303797468354, "percentage": 43.98, "elapsed_time": "12:53:56", "remaining_time": "16:25:39"}
|
| 991 |
+
{"current_steps": 450, "total_steps": 1230, "loss": 0.3498, "lr": 3.1988651128108245e-05, "epoch": 1.8243037974683545, "percentage": 36.59, "elapsed_time": "10:43:40", "remaining_time": "18:35:41"}
|
| 992 |
+
{"current_steps": 542, "total_steps": 1230, "loss": 0.2502, "lr": 2.7450012013938648e-05, "epoch": 2.198481012658228, "percentage": 44.07, "elapsed_time": "12:55:13", "remaining_time": "16:24:03"}
|
| 993 |
+
{"current_steps": 451, "total_steps": 1230, "loss": 0.3419, "lr": 3.194317183405573e-05, "epoch": 1.828354430379747, "percentage": 36.67, "elapsed_time": "10:44:54", "remaining_time": "18:33:55"}
|
| 994 |
+
{"current_steps": 543, "total_steps": 1230, "loss": 0.239, "lr": 2.739730822017673e-05, "epoch": 2.2025316455696204, "percentage": 44.15, "elapsed_time": "12:56:25", "remaining_time": "16:22:19"}
|
| 995 |
+
{"current_steps": 452, "total_steps": 1230, "loss": 0.3469, "lr": 3.189759635133914e-05, "epoch": 1.8324050632911393, "percentage": 36.75, "elapsed_time": "10:46:34", "remaining_time": "18:32:54"}
|
| 996 |
+
{"current_steps": 544, "total_steps": 1230, "loss": 0.2371, "lr": 2.7344544849511355e-05, "epoch": 2.2065822784810125, "percentage": 44.23, "elapsed_time": "12:57:53", "remaining_time": "16:20:56"}
|
| 997 |
+
{"current_steps": 453, "total_steps": 1230, "loss": 0.3325, "lr": 3.185192504701718e-05, "epoch": 1.8364556962025316, "percentage": 36.83, "elapsed_time": "10:47:51", "remaining_time": "18:31:14"}
|
| 998 |
+
{"current_steps": 545, "total_steps": 1230, "loss": 0.2607, "lr": 2.7291722326891456e-05, "epoch": 2.210632911392405, "percentage": 44.31, "elapsed_time": "12:59:08", "remaining_time": "16:19:17"}
|
| 999 |
+
{"current_steps": 454, "total_steps": 1230, "loss": 0.3341, "lr": 3.1806158288920234e-05, "epoch": 1.840506329113924, "percentage": 36.91, "elapsed_time": "10:49:06", "remaining_time": "18:29:29"}
|
| 1000 |
+
{"current_steps": 546, "total_steps": 1230, "loss": 0.2484, "lr": 2.723884107774236e-05, "epoch": 2.2146835443037975, "percentage": 44.39, "elapsed_time": "13:00:23", "remaining_time": "16:17:37"}
|
| 1001 |
+
{"current_steps": 455, "total_steps": 1230, "loss": 0.3381, "lr": 3.1760296445647477e-05, "epoch": 1.8445569620253166, "percentage": 36.99, "elapsed_time": "10:50:32", "remaining_time": "18:28:03"}
|
| 1002 |
+
{"current_steps": 547, "total_steps": 1230, "loss": 0.2722, "lr": 2.718590152796239e-05, "epoch": 2.21873417721519, "percentage": 44.47, "elapsed_time": "13:01:53", "remaining_time": "16:16:17"}
|
| 1003 |
+
{"current_steps": 456, "total_steps": 1230, "loss": 0.3313, "lr": 3.1714339886563896e-05, "epoch": 1.848607594936709, "percentage": 37.07, "elapsed_time": "10:51:42", "remaining_time": "18:26:11"}
|
| 1004 |
+
{"current_steps": 548, "total_steps": 1230, "loss": 0.2216, "lr": 2.71329041039194e-05, "epoch": 2.222784810126582, "percentage": 44.55, "elapsed_time": "13:02:52", "remaining_time": "16:14:18"}
|
| 1005 |
+
{"current_steps": 549, "total_steps": 1230, "loss": 0.2348, "lr": 2.7079849232447357e-05, "epoch": 2.2268354430379746, "percentage": 44.63, "elapsed_time": "13:04:18", "remaining_time": "16:12:52"}
|
| 1006 |
+
{"current_steps": 457, "total_steps": 1230, "loss": 0.3346, "lr": 3.166828898179731e-05, "epoch": 1.8526582278481012, "percentage": 37.15, "elapsed_time": "10:53:18", "remaining_time": "18:25:02"}
|
| 1007 |
+
{"current_steps": 458, "total_steps": 1230, "loss": 0.3167, "lr": 3.162214410223536e-05, "epoch": 1.8567088607594937, "percentage": 37.24, "elapsed_time": "10:54:18", "remaining_time": "18:22:54"}
|
| 1008 |
+
{"current_steps": 550, "total_steps": 1230, "loss": 0.2518, "lr": 2.7026737340842895e-05, "epoch": 2.230886075949367, "percentage": 44.72, "elapsed_time": "13:05:35", "remaining_time": "16:11:16"}
|
| 1009 |
+
{"current_steps": 459, "total_steps": 1230, "loss": 0.3382, "lr": 3.157590561952257e-05, "epoch": 1.8607594936708862, "percentage": 37.32, "elapsed_time": "10:55:35", "remaining_time": "18:21:13"}
|
| 1010 |
+
{"current_steps": 551, "total_steps": 1230, "loss": 0.2496, "lr": 2.697356885686189e-05, "epoch": 2.2349367088607597, "percentage": 44.8, "elapsed_time": "13:06:55", "remaining_time": "16:09:43"}
|
| 1011 |
+
{"current_steps": 460, "total_steps": 1230, "loss": 0.3496, "lr": 3.152957390605732e-05, "epoch": 1.8648101265822785, "percentage": 37.4, "elapsed_time": "10:56:41", "remaining_time": "18:19:14"}
|
| 1012 |
+
{"current_steps": 552, "total_steps": 1230, "loss": 0.2286, "lr": 2.6920344208716014e-05, "epoch": 2.2389873417721518, "percentage": 44.88, "elapsed_time": "13:08:06", "remaining_time": "16:07:59"}
|
| 1013 |
+
{"current_steps": 461, "total_steps": 1230, "loss": 0.3483, "lr": 3.148314933498886e-05, "epoch": 1.8688607594936708, "percentage": 37.48, "elapsed_time": "10:57:57", "remaining_time": "18:17:33"}
|
| 1014 |
+
{"current_steps": 553, "total_steps": 1230, "loss": 0.25, "lr": 2.6867063825069252e-05, "epoch": 2.2430379746835443, "percentage": 44.96, "elapsed_time": "13:09:17", "remaining_time": "16:06:16"}
|
| 1015 |
+
{"current_steps": 462, "total_steps": 1230, "loss": 0.336, "lr": 3.143663228021431e-05, "epoch": 1.8729113924050633, "percentage": 37.56, "elapsed_time": "10:59:28", "remaining_time": "18:16:16"}
|
| 1016 |
+
{"current_steps": 554, "total_steps": 1230, "loss": 0.2651, "lr": 2.6813728135034494e-05, "epoch": 2.247088607594937, "percentage": 45.04, "elapsed_time": "13:10:44", "remaining_time": "16:04:52"}
|
| 1017 |
+
{"current_steps": 555, "total_steps": 1230, "loss": 0.2323, "lr": 2.6760337568170056e-05, "epoch": 2.2511392405063293, "percentage": 45.12, "elapsed_time": "13:11:56", "remaining_time": "16:03:10"}
|
| 1018 |
+
{"current_steps": 463, "total_steps": 1230, "loss": 0.3547, "lr": 3.1390023116375624e-05, "epoch": 1.8769620253164558, "percentage": 37.64, "elapsed_time": "11:00:55", "remaining_time": "18:14:53"}
|
| 1019 |
+
{"current_steps": 556, "total_steps": 1230, "loss": 0.2354, "lr": 2.6706892554476226e-05, "epoch": 2.2551898734177214, "percentage": 45.2, "elapsed_time": "13:13:06", "remaining_time": "16:01:25"}
|
| 1020 |
+
{"current_steps": 464, "total_steps": 1230, "loss": 0.348, "lr": 3.134332221885661e-05, "epoch": 1.8810126582278481, "percentage": 37.72, "elapsed_time": "11:02:24", "remaining_time": "18:13:33"}
|
| 1021 |
+
{"current_steps": 557, "total_steps": 1230, "loss": 0.2367, "lr": 2.6653393524391795e-05, "epoch": 2.259240506329114, "percentage": 45.28, "elapsed_time": "13:14:33", "remaining_time": "16:00:01"}
|
| 1022 |
+
{"current_steps": 465, "total_steps": 1230, "loss": 0.3503, "lr": 3.129652996377987e-05, "epoch": 1.8850632911392404, "percentage": 37.8, "elapsed_time": "11:03:47", "remaining_time": "18:12:02"}
|
| 1023 |
+
{"current_steps": 558, "total_steps": 1230, "loss": 0.2472, "lr": 2.6599840908790592e-05, "epoch": 2.2632911392405064, "percentage": 45.37, "elapsed_time": "13:15:55", "remaining_time": "15:58:32"}
|
| 1024 |
+
{"current_steps": 466, "total_steps": 1230, "loss": 0.3189, "lr": 3.12496467280038e-05, "epoch": 1.889113924050633, "percentage": 37.89, "elapsed_time": "11:05:13", "remaining_time": "18:10:37"}
|
| 1025 |
+
{"current_steps": 467, "total_steps": 1230, "loss": 0.3401, "lr": 3.120267288911952e-05, "epoch": 1.8931645569620255, "percentage": 37.97, "elapsed_time": "11:06:12", "remaining_time": "18:08:28"}
|
| 1026 |
+
{"current_steps": 559, "total_steps": 1230, "loss": 0.2575, "lr": 2.6546235138978028e-05, "epoch": 2.267341772151899, "percentage": 45.45, "elapsed_time": "13:17:25", "remaining_time": "15:57:11"}
|
| 1027 |
+
{"current_steps": 468, "total_steps": 1230, "loss": 0.3315, "lr": 3.11556088254479e-05, "epoch": 1.8972151898734178, "percentage": 38.05, "elapsed_time": "11:07:21", "remaining_time": "18:06:36"}
|
| 1028 |
+
{"current_steps": 560, "total_steps": 1230, "loss": 0.2529, "lr": 2.6492576646687597e-05, "epoch": 2.271392405063291, "percentage": 45.53, "elapsed_time": "13:18:56", "remaining_time": "15:55:52"}
|
| 1029 |
+
{"current_steps": 469, "total_steps": 1230, "loss": 0.3445, "lr": 3.11084549160364e-05, "epoch": 1.90126582278481, "percentage": 38.13, "elapsed_time": "11:08:40", "remaining_time": "18:04:59"}
|
| 1030 |
+
{"current_steps": 561, "total_steps": 1230, "loss": 0.2467, "lr": 2.6438865864077425e-05, "epoch": 2.2754430379746835, "percentage": 45.61, "elapsed_time": "13:20:14", "remaining_time": "15:54:18"}
|
| 1031 |
+
{"current_steps": 470, "total_steps": 1230, "loss": 0.3304, "lr": 3.106121154065615e-05, "epoch": 1.9053164556962026, "percentage": 38.21, "elapsed_time": "11:10:08", "remaining_time": "18:03:37"}
|
| 1032 |
+
{"current_steps": 562, "total_steps": 1230, "loss": 0.2373, "lr": 2.6385103223726766e-05, "epoch": 2.279493670886076, "percentage": 45.69, "elapsed_time": "13:21:19", "remaining_time": "15:52:28"}
|
| 1033 |
+
{"current_steps": 471, "total_steps": 1230, "loss": 0.3532, "lr": 3.1013879079798805e-05, "epoch": 1.909367088607595, "percentage": 38.29, "elapsed_time": "11:11:35", "remaining_time": "18:02:14"}
|
| 1034 |
+
{"current_steps": 563, "total_steps": 1230, "loss": 0.2347, "lr": 2.6331289158632537e-05, "epoch": 2.2835443037974685, "percentage": 45.77, "elapsed_time": "13:22:47", "remaining_time": "15:51:04"}
|
| 1035 |
+
{"current_steps": 564, "total_steps": 1230, "loss": 0.261, "lr": 2.6277424102205817e-05, "epoch": 2.2875949367088606, "percentage": 45.85, "elapsed_time": "13:24:13", "remaining_time": "15:49:40"}
|
| 1036 |
+
{"current_steps": 472, "total_steps": 1230, "loss": 0.3438, "lr": 3.096645791467348e-05, "epoch": 1.9134177215189874, "percentage": 38.37, "elapsed_time": "11:13:11", "remaining_time": "18:01:05"}
|
| 1037 |
+
{"current_steps": 473, "total_steps": 1230, "loss": 0.321, "lr": 3.091894842720373e-05, "epoch": 1.9174683544303797, "percentage": 38.46, "elapsed_time": "11:14:21", "remaining_time": "17:59:15"}
|
| 1038 |
+
{"current_steps": 565, "total_steps": 1230, "loss": 0.2518, "lr": 2.6223508488268374e-05, "epoch": 2.291645569620253, "percentage": 45.93, "elapsed_time": "13:25:40", "remaining_time": "15:48:15"}
|
| 1039 |
+
{"current_steps": 474, "total_steps": 1230, "loss": 0.3296, "lr": 3.0871351000024425e-05, "epoch": 1.9215189873417722, "percentage": 38.54, "elapsed_time": "11:15:54", "remaining_time": "17:58:01"}
|
| 1040 |
+
{"current_steps": 566, "total_steps": 1230, "loss": 0.2513, "lr": 2.6169542751049148e-05, "epoch": 2.2956962025316456, "percentage": 46.02, "elapsed_time": "13:27:12", "remaining_time": "15:46:57"}
|
| 1041 |
+
{"current_steps": 475, "total_steps": 1230, "loss": 0.3308, "lr": 3.0823666016478716e-05, "epoch": 1.9255696202531647, "percentage": 38.62, "elapsed_time": "11:17:09", "remaining_time": "17:56:19"}
|
| 1042 |
+
{"current_steps": 567, "total_steps": 1230, "loss": 0.2717, "lr": 2.6115527325180754e-05, "epoch": 2.299746835443038, "percentage": 46.1, "elapsed_time": "13:28:43", "remaining_time": "15:45:39"}
|
| 1043 |
+
{"current_steps": 476, "total_steps": 1230, "loss": 0.331, "lr": 3.0775893860614896e-05, "epoch": 1.929620253164557, "percentage": 38.7, "elapsed_time": "11:18:31", "remaining_time": "17:54:49"}
|
| 1044 |
+
{"current_steps": 568, "total_steps": 1230, "loss": 0.2444, "lr": 2.606146264569603e-05, "epoch": 2.3037974683544302, "percentage": 46.18, "elapsed_time": "13:30:17", "remaining_time": "15:44:23"}
|
| 1045 |
+
{"current_steps": 477, "total_steps": 1230, "loss": 0.3349, "lr": 3.0728034917183336e-05, "epoch": 1.9336708860759493, "percentage": 38.78, "elapsed_time": "11:20:01", "remaining_time": "17:53:29"}
|
| 1046 |
+
{"current_steps": 569, "total_steps": 1230, "loss": 0.2469, "lr": 2.6007349148024447e-05, "epoch": 2.3078481012658227, "percentage": 46.26, "elapsed_time": "13:31:37", "remaining_time": "15:42:51"}
|
| 1047 |
+
{"current_steps": 478, "total_steps": 1230, "loss": 0.3508, "lr": 3.06800895716334e-05, "epoch": 1.9377215189873418, "percentage": 38.86, "elapsed_time": "11:21:17", "remaining_time": "17:51:49"}
|
| 1048 |
+
{"current_steps": 570, "total_steps": 1230, "loss": 0.2434, "lr": 2.5953187267988694e-05, "epoch": 2.3118987341772153, "percentage": 46.34, "elapsed_time": "13:32:59", "remaining_time": "15:41:21"}
|
| 1049 |
+
{"current_steps": 479, "total_steps": 1230, "loss": 0.3305, "lr": 3.063205821011029e-05, "epoch": 1.9417721518987343, "percentage": 38.94, "elapsed_time": "11:22:38", "remaining_time": "17:50:16"}
|
| 1050 |
+
{"current_steps": 571, "total_steps": 1230, "loss": 0.255, "lr": 2.5898977441801097e-05, "epoch": 2.3159493670886078, "percentage": 46.42, "elapsed_time": "13:34:17", "remaining_time": "15:39:47"}
|
| 1051 |
+
{"current_steps": 480, "total_steps": 1230, "loss": 0.3493, "lr": 3.0583941219452016e-05, "epoch": 1.9458227848101266, "percentage": 39.02, "elapsed_time": "11:24:14", "remaining_time": "17:49:07"}
|
| 1052 |
+
{"current_steps": 572, "total_steps": 1230, "loss": 0.2811, "lr": 2.584472010606015e-05, "epoch": 2.32, "percentage": 46.5, "elapsed_time": "13:36:08", "remaining_time": "15:38:50"}
|
| 1053 |
+
{"current_steps": 481, "total_steps": 1230, "loss": 0.3309, "lr": 3.053573898718618e-05, "epoch": 1.949873417721519, "percentage": 39.11, "elapsed_time": "11:25:31", "remaining_time": "17:47:29"}
|
| 1054 |
+
{"current_steps": 573, "total_steps": 1230, "loss": 0.2387, "lr": 2.5790415697746976e-05, "epoch": 2.3240506329113924, "percentage": 46.59, "elapsed_time": "13:37:19", "remaining_time": "15:37:08"}
|
| 1055 |
+
{"current_steps": 482, "total_steps": 1230, "loss": 0.3251, "lr": 3.0487451901526956e-05, "epoch": 1.9539240506329114, "percentage": 39.19, "elapsed_time": "11:26:57", "remaining_time": "17:46:04"}
|
| 1056 |
+
{"current_steps": 574, "total_steps": 1230, "loss": 0.2416, "lr": 2.5736064654221808e-05, "epoch": 2.328101265822785, "percentage": 46.67, "elapsed_time": "13:38:31", "remaining_time": "15:35:27"}
|
| 1057 |
+
{"current_steps": 483, "total_steps": 1230, "loss": 0.3379, "lr": 3.0439080351371875e-05, "epoch": 1.957974683544304, "percentage": 39.27, "elapsed_time": "11:28:14", "remaining_time": "17:44:26"}
|
| 1058 |
+
{"current_steps": 575, "total_steps": 1230, "loss": 0.2363, "lr": 2.568166741322048e-05, "epoch": 2.3321518987341774, "percentage": 46.75, "elapsed_time": "13:39:45", "remaining_time": "15:33:48"}
|
| 1059 |
+
{"current_steps": 484, "total_steps": 1230, "loss": 0.3385, "lr": 3.0390624726298764e-05, "epoch": 1.9620253164556962, "percentage": 39.35, "elapsed_time": "11:29:27", "remaining_time": "17:42:41"}
|
| 1060 |
+
{"current_steps": 576, "total_steps": 1230, "loss": 0.266, "lr": 2.56272244128509e-05, "epoch": 2.3362025316455695, "percentage": 46.83, "elapsed_time": "13:41:14", "remaining_time": "15:32:27"}
|
| 1061 |
+
{"current_steps": 485, "total_steps": 1230, "loss": 0.3474, "lr": 3.034208541656255e-05, "epoch": 1.9660759493670885, "percentage": 39.43, "elapsed_time": "11:31:02", "remaining_time": "17:41:30"}
|
| 1062 |
+
{"current_steps": 577, "total_steps": 1230, "loss": 0.2456, "lr": 2.55727360915895e-05, "epoch": 2.340253164556962, "percentage": 46.91, "elapsed_time": "13:42:34", "remaining_time": "15:30:55"}
|
| 1063 |
+
{"current_steps": 486, "total_steps": 1230, "loss": 0.3383, "lr": 3.029346281309218e-05, "epoch": 1.970126582278481, "percentage": 39.51, "elapsed_time": "11:32:27", "remaining_time": "17:40:03"}
|
| 1064 |
+
{"current_steps": 578, "total_steps": 1230, "loss": 0.2597, "lr": 2.5518202888277734e-05, "epoch": 2.3443037974683545, "percentage": 46.99, "elapsed_time": "13:43:53", "remaining_time": "15:29:22"}
|
| 1065 |
+
{"current_steps": 487, "total_steps": 1230, "loss": 0.3433, "lr": 3.0244757307487415e-05, "epoch": 1.9741772151898735, "percentage": 39.59, "elapsed_time": "11:33:53", "remaining_time": "17:38:38"}
|
| 1066 |
+
{"current_steps": 579, "total_steps": 1230, "loss": 0.2498, "lr": 2.5463625242118523e-05, "epoch": 2.348354430379747, "percentage": 47.07, "elapsed_time": "13:45:29", "remaining_time": "15:28:09"}
|
| 1067 |
+
{"current_steps": 488, "total_steps": 1230, "loss": 0.3508, "lr": 3.019596929201569e-05, "epoch": 1.9782278481012658, "percentage": 39.67, "elapsed_time": "11:35:12", "remaining_time": "17:37:04"}
|
| 1068 |
+
{"current_steps": 580, "total_steps": 1230, "loss": 0.2589, "lr": 2.5409003592672723e-05, "epoch": 2.352405063291139, "percentage": 47.15, "elapsed_time": "13:46:56", "remaining_time": "15:26:44"}
|
| 1069 |
+
{"current_steps": 489, "total_steps": 1230, "loss": 0.3548, "lr": 3.0147099159608985e-05, "epoch": 1.9822784810126581, "percentage": 39.76, "elapsed_time": "11:36:47", "remaining_time": "17:35:51"}
|
| 1070 |
+
{"current_steps": 581, "total_steps": 1230, "loss": 0.2528, "lr": 2.535433837985559e-05, "epoch": 2.3564556962025316, "percentage": 47.24, "elapsed_time": "13:48:05", "remaining_time": "15:25:00"}
|
| 1071 |
+
{"current_steps": 490, "total_steps": 1230, "loss": 0.3251, "lr": 3.0098147303860616e-05, "epoch": 1.9863291139240506, "percentage": 39.84, "elapsed_time": "11:38:03", "remaining_time": "17:34:11"}
|
| 1072 |
+
{"current_steps": 582, "total_steps": 1230, "loss": 0.2622, "lr": 2.529963004393324e-05, "epoch": 2.360506329113924, "percentage": 47.32, "elapsed_time": "13:49:32", "remaining_time": "15:23:36"}
|
| 1073 |
+
{"current_steps": 491, "total_steps": 1230, "loss": 0.3407, "lr": 3.0049114119022117e-05, "epoch": 1.9903797468354432, "percentage": 39.92, "elapsed_time": "11:39:17", "remaining_time": "17:32:29"}
|
| 1074 |
+
{"current_steps": 583, "total_steps": 1230, "loss": 0.2424, "lr": 2.524487902551908e-05, "epoch": 2.3645569620253166, "percentage": 47.4, "elapsed_time": "13:50:50", "remaining_time": "15:22:02"}
|
| 1075 |
+
{"current_steps": 492, "total_steps": 1230, "loss": 0.3289, "lr": 3.0000000000000004e-05, "epoch": 1.9944303797468355, "percentage": 40.0, "elapsed_time": "11:40:33", "remaining_time": "17:30:50"}
|
| 1076 |
+
{"current_steps": 584, "total_steps": 1230, "loss": 0.2423, "lr": 2.519008576557029e-05, "epoch": 2.3686075949367087, "percentage": 47.48, "elapsed_time": "13:52:10", "remaining_time": "15:20:30"}
|
| 1077 |
+
{"current_steps": 493, "total_steps": 1230, "loss": 0.3549, "lr": 2.995080534235264e-05, "epoch": 1.9984810126582278, "percentage": 40.08, "elapsed_time": "11:42:13", "remaining_time": "17:29:46"}
|
| 1078 |
+
{"current_steps": 585, "total_steps": 1230, "loss": 0.2867, "lr": 2.5135250705384254e-05, "epoch": 2.372658227848101, "percentage": 47.56, "elapsed_time": "13:53:54", "remaining_time": "15:19:25"}
|
| 1079 |
+
{"current_steps": 586, "total_steps": 1230, "loss": 0.2476, "lr": 2.5080374286595007e-05, "epoch": 2.3767088607594937, "percentage": 47.64, "elapsed_time": "13:55:27", "remaining_time": "15:18:08"}
|
| 1080 |
+
{"current_steps": 494, "total_steps": 1230, "loss": 0.2467, "lr": 2.9901530542287044e-05, "epoch": 2.0040506329113925, "percentage": 40.16, "elapsed_time": "11:44:53", "remaining_time": "17:30:12"}
|
| 1081 |
+
{"current_steps": 587, "total_steps": 1230, "loss": 0.2562, "lr": 2.5025456951169677e-05, "epoch": 2.3807594936708862, "percentage": 47.72, "elapsed_time": "13:56:50", "remaining_time": "15:16:40"}
|
| 1082 |
+
{"current_steps": 495, "total_steps": 1230, "loss": 0.2658, "lr": 2.9852175996655676e-05, "epoch": 2.008101265822785, "percentage": 40.24, "elapsed_time": "11:46:23", "remaining_time": "17:28:53"}
|
| 1083 |
+
{"current_steps": 588, "total_steps": 1230, "loss": 0.2393, "lr": 2.4970499141404942e-05, "epoch": 2.3848101265822783, "percentage": 47.8, "elapsed_time": "13:58:01", "remaining_time": "15:14:58"}
|
| 1084 |
+
{"current_steps": 496, "total_steps": 1230, "loss": 0.2479, "lr": 2.980274210295326e-05, "epoch": 2.012151898734177, "percentage": 40.33, "elapsed_time": "11:47:43", "remaining_time": "17:27:19"}
|
| 1085 |
+
{"current_steps": 589, "total_steps": 1230, "loss": 0.2506, "lr": 2.491550129992345e-05, "epoch": 2.388860759493671, "percentage": 47.89, "elapsed_time": "13:59:28", "remaining_time": "15:13:35"}
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7288
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbfe2753ce890402118e13912d3877e6acebdd7767919752be931aea1065b060
|
| 3 |
size 7288
|