sedrickkeh
commited on
Commit
•
0de8233
1
Parent(s):
1b0a94e
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d78bdd1ce9243b007e37a2e15d2dd11ab1640ec958e842455be29d81fb41088
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1008f4134d79dabbad3958dded8f4a61d8aca02d3d07b39b9e6282c7897fdeb
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abf9e08fbc39abdef89de979395c7490295c8ec7b2ed12724651334c1771b7b1
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0c8e2a489a2c3a17c8ea89f222f5443abee7dd65ea8ec27ae2c36c6541e1974
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -175,3 +175,91 @@
|
|
175 |
{"current_steps": 1740, "total_steps": 2631, "loss": 0.5835, "learning_rate": 5e-06, "epoch": 1.982905982905983, "percentage": 66.13, "elapsed_time": "12:51:23", "remaining_time": "6:35:00"}
|
176 |
{"current_steps": 1750, "total_steps": 2631, "loss": 0.5823, "learning_rate": 5e-06, "epoch": 1.9943019943019942, "percentage": 66.51, "elapsed_time": "12:55:47", "remaining_time": "6:30:33"}
|
177 |
{"current_steps": 1755, "total_steps": 2631, "eval_loss": 0.6174917817115784, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "13:05:18", "remaining_time": "6:31:59"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
175 |
{"current_steps": 1740, "total_steps": 2631, "loss": 0.5835, "learning_rate": 5e-06, "epoch": 1.982905982905983, "percentage": 66.13, "elapsed_time": "12:51:23", "remaining_time": "6:35:00"}
|
176 |
{"current_steps": 1750, "total_steps": 2631, "loss": 0.5823, "learning_rate": 5e-06, "epoch": 1.9943019943019942, "percentage": 66.51, "elapsed_time": "12:55:47", "remaining_time": "6:30:33"}
|
177 |
{"current_steps": 1755, "total_steps": 2631, "eval_loss": 0.6174917817115784, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "13:05:18", "remaining_time": "6:31:59"}
|
178 |
+
{"current_steps": 1760, "total_steps": 2631, "loss": 0.6003, "learning_rate": 5e-06, "epoch": 2.005698005698006, "percentage": 66.89, "elapsed_time": "13:08:40", "remaining_time": "6:30:18"}
|
179 |
+
{"current_steps": 1770, "total_steps": 2631, "loss": 0.5295, "learning_rate": 5e-06, "epoch": 2.017094017094017, "percentage": 67.27, "elapsed_time": "13:13:03", "remaining_time": "6:25:46"}
|
180 |
+
{"current_steps": 1780, "total_steps": 2631, "loss": 0.5396, "learning_rate": 5e-06, "epoch": 2.0284900284900287, "percentage": 67.65, "elapsed_time": "13:17:26", "remaining_time": "6:21:14"}
|
181 |
+
{"current_steps": 1790, "total_steps": 2631, "loss": 0.5498, "learning_rate": 5e-06, "epoch": 2.03988603988604, "percentage": 68.03, "elapsed_time": "13:21:50", "remaining_time": "6:16:43"}
|
182 |
+
{"current_steps": 1800, "total_steps": 2631, "loss": 0.5485, "learning_rate": 5e-06, "epoch": 2.051282051282051, "percentage": 68.42, "elapsed_time": "13:26:12", "remaining_time": "6:12:12"}
|
183 |
+
{"current_steps": 1810, "total_steps": 2631, "loss": 0.5443, "learning_rate": 5e-06, "epoch": 2.0626780626780628, "percentage": 68.8, "elapsed_time": "13:30:36", "remaining_time": "6:07:40"}
|
184 |
+
{"current_steps": 1820, "total_steps": 2631, "loss": 0.5499, "learning_rate": 5e-06, "epoch": 2.074074074074074, "percentage": 69.18, "elapsed_time": "13:34:59", "remaining_time": "6:03:09"}
|
185 |
+
{"current_steps": 1830, "total_steps": 2631, "loss": 0.5472, "learning_rate": 5e-06, "epoch": 2.0854700854700856, "percentage": 69.56, "elapsed_time": "13:39:22", "remaining_time": "5:58:38"}
|
186 |
+
{"current_steps": 1840, "total_steps": 2631, "loss": 0.5557, "learning_rate": 5e-06, "epoch": 2.096866096866097, "percentage": 69.94, "elapsed_time": "13:43:46", "remaining_time": "5:54:07"}
|
187 |
+
{"current_steps": 1850, "total_steps": 2631, "loss": 0.5423, "learning_rate": 5e-06, "epoch": 2.1082621082621085, "percentage": 70.32, "elapsed_time": "13:48:09", "remaining_time": "5:49:37"}
|
188 |
+
{"current_steps": 1860, "total_steps": 2631, "loss": 0.5556, "learning_rate": 5e-06, "epoch": 2.1196581196581197, "percentage": 70.7, "elapsed_time": "13:52:32", "remaining_time": "5:45:06"}
|
189 |
+
{"current_steps": 1870, "total_steps": 2631, "loss": 0.5464, "learning_rate": 5e-06, "epoch": 2.131054131054131, "percentage": 71.08, "elapsed_time": "13:56:55", "remaining_time": "5:40:35"}
|
190 |
+
{"current_steps": 1880, "total_steps": 2631, "loss": 0.5459, "learning_rate": 5e-06, "epoch": 2.1424501424501425, "percentage": 71.46, "elapsed_time": "14:01:19", "remaining_time": "5:36:04"}
|
191 |
+
{"current_steps": 1890, "total_steps": 2631, "loss": 0.5432, "learning_rate": 5e-06, "epoch": 2.1538461538461537, "percentage": 71.84, "elapsed_time": "14:05:41", "remaining_time": "5:31:34"}
|
192 |
+
{"current_steps": 1900, "total_steps": 2631, "loss": 0.5434, "learning_rate": 5e-06, "epoch": 2.1652421652421654, "percentage": 72.22, "elapsed_time": "14:10:05", "remaining_time": "5:27:03"}
|
193 |
+
{"current_steps": 1910, "total_steps": 2631, "loss": 0.548, "learning_rate": 5e-06, "epoch": 2.1766381766381766, "percentage": 72.6, "elapsed_time": "14:14:28", "remaining_time": "5:22:33"}
|
194 |
+
{"current_steps": 1920, "total_steps": 2631, "loss": 0.551, "learning_rate": 5e-06, "epoch": 2.1880341880341883, "percentage": 72.98, "elapsed_time": "14:18:52", "remaining_time": "5:18:03"}
|
195 |
+
{"current_steps": 1930, "total_steps": 2631, "loss": 0.5487, "learning_rate": 5e-06, "epoch": 2.1994301994301995, "percentage": 73.36, "elapsed_time": "14:23:16", "remaining_time": "5:13:33"}
|
196 |
+
{"current_steps": 1940, "total_steps": 2631, "loss": 0.5518, "learning_rate": 5e-06, "epoch": 2.2108262108262107, "percentage": 73.74, "elapsed_time": "14:27:40", "remaining_time": "5:09:03"}
|
197 |
+
{"current_steps": 1950, "total_steps": 2631, "loss": 0.5455, "learning_rate": 5e-06, "epoch": 2.2222222222222223, "percentage": 74.12, "elapsed_time": "14:32:03", "remaining_time": "5:04:32"}
|
198 |
+
{"current_steps": 1960, "total_steps": 2631, "loss": 0.5371, "learning_rate": 5e-06, "epoch": 2.2336182336182335, "percentage": 74.5, "elapsed_time": "14:36:27", "remaining_time": "5:00:03"}
|
199 |
+
{"current_steps": 1970, "total_steps": 2631, "loss": 0.548, "learning_rate": 5e-06, "epoch": 2.245014245014245, "percentage": 74.88, "elapsed_time": "14:40:50", "remaining_time": "4:55:33"}
|
200 |
+
{"current_steps": 1980, "total_steps": 2631, "loss": 0.5489, "learning_rate": 5e-06, "epoch": 2.2564102564102564, "percentage": 75.26, "elapsed_time": "14:45:14", "remaining_time": "4:51:03"}
|
201 |
+
{"current_steps": 1990, "total_steps": 2631, "loss": 0.5452, "learning_rate": 5e-06, "epoch": 2.267806267806268, "percentage": 75.64, "elapsed_time": "14:49:36", "remaining_time": "4:46:33"}
|
202 |
+
{"current_steps": 2000, "total_steps": 2631, "loss": 0.5506, "learning_rate": 5e-06, "epoch": 2.2792022792022792, "percentage": 76.02, "elapsed_time": "14:53:59", "remaining_time": "4:42:03"}
|
203 |
+
{"current_steps": 2010, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.2905982905982905, "percentage": 76.4, "elapsed_time": "14:58:23", "remaining_time": "4:37:33"}
|
204 |
+
{"current_steps": 2020, "total_steps": 2631, "loss": 0.5447, "learning_rate": 5e-06, "epoch": 2.301994301994302, "percentage": 76.78, "elapsed_time": "15:02:47", "remaining_time": "4:33:04"}
|
205 |
+
{"current_steps": 2030, "total_steps": 2631, "loss": 0.5533, "learning_rate": 5e-06, "epoch": 2.3133903133903133, "percentage": 77.16, "elapsed_time": "15:07:09", "remaining_time": "4:28:34"}
|
206 |
+
{"current_steps": 2040, "total_steps": 2631, "loss": 0.5493, "learning_rate": 5e-06, "epoch": 2.324786324786325, "percentage": 77.54, "elapsed_time": "15:11:32", "remaining_time": "4:24:04"}
|
207 |
+
{"current_steps": 2050, "total_steps": 2631, "loss": 0.5484, "learning_rate": 5e-06, "epoch": 2.336182336182336, "percentage": 77.92, "elapsed_time": "15:15:55", "remaining_time": "4:19:35"}
|
208 |
+
{"current_steps": 2060, "total_steps": 2631, "loss": 0.5561, "learning_rate": 5e-06, "epoch": 2.347578347578348, "percentage": 78.3, "elapsed_time": "15:20:19", "remaining_time": "4:15:05"}
|
209 |
+
{"current_steps": 2070, "total_steps": 2631, "loss": 0.5479, "learning_rate": 5e-06, "epoch": 2.358974358974359, "percentage": 78.68, "elapsed_time": "15:24:41", "remaining_time": "4:10:36"}
|
210 |
+
{"current_steps": 2080, "total_steps": 2631, "loss": 0.5482, "learning_rate": 5e-06, "epoch": 2.3703703703703702, "percentage": 79.06, "elapsed_time": "15:29:04", "remaining_time": "4:06:06"}
|
211 |
+
{"current_steps": 2090, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.381766381766382, "percentage": 79.44, "elapsed_time": "15:33:27", "remaining_time": "4:01:37"}
|
212 |
+
{"current_steps": 2100, "total_steps": 2631, "loss": 0.5475, "learning_rate": 5e-06, "epoch": 2.393162393162393, "percentage": 79.82, "elapsed_time": "15:37:50", "remaining_time": "3:57:08"}
|
213 |
+
{"current_steps": 2110, "total_steps": 2631, "loss": 0.564, "learning_rate": 5e-06, "epoch": 2.4045584045584047, "percentage": 80.2, "elapsed_time": "15:42:12", "remaining_time": "3:52:39"}
|
214 |
+
{"current_steps": 2120, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.415954415954416, "percentage": 80.58, "elapsed_time": "15:46:36", "remaining_time": "3:48:10"}
|
215 |
+
{"current_steps": 2130, "total_steps": 2631, "loss": 0.56, "learning_rate": 5e-06, "epoch": 2.427350427350427, "percentage": 80.96, "elapsed_time": "15:50:59", "remaining_time": "3:43:41"}
|
216 |
+
{"current_steps": 2140, "total_steps": 2631, "loss": 0.5592, "learning_rate": 5e-06, "epoch": 2.438746438746439, "percentage": 81.34, "elapsed_time": "15:55:23", "remaining_time": "3:39:12"}
|
217 |
+
{"current_steps": 2150, "total_steps": 2631, "loss": 0.5633, "learning_rate": 5e-06, "epoch": 2.45014245014245, "percentage": 81.72, "elapsed_time": "15:59:47", "remaining_time": "3:34:43"}
|
218 |
+
{"current_steps": 2160, "total_steps": 2631, "loss": 0.5488, "learning_rate": 5e-06, "epoch": 2.4615384615384617, "percentage": 82.1, "elapsed_time": "16:04:11", "remaining_time": "3:30:14"}
|
219 |
+
{"current_steps": 2170, "total_steps": 2631, "loss": 0.5513, "learning_rate": 5e-06, "epoch": 2.472934472934473, "percentage": 82.48, "elapsed_time": "16:08:35", "remaining_time": "3:25:46"}
|
220 |
+
{"current_steps": 2180, "total_steps": 2631, "loss": 0.5554, "learning_rate": 5e-06, "epoch": 2.484330484330484, "percentage": 82.86, "elapsed_time": "16:12:59", "remaining_time": "3:21:17"}
|
221 |
+
{"current_steps": 2190, "total_steps": 2631, "loss": 0.5574, "learning_rate": 5e-06, "epoch": 2.4957264957264957, "percentage": 83.24, "elapsed_time": "16:17:23", "remaining_time": "3:16:49"}
|
222 |
+
{"current_steps": 2200, "total_steps": 2631, "loss": 0.5629, "learning_rate": 5e-06, "epoch": 2.5071225071225074, "percentage": 83.62, "elapsed_time": "16:21:46", "remaining_time": "3:12:20"}
|
223 |
+
{"current_steps": 2210, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.5185185185185186, "percentage": 84.0, "elapsed_time": "16:26:09", "remaining_time": "3:07:51"}
|
224 |
+
{"current_steps": 2220, "total_steps": 2631, "loss": 0.5591, "learning_rate": 5e-06, "epoch": 2.52991452991453, "percentage": 84.38, "elapsed_time": "16:30:33", "remaining_time": "3:03:23"}
|
225 |
+
{"current_steps": 2230, "total_steps": 2631, "loss": 0.5513, "learning_rate": 5e-06, "epoch": 2.5413105413105415, "percentage": 84.76, "elapsed_time": "16:34:57", "remaining_time": "2:58:54"}
|
226 |
+
{"current_steps": 2240, "total_steps": 2631, "loss": 0.5501, "learning_rate": 5e-06, "epoch": 2.5527065527065527, "percentage": 85.14, "elapsed_time": "16:39:20", "remaining_time": "2:54:26"}
|
227 |
+
{"current_steps": 2250, "total_steps": 2631, "loss": 0.5488, "learning_rate": 5e-06, "epoch": 2.564102564102564, "percentage": 85.52, "elapsed_time": "16:43:44", "remaining_time": "2:49:58"}
|
228 |
+
{"current_steps": 2260, "total_steps": 2631, "loss": 0.5534, "learning_rate": 5e-06, "epoch": 2.5754985754985755, "percentage": 85.9, "elapsed_time": "16:48:07", "remaining_time": "2:45:29"}
|
229 |
+
{"current_steps": 2270, "total_steps": 2631, "loss": 0.5509, "learning_rate": 5e-06, "epoch": 2.5868945868945867, "percentage": 86.28, "elapsed_time": "16:52:30", "remaining_time": "2:41:01"}
|
230 |
+
{"current_steps": 2280, "total_steps": 2631, "loss": 0.5515, "learning_rate": 5e-06, "epoch": 2.5982905982905984, "percentage": 86.66, "elapsed_time": "16:56:54", "remaining_time": "2:36:33"}
|
231 |
+
{"current_steps": 2290, "total_steps": 2631, "loss": 0.5567, "learning_rate": 5e-06, "epoch": 2.6096866096866096, "percentage": 87.04, "elapsed_time": "17:01:18", "remaining_time": "2:32:04"}
|
232 |
+
{"current_steps": 2300, "total_steps": 2631, "loss": 0.5429, "learning_rate": 5e-06, "epoch": 2.6210826210826212, "percentage": 87.42, "elapsed_time": "17:05:40", "remaining_time": "2:27:36"}
|
233 |
+
{"current_steps": 2310, "total_steps": 2631, "loss": 0.553, "learning_rate": 5e-06, "epoch": 2.6324786324786325, "percentage": 87.8, "elapsed_time": "17:10:03", "remaining_time": "2:23:08"}
|
234 |
+
{"current_steps": 2320, "total_steps": 2631, "loss": 0.5524, "learning_rate": 5e-06, "epoch": 2.6438746438746437, "percentage": 88.18, "elapsed_time": "17:14:27", "remaining_time": "2:18:40"}
|
235 |
+
{"current_steps": 2330, "total_steps": 2631, "loss": 0.5552, "learning_rate": 5e-06, "epoch": 2.6552706552706553, "percentage": 88.56, "elapsed_time": "17:18:51", "remaining_time": "2:14:12"}
|
236 |
+
{"current_steps": 2340, "total_steps": 2631, "loss": 0.5534, "learning_rate": 5e-06, "epoch": 2.6666666666666665, "percentage": 88.94, "elapsed_time": "17:23:14", "remaining_time": "2:09:44"}
|
237 |
+
{"current_steps": 2350, "total_steps": 2631, "loss": 0.5467, "learning_rate": 5e-06, "epoch": 2.678062678062678, "percentage": 89.32, "elapsed_time": "17:27:37", "remaining_time": "2:05:16"}
|
238 |
+
{"current_steps": 2360, "total_steps": 2631, "loss": 0.5565, "learning_rate": 5e-06, "epoch": 2.6894586894586894, "percentage": 89.7, "elapsed_time": "17:32:00", "remaining_time": "2:00:48"}
|
239 |
+
{"current_steps": 2370, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.700854700854701, "percentage": 90.08, "elapsed_time": "17:36:24", "remaining_time": "1:56:20"}
|
240 |
+
{"current_steps": 2380, "total_steps": 2631, "loss": 0.5563, "learning_rate": 5e-06, "epoch": 2.7122507122507122, "percentage": 90.46, "elapsed_time": "17:40:48", "remaining_time": "1:51:52"}
|
241 |
+
{"current_steps": 2390, "total_steps": 2631, "loss": 0.5551, "learning_rate": 5e-06, "epoch": 2.7236467236467234, "percentage": 90.84, "elapsed_time": "17:45:11", "remaining_time": "1:47:24"}
|
242 |
+
{"current_steps": 2400, "total_steps": 2631, "loss": 0.5539, "learning_rate": 5e-06, "epoch": 2.735042735042735, "percentage": 91.22, "elapsed_time": "17:49:34", "remaining_time": "1:42:56"}
|
243 |
+
{"current_steps": 2410, "total_steps": 2631, "loss": 0.5588, "learning_rate": 5e-06, "epoch": 2.7464387464387463, "percentage": 91.6, "elapsed_time": "17:53:57", "remaining_time": "1:38:28"}
|
244 |
+
{"current_steps": 2420, "total_steps": 2631, "loss": 0.5575, "learning_rate": 5e-06, "epoch": 2.757834757834758, "percentage": 91.98, "elapsed_time": "17:58:20", "remaining_time": "1:34:01"}
|
245 |
+
{"current_steps": 2430, "total_steps": 2631, "loss": 0.5471, "learning_rate": 5e-06, "epoch": 2.769230769230769, "percentage": 92.36, "elapsed_time": "18:02:43", "remaining_time": "1:29:33"}
|
246 |
+
{"current_steps": 2440, "total_steps": 2631, "loss": 0.5468, "learning_rate": 5e-06, "epoch": 2.780626780626781, "percentage": 92.74, "elapsed_time": "18:07:05", "remaining_time": "1:25:05"}
|
247 |
+
{"current_steps": 2450, "total_steps": 2631, "loss": 0.5501, "learning_rate": 5e-06, "epoch": 2.792022792022792, "percentage": 93.12, "elapsed_time": "18:11:29", "remaining_time": "1:20:38"}
|
248 |
+
{"current_steps": 2460, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.8034188034188032, "percentage": 93.5, "elapsed_time": "18:15:53", "remaining_time": "1:16:10"}
|
249 |
+
{"current_steps": 2470, "total_steps": 2631, "loss": 0.5601, "learning_rate": 5e-06, "epoch": 2.814814814814815, "percentage": 93.88, "elapsed_time": "18:20:16", "remaining_time": "1:11:43"}
|
250 |
+
{"current_steps": 2480, "total_steps": 2631, "loss": 0.5623, "learning_rate": 5e-06, "epoch": 2.826210826210826, "percentage": 94.26, "elapsed_time": "18:24:38", "remaining_time": "1:07:15"}
|
251 |
+
{"current_steps": 2490, "total_steps": 2631, "loss": 0.5543, "learning_rate": 5e-06, "epoch": 2.8376068376068377, "percentage": 94.64, "elapsed_time": "18:29:02", "remaining_time": "1:02:48"}
|
252 |
+
{"current_steps": 2500, "total_steps": 2631, "loss": 0.562, "learning_rate": 5e-06, "epoch": 2.849002849002849, "percentage": 95.02, "elapsed_time": "18:33:25", "remaining_time": "0:58:20"}
|
253 |
+
{"current_steps": 2510, "total_steps": 2631, "loss": 0.5536, "learning_rate": 5e-06, "epoch": 2.8603988603988606, "percentage": 95.4, "elapsed_time": "18:37:48", "remaining_time": "0:53:53"}
|
254 |
+
{"current_steps": 2520, "total_steps": 2631, "loss": 0.5539, "learning_rate": 5e-06, "epoch": 2.871794871794872, "percentage": 95.78, "elapsed_time": "18:42:12", "remaining_time": "0:49:25"}
|
255 |
+
{"current_steps": 2530, "total_steps": 2631, "loss": 0.5601, "learning_rate": 5e-06, "epoch": 2.883190883190883, "percentage": 96.16, "elapsed_time": "18:46:36", "remaining_time": "0:44:58"}
|
256 |
+
{"current_steps": 2540, "total_steps": 2631, "loss": 0.5557, "learning_rate": 5e-06, "epoch": 2.8945868945868947, "percentage": 96.54, "elapsed_time": "18:50:59", "remaining_time": "0:40:31"}
|
257 |
+
{"current_steps": 2550, "total_steps": 2631, "loss": 0.5528, "learning_rate": 5e-06, "epoch": 2.905982905982906, "percentage": 96.92, "elapsed_time": "18:55:22", "remaining_time": "0:36:03"}
|
258 |
+
{"current_steps": 2560, "total_steps": 2631, "loss": 0.5416, "learning_rate": 5e-06, "epoch": 2.9173789173789175, "percentage": 97.3, "elapsed_time": "18:59:45", "remaining_time": "0:31:36"}
|
259 |
+
{"current_steps": 2570, "total_steps": 2631, "loss": 0.5471, "learning_rate": 5e-06, "epoch": 2.9287749287749287, "percentage": 97.68, "elapsed_time": "19:04:09", "remaining_time": "0:27:09"}
|
260 |
+
{"current_steps": 2580, "total_steps": 2631, "loss": 0.5438, "learning_rate": 5e-06, "epoch": 2.9401709401709404, "percentage": 98.06, "elapsed_time": "19:08:33", "remaining_time": "0:22:42"}
|
261 |
+
{"current_steps": 2590, "total_steps": 2631, "loss": 0.5533, "learning_rate": 5e-06, "epoch": 2.9515669515669516, "percentage": 98.44, "elapsed_time": "19:12:56", "remaining_time": "0:18:15"}
|
262 |
+
{"current_steps": 2600, "total_steps": 2631, "loss": 0.5446, "learning_rate": 5e-06, "epoch": 2.962962962962963, "percentage": 98.82, "elapsed_time": "19:17:19", "remaining_time": "0:13:47"}
|
263 |
+
{"current_steps": 2610, "total_steps": 2631, "loss": 0.556, "learning_rate": 5e-06, "epoch": 2.9743589743589745, "percentage": 99.2, "elapsed_time": "19:21:43", "remaining_time": "0:09:20"}
|
264 |
+
{"current_steps": 2620, "total_steps": 2631, "loss": 0.5571, "learning_rate": 5e-06, "epoch": 2.9857549857549857, "percentage": 99.58, "elapsed_time": "19:26:07", "remaining_time": "0:04:53"}
|
265 |
+
{"current_steps": 2630, "total_steps": 2631, "loss": 0.5443, "learning_rate": 5e-06, "epoch": 2.9971509971509973, "percentage": 99.96, "elapsed_time": "19:30:29", "remaining_time": "0:00:26"}
|