File size: 123,383 Bytes
16bdc67
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
{"current_steps": 1, "total_steps": 501, "loss": 5.1027, "learning_rate": 0.0, "epoch": 0.001996007984031936, "percentage": 0.2, "elapsed_time": "0:00:06", "remaining_time": "0:52:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2, "total_steps": 501, "loss": 5.1552, "learning_rate": 5.017166594399687e-06, "epoch": 0.003992015968063872, "percentage": 0.4, "elapsed_time": "0:00:08", "remaining_time": "0:36:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3, "total_steps": 501, "loss": 5.1408, "learning_rate": 7.952020911994375e-06, "epoch": 0.005988023952095809, "percentage": 0.6, "elapsed_time": "0:00:11", "remaining_time": "0:30:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4, "total_steps": 501, "loss": 3.2825, "learning_rate": 1.0034333188799373e-05, "epoch": 0.007984031936127744, "percentage": 0.8, "elapsed_time": "0:00:13", "remaining_time": "0:27:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5, "total_steps": 501, "loss": 2.5601, "learning_rate": 1.164950007226698e-05, "epoch": 0.00998003992015968, "percentage": 1.0, "elapsed_time": "0:00:15", "remaining_time": "0:25:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 6, "total_steps": 501, "loss": 1.994, "learning_rate": 1.2969187506394062e-05, "epoch": 0.011976047904191617, "percentage": 1.2, "elapsed_time": "0:00:18", "remaining_time": "0:24:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 7, "total_steps": 501, "loss": 1.8568, "learning_rate": 1.4084967333570947e-05, "epoch": 0.013972055888223553, "percentage": 1.4, "elapsed_time": "0:00:20", "remaining_time": "0:23:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 8, "total_steps": 501, "loss": 1.59, "learning_rate": 1.505149978319906e-05, "epoch": 0.015968063872255488, "percentage": 1.6, "elapsed_time": "0:00:22", "remaining_time": "0:23:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 9, "total_steps": 501, "loss": 1.3238, "learning_rate": 1.590404182398875e-05, "epoch": 0.017964071856287425, "percentage": 1.8, "elapsed_time": "0:00:25", "remaining_time": "0:22:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 10, "total_steps": 501, "loss": 1.267, "learning_rate": 1.666666666666667e-05, "epoch": 0.01996007984031936, "percentage": 2.0, "elapsed_time": "0:00:27", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 11, "total_steps": 501, "loss": 1.2438, "learning_rate": 1.7356544752637084e-05, "epoch": 0.021956087824351298, "percentage": 2.2, "elapsed_time": "0:00:29", "remaining_time": "0:22:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 12, "total_steps": 501, "loss": 1.1196, "learning_rate": 1.7986354100793748e-05, "epoch": 0.023952095808383235, "percentage": 2.4, "elapsed_time": "0:00:32", "remaining_time": "0:21:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 13, "total_steps": 501, "loss": 1.0148, "learning_rate": 1.8565722538447282e-05, "epoch": 0.02594810379241517, "percentage": 2.59, "elapsed_time": "0:00:34", "remaining_time": "0:21:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 14, "total_steps": 501, "loss": 1.0081, "learning_rate": 1.9102133927970633e-05, "epoch": 0.027944111776447105, "percentage": 2.79, "elapsed_time": "0:00:36", "remaining_time": "0:21:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 15, "total_steps": 501, "loss": 0.9228, "learning_rate": 1.9601520984261358e-05, "epoch": 0.029940119760479042, "percentage": 2.99, "elapsed_time": "0:00:39", "remaining_time": "0:21:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 16, "total_steps": 501, "loss": 0.8351, "learning_rate": 2.0068666377598747e-05, "epoch": 0.031936127744510975, "percentage": 3.19, "elapsed_time": "0:00:41", "remaining_time": "0:20:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 17, "total_steps": 501, "loss": 0.8303, "learning_rate": 2.0507482022971233e-05, "epoch": 0.033932135728542916, "percentage": 3.39, "elapsed_time": "0:00:43", "remaining_time": "0:20:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 18, "total_steps": 501, "loss": 0.7769, "learning_rate": 2.0921208418388435e-05, "epoch": 0.03592814371257485, "percentage": 3.59, "elapsed_time": "0:00:46", "remaining_time": "0:20:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 19, "total_steps": 501, "loss": 0.8032, "learning_rate": 2.1312560015880482e-05, "epoch": 0.03792415169660679, "percentage": 3.79, "elapsed_time": "0:00:48", "remaining_time": "0:20:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 501, "loss": 0.7759, "learning_rate": 2.1683833261066357e-05, "epoch": 0.03992015968063872, "percentage": 3.99, "elapsed_time": "0:00:50", "remaining_time": "0:20:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 21, "total_steps": 501, "loss": 0.7805, "learning_rate": 2.2036988245565324e-05, "epoch": 0.041916167664670656, "percentage": 4.19, "elapsed_time": "0:00:53", "remaining_time": "0:20:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 22, "total_steps": 501, "loss": 0.735, "learning_rate": 2.2373711347036773e-05, "epoch": 0.043912175648702596, "percentage": 4.39, "elapsed_time": "0:00:55", "remaining_time": "0:20:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 23, "total_steps": 501, "loss": 0.6523, "learning_rate": 2.269546393362655e-05, "epoch": 0.04590818363273453, "percentage": 4.59, "elapsed_time": "0:00:57", "remaining_time": "0:19:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 24, "total_steps": 501, "loss": 0.6623, "learning_rate": 2.3003520695193437e-05, "epoch": 0.04790419161676647, "percentage": 4.79, "elapsed_time": "0:01:00", "remaining_time": "0:19:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 25, "total_steps": 501, "loss": 0.6503, "learning_rate": 2.329900014453396e-05, "epoch": 0.0499001996007984, "percentage": 4.99, "elapsed_time": "0:01:02", "remaining_time": "0:19:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 26, "total_steps": 501, "loss": 0.636, "learning_rate": 2.3582889132846968e-05, "epoch": 0.05189620758483034, "percentage": 5.19, "elapsed_time": "0:01:04", "remaining_time": "0:19:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 27, "total_steps": 501, "loss": 0.7242, "learning_rate": 2.3856062735983123e-05, "epoch": 0.05389221556886228, "percentage": 5.39, "elapsed_time": "0:01:07", "remaining_time": "0:19:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 28, "total_steps": 501, "loss": 0.5819, "learning_rate": 2.4119300522370322e-05, "epoch": 0.05588822355289421, "percentage": 5.59, "elapsed_time": "0:01:09", "remaining_time": "0:19:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 29, "total_steps": 501, "loss": 0.6788, "learning_rate": 2.4373299964982603e-05, "epoch": 0.05788423153692615, "percentage": 5.79, "elapsed_time": "0:01:11", "remaining_time": "0:19:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 501, "loss": 0.7346, "learning_rate": 2.4618687578661044e-05, "epoch": 0.059880239520958084, "percentage": 5.99, "elapsed_time": "0:01:14", "remaining_time": "0:19:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 31, "total_steps": 501, "loss": 0.4835, "learning_rate": 2.4856028230571212e-05, "epoch": 0.06187624750499002, "percentage": 6.19, "elapsed_time": "0:01:16", "remaining_time": "0:19:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 32, "total_steps": 501, "loss": 0.6537, "learning_rate": 2.5085832971998436e-05, "epoch": 0.06387225548902195, "percentage": 6.39, "elapsed_time": "0:01:18", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 33, "total_steps": 501, "loss": 0.6633, "learning_rate": 2.530856566463146e-05, "epoch": 0.0658682634730539, "percentage": 6.59, "elapsed_time": "0:01:21", "remaining_time": "0:19:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 34, "total_steps": 501, "loss": 0.6268, "learning_rate": 2.552464861737092e-05, "epoch": 0.06786427145708583, "percentage": 6.79, "elapsed_time": "0:01:23", "remaining_time": "0:19:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 35, "total_steps": 501, "loss": 0.6355, "learning_rate": 2.5734467405837933e-05, "epoch": 0.06986027944111776, "percentage": 6.99, "elapsed_time": "0:01:25", "remaining_time": "0:19:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 36, "total_steps": 501, "loss": 0.6168, "learning_rate": 2.5938375012788124e-05, "epoch": 0.0718562874251497, "percentage": 7.19, "elapsed_time": "0:01:28", "remaining_time": "0:18:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 37, "total_steps": 501, "loss": 0.6583, "learning_rate": 2.6136695401116585e-05, "epoch": 0.07385229540918163, "percentage": 7.39, "elapsed_time": "0:01:30", "remaining_time": "0:18:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 38, "total_steps": 501, "loss": 0.565, "learning_rate": 2.6329726610280168e-05, "epoch": 0.07584830339321358, "percentage": 7.58, "elapsed_time": "0:01:32", "remaining_time": "0:18:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 39, "total_steps": 501, "loss": 0.6409, "learning_rate": 2.651774345044166e-05, "epoch": 0.07784431137724551, "percentage": 7.78, "elapsed_time": "0:01:35", "remaining_time": "0:18:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 501, "loss": 0.5335, "learning_rate": 2.6700999855466042e-05, "epoch": 0.07984031936127745, "percentage": 7.98, "elapsed_time": "0:01:37", "remaining_time": "0:18:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 41, "total_steps": 501, "loss": 0.4502, "learning_rate": 2.687973094532893e-05, "epoch": 0.08183632734530938, "percentage": 8.18, "elapsed_time": "0:01:39", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 42, "total_steps": 501, "loss": 0.607, "learning_rate": 2.7054154839965013e-05, "epoch": 0.08383233532934131, "percentage": 8.38, "elapsed_time": "0:01:42", "remaining_time": "0:18:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 43, "total_steps": 501, "loss": 0.5033, "learning_rate": 2.722447425965978e-05, "epoch": 0.08582834331337326, "percentage": 8.58, "elapsed_time": "0:01:44", "remaining_time": "0:18:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 44, "total_steps": 501, "loss": 0.5956, "learning_rate": 2.739087794143646e-05, "epoch": 0.08782435129740519, "percentage": 8.78, "elapsed_time": "0:01:46", "remaining_time": "0:18:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 45, "total_steps": 501, "loss": 0.575, "learning_rate": 2.755354189625573e-05, "epoch": 0.08982035928143713, "percentage": 8.98, "elapsed_time": "0:01:49", "remaining_time": "0:18:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 46, "total_steps": 501, "loss": 0.6473, "learning_rate": 2.771263052802624e-05, "epoch": 0.09181636726546906, "percentage": 9.18, "elapsed_time": "0:01:51", "remaining_time": "0:18:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 47, "total_steps": 501, "loss": 0.6273, "learning_rate": 2.7868297632261957e-05, "epoch": 0.09381237524950099, "percentage": 9.38, "elapsed_time": "0:01:53", "remaining_time": "0:18:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 48, "total_steps": 501, "loss": 0.618, "learning_rate": 2.8020687289593123e-05, "epoch": 0.09580838323353294, "percentage": 9.58, "elapsed_time": "0:01:56", "remaining_time": "0:18:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 49, "total_steps": 501, "loss": 0.625, "learning_rate": 2.8169934667141895e-05, "epoch": 0.09780439121756487, "percentage": 9.78, "elapsed_time": "0:01:58", "remaining_time": "0:18:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 501, "loss": 0.6372, "learning_rate": 2.8316166738933646e-05, "epoch": 0.0998003992015968, "percentage": 9.98, "elapsed_time": "0:02:00", "remaining_time": "0:18:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 51, "total_steps": 501, "loss": 0.539, "learning_rate": 2.845950293496561e-05, "epoch": 0.10179640718562874, "percentage": 10.18, "elapsed_time": "0:02:03", "remaining_time": "0:18:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 52, "total_steps": 501, "loss": 0.388, "learning_rate": 2.8600055727246657e-05, "epoch": 0.10379241516966067, "percentage": 10.38, "elapsed_time": "0:02:05", "remaining_time": "0:18:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 53, "total_steps": 501, "loss": 0.5401, "learning_rate": 2.8737931160013153e-05, "epoch": 0.10578842315369262, "percentage": 10.58, "elapsed_time": "0:02:07", "remaining_time": "0:18:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 54, "total_steps": 501, "loss": 0.5695, "learning_rate": 2.8873229330382812e-05, "epoch": 0.10778443113772455, "percentage": 10.78, "elapsed_time": "0:02:10", "remaining_time": "0:17:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 55, "total_steps": 501, "loss": 0.4986, "learning_rate": 2.9006044824904066e-05, "epoch": 0.10978043912175649, "percentage": 10.98, "elapsed_time": "0:02:12", "remaining_time": "0:17:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 56, "total_steps": 501, "loss": 0.5629, "learning_rate": 2.913646711677001e-05, "epoch": 0.11177644710578842, "percentage": 11.18, "elapsed_time": "0:02:14", "remaining_time": "0:17:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 57, "total_steps": 501, "loss": 0.605, "learning_rate": 2.926458092787486e-05, "epoch": 0.11377245508982035, "percentage": 11.38, "elapsed_time": "0:02:17", "remaining_time": "0:17:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 58, "total_steps": 501, "loss": 0.5247, "learning_rate": 2.939046655938229e-05, "epoch": 0.1157684630738523, "percentage": 11.58, "elapsed_time": "0:02:19", "remaining_time": "0:17:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 59, "total_steps": 501, "loss": 0.5797, "learning_rate": 2.951420019403574e-05, "epoch": 0.11776447105788423, "percentage": 11.78, "elapsed_time": "0:02:21", "remaining_time": "0:17:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 501, "loss": 0.5689, "learning_rate": 2.963585417306073e-05, "epoch": 0.11976047904191617, "percentage": 11.98, "elapsed_time": "0:02:24", "remaining_time": "0:17:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 61, "total_steps": 501, "loss": 0.5559, "learning_rate": 2.9755497250179453e-05, "epoch": 0.1217564870259481, "percentage": 12.18, "elapsed_time": "0:02:26", "remaining_time": "0:17:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 62, "total_steps": 501, "loss": 0.4973, "learning_rate": 2.98731948249709e-05, "epoch": 0.12375249500998003, "percentage": 12.38, "elapsed_time": "0:02:28", "remaining_time": "0:17:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 63, "total_steps": 501, "loss": 0.5439, "learning_rate": 2.9989009157559694e-05, "epoch": 0.12574850299401197, "percentage": 12.57, "elapsed_time": "0:02:31", "remaining_time": "0:17:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 64, "total_steps": 501, "loss": 0.5472, "learning_rate": 3.010299956639812e-05, "epoch": 0.1277445109780439, "percentage": 12.77, "elapsed_time": "0:02:33", "remaining_time": "0:17:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 65, "total_steps": 501, "loss": 0.6008, "learning_rate": 3.021522261071426e-05, "epoch": 0.12974051896207583, "percentage": 12.97, "elapsed_time": "0:02:35", "remaining_time": "0:17:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 66, "total_steps": 501, "loss": 0.4552, "learning_rate": 3.0325732259031143e-05, "epoch": 0.1317365269461078, "percentage": 13.17, "elapsed_time": "0:02:38", "remaining_time": "0:17:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 67, "total_steps": 501, "loss": 0.4661, "learning_rate": 3.043458004501377e-05, "epoch": 0.13373253493013973, "percentage": 13.37, "elapsed_time": "0:02:40", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 68, "total_steps": 501, "loss": 0.4996, "learning_rate": 3.054181521177061e-05, "epoch": 0.13572854291417166, "percentage": 13.57, "elapsed_time": "0:02:42", "remaining_time": "0:17:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 69, "total_steps": 501, "loss": 0.5589, "learning_rate": 3.064748484562093e-05, "epoch": 0.1377245508982036, "percentage": 13.77, "elapsed_time": "0:02:45", "remaining_time": "0:17:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 501, "loss": 0.5948, "learning_rate": 3.0751634000237615e-05, "epoch": 0.13972055888223553, "percentage": 13.97, "elapsed_time": "0:02:47", "remaining_time": "0:17:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 71, "total_steps": 501, "loss": 0.5384, "learning_rate": 3.085430581198459e-05, "epoch": 0.14171656686626746, "percentage": 14.17, "elapsed_time": "0:02:49", "remaining_time": "0:17:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 72, "total_steps": 501, "loss": 0.4915, "learning_rate": 3.095554160718781e-05, "epoch": 0.1437125748502994, "percentage": 14.37, "elapsed_time": "0:02:52", "remaining_time": "0:17:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 73, "total_steps": 501, "loss": 0.5405, "learning_rate": 3.10553810020076e-05, "epoch": 0.14570858283433133, "percentage": 14.57, "elapsed_time": "0:02:54", "remaining_time": "0:17:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 74, "total_steps": 501, "loss": 0.4313, "learning_rate": 3.115386199551628e-05, "epoch": 0.14770459081836326, "percentage": 14.77, "elapsed_time": "0:02:56", "remaining_time": "0:17:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 75, "total_steps": 501, "loss": 0.5154, "learning_rate": 3.1251021056528336e-05, "epoch": 0.1497005988023952, "percentage": 14.97, "elapsed_time": "0:02:59", "remaining_time": "0:16:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 76, "total_steps": 501, "loss": 0.5097, "learning_rate": 3.134689320467986e-05, "epoch": 0.15169660678642716, "percentage": 15.17, "elapsed_time": "0:03:01", "remaining_time": "0:16:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 77, "total_steps": 501, "loss": 0.4365, "learning_rate": 3.144151208620804e-05, "epoch": 0.1536926147704591, "percentage": 15.37, "elapsed_time": "0:03:03", "remaining_time": "0:16:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 78, "total_steps": 501, "loss": 0.5734, "learning_rate": 3.1534910044841344e-05, "epoch": 0.15568862275449102, "percentage": 15.57, "elapsed_time": "0:03:06", "remaining_time": "0:16:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 79, "total_steps": 501, "loss": 0.42, "learning_rate": 3.1627118188174024e-05, "epoch": 0.15768463073852296, "percentage": 15.77, "elapsed_time": "0:03:08", "remaining_time": "0:16:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 501, "loss": 0.4796, "learning_rate": 3.171816644986573e-05, "epoch": 0.1596806387225549, "percentage": 15.97, "elapsed_time": "0:03:10", "remaining_time": "0:16:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 81, "total_steps": 501, "loss": 0.5675, "learning_rate": 3.18080836479775e-05, "epoch": 0.16167664670658682, "percentage": 16.17, "elapsed_time": "0:03:13", "remaining_time": "0:16:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 82, "total_steps": 501, "loss": 0.5183, "learning_rate": 3.1896897539728616e-05, "epoch": 0.16367265469061876, "percentage": 16.37, "elapsed_time": "0:03:15", "remaining_time": "0:16:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 83, "total_steps": 501, "loss": 0.4513, "learning_rate": 3.198463487293457e-05, "epoch": 0.1656686626746507, "percentage": 16.57, "elapsed_time": "0:03:17", "remaining_time": "0:16:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 84, "total_steps": 501, "loss": 0.589, "learning_rate": 3.207132143436469e-05, "epoch": 0.16766467065868262, "percentage": 16.77, "elapsed_time": "0:03:20", "remaining_time": "0:16:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 85, "total_steps": 501, "loss": 0.5101, "learning_rate": 3.215698209523821e-05, "epoch": 0.16966067864271456, "percentage": 16.97, "elapsed_time": "0:03:22", "remaining_time": "0:16:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 86, "total_steps": 501, "loss": 0.4349, "learning_rate": 3.224164085405946e-05, "epoch": 0.17165668662674652, "percentage": 17.17, "elapsed_time": "0:03:24", "remaining_time": "0:16:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 87, "total_steps": 501, "loss": 0.4965, "learning_rate": 3.232532087697698e-05, "epoch": 0.17365269461077845, "percentage": 17.37, "elapsed_time": "0:03:27", "remaining_time": "0:16:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 88, "total_steps": 501, "loss": 0.4444, "learning_rate": 3.240804453583615e-05, "epoch": 0.17564870259481039, "percentage": 17.56, "elapsed_time": "0:03:29", "remaining_time": "0:16:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 89, "total_steps": 501, "loss": 0.4379, "learning_rate": 3.248983344408188e-05, "epoch": 0.17764471057884232, "percentage": 17.76, "elapsed_time": "0:03:31", "remaining_time": "0:16:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 501, "loss": 0.453, "learning_rate": 3.2570708490655414e-05, "epoch": 0.17964071856287425, "percentage": 17.96, "elapsed_time": "0:03:34", "remaining_time": "0:16:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 91, "total_steps": 501, "loss": 0.519, "learning_rate": 3.265068987201822e-05, "epoch": 0.18163672654690619, "percentage": 18.16, "elapsed_time": "0:03:36", "remaining_time": "0:16:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 92, "total_steps": 501, "loss": 0.5112, "learning_rate": 3.2729797122425925e-05, "epoch": 0.18363273453093812, "percentage": 18.36, "elapsed_time": "0:03:38", "remaining_time": "0:16:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 93, "total_steps": 501, "loss": 0.4302, "learning_rate": 3.280804914256559e-05, "epoch": 0.18562874251497005, "percentage": 18.56, "elapsed_time": "0:03:41", "remaining_time": "0:16:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 94, "total_steps": 501, "loss": 0.4814, "learning_rate": 3.288546422666164e-05, "epoch": 0.18762475049900199, "percentage": 18.76, "elapsed_time": "0:03:43", "remaining_time": "0:16:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 95, "total_steps": 501, "loss": 0.5035, "learning_rate": 3.2962060088147464e-05, "epoch": 0.18962075848303392, "percentage": 18.96, "elapsed_time": "0:03:45", "remaining_time": "0:16:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 96, "total_steps": 501, "loss": 0.5718, "learning_rate": 3.3037853883992805e-05, "epoch": 0.19161676646706588, "percentage": 19.16, "elapsed_time": "0:03:48", "remaining_time": "0:16:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 97, "total_steps": 501, "loss": 0.5522, "learning_rate": 3.3112862237770756e-05, "epoch": 0.1936127744510978, "percentage": 19.36, "elapsed_time": "0:03:50", "remaining_time": "0:16:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 98, "total_steps": 501, "loss": 0.5257, "learning_rate": 3.3187101261541584e-05, "epoch": 0.19560878243512975, "percentage": 19.56, "elapsed_time": "0:03:52", "remaining_time": "0:15:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 99, "total_steps": 501, "loss": 0.511, "learning_rate": 3.326058657662584e-05, "epoch": 0.19760479041916168, "percentage": 19.76, "elapsed_time": "0:03:55", "remaining_time": "0:15:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 501, "loss": 0.5182, "learning_rate": 3.333333333333334e-05, "epoch": 0.1996007984031936, "percentage": 19.96, "elapsed_time": "0:03:57", "remaining_time": "0:15:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 101, "total_steps": 501, "loss": 0.4776, "learning_rate": 3.340535622971072e-05, "epoch": 0.20159680638722555, "percentage": 20.16, "elapsed_time": "0:04:30", "remaining_time": "0:17:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 102, "total_steps": 501, "loss": 0.4915, "learning_rate": 3.3476669529365295e-05, "epoch": 0.20359281437125748, "percentage": 20.36, "elapsed_time": "0:04:32", "remaining_time": "0:17:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 103, "total_steps": 501, "loss": 0.3955, "learning_rate": 3.3547287078419544e-05, "epoch": 0.2055888223552894, "percentage": 20.56, "elapsed_time": "0:04:34", "remaining_time": "0:17:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 104, "total_steps": 501, "loss": 0.4132, "learning_rate": 3.361722232164634e-05, "epoch": 0.20758483033932135, "percentage": 20.76, "elapsed_time": "0:04:37", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 105, "total_steps": 501, "loss": 0.5133, "learning_rate": 3.3686488317832306e-05, "epoch": 0.20958083832335328, "percentage": 20.96, "elapsed_time": "0:04:39", "remaining_time": "0:17:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 106, "total_steps": 501, "loss": 0.3898, "learning_rate": 3.375509775441284e-05, "epoch": 0.21157684630738524, "percentage": 21.16, "elapsed_time": "0:04:41", "remaining_time": "0:17:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 107, "total_steps": 501, "loss": 0.4353, "learning_rate": 3.382306296142016e-05, "epoch": 0.21357285429141717, "percentage": 21.36, "elapsed_time": "0:04:44", "remaining_time": "0:17:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 108, "total_steps": 501, "loss": 0.5008, "learning_rate": 3.38903959247825e-05, "epoch": 0.2155688622754491, "percentage": 21.56, "elapsed_time": "0:04:46", "remaining_time": "0:17:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 109, "total_steps": 501, "loss": 0.4203, "learning_rate": 3.395710829901039e-05, "epoch": 0.21756487025948104, "percentage": 21.76, "elapsed_time": "0:04:48", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 501, "loss": 0.4798, "learning_rate": 3.402321141930376e-05, "epoch": 0.21956087824351297, "percentage": 21.96, "elapsed_time": "0:04:51", "remaining_time": "0:17:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 111, "total_steps": 501, "loss": 0.4855, "learning_rate": 3.4088716313110955e-05, "epoch": 0.2215568862275449, "percentage": 22.16, "elapsed_time": "0:04:53", "remaining_time": "0:17:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 112, "total_steps": 501, "loss": 0.4973, "learning_rate": 3.415363371116969e-05, "epoch": 0.22355289421157684, "percentage": 22.36, "elapsed_time": "0:04:55", "remaining_time": "0:17:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 113, "total_steps": 501, "loss": 0.5217, "learning_rate": 3.4217974058057e-05, "epoch": 0.22554890219560877, "percentage": 22.55, "elapsed_time": "0:04:58", "remaining_time": "0:17:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 114, "total_steps": 501, "loss": 0.3906, "learning_rate": 3.428174752227455e-05, "epoch": 0.2275449101796407, "percentage": 22.75, "elapsed_time": "0:05:00", "remaining_time": "0:17:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 115, "total_steps": 501, "loss": 0.4958, "learning_rate": 3.434496400589353e-05, "epoch": 0.22954091816367264, "percentage": 22.95, "elapsed_time": "0:05:03", "remaining_time": "0:16:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 116, "total_steps": 501, "loss": 0.4526, "learning_rate": 3.440763315378198e-05, "epoch": 0.2315369261477046, "percentage": 23.15, "elapsed_time": "0:05:05", "remaining_time": "0:16:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 117, "total_steps": 501, "loss": 0.4559, "learning_rate": 3.446976436243603e-05, "epoch": 0.23353293413173654, "percentage": 23.35, "elapsed_time": "0:05:07", "remaining_time": "0:16:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 118, "total_steps": 501, "loss": 0.5048, "learning_rate": 3.4531366788435425e-05, "epoch": 0.23552894211576847, "percentage": 23.55, "elapsed_time": "0:05:10", "remaining_time": "0:16:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 119, "total_steps": 501, "loss": 0.4128, "learning_rate": 3.459244935654219e-05, "epoch": 0.2375249500998004, "percentage": 23.75, "elapsed_time": "0:05:12", "remaining_time": "0:16:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 501, "loss": 0.4602, "learning_rate": 3.465302076746041e-05, "epoch": 0.23952095808383234, "percentage": 23.95, "elapsed_time": "0:05:14", "remaining_time": "0:16:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 121, "total_steps": 501, "loss": 0.4791, "learning_rate": 3.471308950527417e-05, "epoch": 0.24151696606786427, "percentage": 24.15, "elapsed_time": "0:05:17", "remaining_time": "0:16:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 122, "total_steps": 501, "loss": 0.4741, "learning_rate": 3.477266384457914e-05, "epoch": 0.2435129740518962, "percentage": 24.35, "elapsed_time": "0:05:19", "remaining_time": "0:16:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 123, "total_steps": 501, "loss": 0.4292, "learning_rate": 3.48317518573233e-05, "epoch": 0.24550898203592814, "percentage": 24.55, "elapsed_time": "0:05:21", "remaining_time": "0:16:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 124, "total_steps": 501, "loss": 0.5069, "learning_rate": 3.489036141937059e-05, "epoch": 0.24750499001996007, "percentage": 24.75, "elapsed_time": "0:05:24", "remaining_time": "0:16:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 125, "total_steps": 501, "loss": 0.4823, "learning_rate": 3.494850021680094e-05, "epoch": 0.249500998003992, "percentage": 24.95, "elapsed_time": "0:05:26", "remaining_time": "0:16:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 126, "total_steps": 501, "loss": 0.3732, "learning_rate": 3.500617575195938e-05, "epoch": 0.25149700598802394, "percentage": 25.15, "elapsed_time": "0:05:28", "remaining_time": "0:16:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 127, "total_steps": 501, "loss": 0.4284, "learning_rate": 3.5063395349265945e-05, "epoch": 0.25349301397205587, "percentage": 25.35, "elapsed_time": "0:05:31", "remaining_time": "0:16:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 128, "total_steps": 501, "loss": 0.4322, "learning_rate": 3.5120166160797804e-05, "epoch": 0.2554890219560878, "percentage": 25.55, "elapsed_time": "0:05:33", "remaining_time": "0:16:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 129, "total_steps": 501, "loss": 0.4465, "learning_rate": 3.517649517165415e-05, "epoch": 0.25748502994011974, "percentage": 25.75, "elapsed_time": "0:05:35", "remaining_time": "0:16:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 501, "loss": 0.4093, "learning_rate": 3.523238920511395e-05, "epoch": 0.25948103792415167, "percentage": 25.95, "elapsed_time": "0:05:38", "remaining_time": "0:16:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 131, "total_steps": 501, "loss": 0.4735, "learning_rate": 3.528785492759607e-05, "epoch": 0.26147704590818366, "percentage": 26.15, "elapsed_time": "0:05:40", "remaining_time": "0:16:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 132, "total_steps": 501, "loss": 0.4952, "learning_rate": 3.5342898853430836e-05, "epoch": 0.2634730538922156, "percentage": 26.35, "elapsed_time": "0:05:42", "remaining_time": "0:15:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 133, "total_steps": 501, "loss": 0.4516, "learning_rate": 3.539752734945143e-05, "epoch": 0.2654690618762475, "percentage": 26.55, "elapsed_time": "0:05:45", "remaining_time": "0:15:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 134, "total_steps": 501, "loss": 0.3785, "learning_rate": 3.5451746639413466e-05, "epoch": 0.26746506986027946, "percentage": 26.75, "elapsed_time": "0:05:47", "remaining_time": "0:15:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 135, "total_steps": 501, "loss": 0.4324, "learning_rate": 3.550556280825011e-05, "epoch": 0.2694610778443114, "percentage": 26.95, "elapsed_time": "0:05:49", "remaining_time": "0:15:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 136, "total_steps": 501, "loss": 0.3836, "learning_rate": 3.55589818061703e-05, "epoch": 0.2714570858283433, "percentage": 27.15, "elapsed_time": "0:05:52", "remaining_time": "0:15:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 137, "total_steps": 501, "loss": 0.4462, "learning_rate": 3.561200945260678e-05, "epoch": 0.27345309381237526, "percentage": 27.35, "elapsed_time": "0:05:54", "remaining_time": "0:15:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 138, "total_steps": 501, "loss": 0.4749, "learning_rate": 3.5664651440020616e-05, "epoch": 0.2754491017964072, "percentage": 27.54, "elapsed_time": "0:05:56", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 139, "total_steps": 501, "loss": 0.4782, "learning_rate": 3.571691333756825e-05, "epoch": 0.2774451097804391, "percentage": 27.74, "elapsed_time": "0:05:59", "remaining_time": "0:15:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 501, "loss": 0.4401, "learning_rate": 3.5768800594637304e-05, "epoch": 0.27944111776447106, "percentage": 27.94, "elapsed_time": "0:06:01", "remaining_time": "0:15:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 141, "total_steps": 501, "loss": 0.4992, "learning_rate": 3.582031854425634e-05, "epoch": 0.281437125748503, "percentage": 28.14, "elapsed_time": "0:06:03", "remaining_time": "0:15:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 142, "total_steps": 501, "loss": 0.5009, "learning_rate": 3.587147240638428e-05, "epoch": 0.2834331337325349, "percentage": 28.34, "elapsed_time": "0:06:06", "remaining_time": "0:15:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 143, "total_steps": 501, "loss": 0.3891, "learning_rate": 3.5922267291084366e-05, "epoch": 0.28542914171656686, "percentage": 28.54, "elapsed_time": "0:06:08", "remaining_time": "0:15:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 144, "total_steps": 501, "loss": 0.442, "learning_rate": 3.5972708201587496e-05, "epoch": 0.2874251497005988, "percentage": 28.74, "elapsed_time": "0:06:10", "remaining_time": "0:15:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 145, "total_steps": 501, "loss": 0.5065, "learning_rate": 3.6022800037249585e-05, "epoch": 0.2894211576846307, "percentage": 28.94, "elapsed_time": "0:06:13", "remaining_time": "0:15:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 146, "total_steps": 501, "loss": 0.4617, "learning_rate": 3.607254759640729e-05, "epoch": 0.29141716566866266, "percentage": 29.14, "elapsed_time": "0:06:15", "remaining_time": "0:15:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 147, "total_steps": 501, "loss": 0.4633, "learning_rate": 3.612195557913627e-05, "epoch": 0.2934131736526946, "percentage": 29.34, "elapsed_time": "0:06:17", "remaining_time": "0:15:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 148, "total_steps": 501, "loss": 0.434, "learning_rate": 3.6171028589915954e-05, "epoch": 0.2954091816367265, "percentage": 29.54, "elapsed_time": "0:06:20", "remaining_time": "0:15:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 149, "total_steps": 501, "loss": 0.4627, "learning_rate": 3.6219771140204575e-05, "epoch": 0.29740518962075846, "percentage": 29.74, "elapsed_time": "0:06:22", "remaining_time": "0:15:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 501, "loss": 0.4152, "learning_rate": 3.626818765092802e-05, "epoch": 0.2994011976047904, "percentage": 29.94, "elapsed_time": "0:06:24", "remaining_time": "0:15:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 151, "total_steps": 501, "loss": 0.4912, "learning_rate": 3.6316282454886157e-05, "epoch": 0.3013972055888224, "percentage": 30.14, "elapsed_time": "0:06:27", "remaining_time": "0:14:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 152, "total_steps": 501, "loss": 0.3153, "learning_rate": 3.636405979907955e-05, "epoch": 0.3033932135728543, "percentage": 30.34, "elapsed_time": "0:06:29", "remaining_time": "0:14:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 153, "total_steps": 501, "loss": 0.4619, "learning_rate": 3.6411523846959985e-05, "epoch": 0.30538922155688625, "percentage": 30.54, "elapsed_time": "0:06:31", "remaining_time": "0:14:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 154, "total_steps": 501, "loss": 0.5165, "learning_rate": 3.645867868060772e-05, "epoch": 0.3073852295409182, "percentage": 30.74, "elapsed_time": "0:06:34", "remaining_time": "0:14:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 155, "total_steps": 501, "loss": 0.4222, "learning_rate": 3.6505528302838193e-05, "epoch": 0.3093812375249501, "percentage": 30.94, "elapsed_time": "0:06:36", "remaining_time": "0:14:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 156, "total_steps": 501, "loss": 0.4882, "learning_rate": 3.6552076639241027e-05, "epoch": 0.31137724550898205, "percentage": 31.14, "elapsed_time": "0:06:38", "remaining_time": "0:14:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 157, "total_steps": 501, "loss": 0.4171, "learning_rate": 3.65983275401539e-05, "epoch": 0.313373253493014, "percentage": 31.34, "elapsed_time": "0:06:41", "remaining_time": "0:14:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 158, "total_steps": 501, "loss": 0.4342, "learning_rate": 3.664428478257371e-05, "epoch": 0.3153692614770459, "percentage": 31.54, "elapsed_time": "0:06:43", "remaining_time": "0:14:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 159, "total_steps": 501, "loss": 0.4698, "learning_rate": 3.668995207200753e-05, "epoch": 0.31736526946107785, "percentage": 31.74, "elapsed_time": "0:06:45", "remaining_time": "0:14:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 501, "loss": 0.4896, "learning_rate": 3.673533304426541e-05, "epoch": 0.3193612774451098, "percentage": 31.94, "elapsed_time": "0:06:48", "remaining_time": "0:14:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 161, "total_steps": 501, "loss": 0.4997, "learning_rate": 3.67804312671975e-05, "epoch": 0.3213572854291417, "percentage": 32.14, "elapsed_time": "0:06:50", "remaining_time": "0:14:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 162, "total_steps": 501, "loss": 0.47, "learning_rate": 3.682525024237719e-05, "epoch": 0.32335329341317365, "percentage": 32.34, "elapsed_time": "0:06:52", "remaining_time": "0:14:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 163, "total_steps": 501, "loss": 0.4085, "learning_rate": 3.6869793406732636e-05, "epoch": 0.3253493013972056, "percentage": 32.53, "elapsed_time": "0:06:55", "remaining_time": "0:14:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 164, "total_steps": 501, "loss": 0.4329, "learning_rate": 3.69140641341283e-05, "epoch": 0.3273453093812375, "percentage": 32.73, "elapsed_time": "0:06:57", "remaining_time": "0:14:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 165, "total_steps": 501, "loss": 0.348, "learning_rate": 3.695806573689844e-05, "epoch": 0.32934131736526945, "percentage": 32.93, "elapsed_time": "0:07:00", "remaining_time": "0:14:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 166, "total_steps": 501, "loss": 0.4342, "learning_rate": 3.700180146733426e-05, "epoch": 0.3313373253493014, "percentage": 33.13, "elapsed_time": "0:07:02", "remaining_time": "0:14:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 167, "total_steps": 501, "loss": 0.4809, "learning_rate": 3.704527451912639e-05, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "0:07:04", "remaining_time": "0:14:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 168, "total_steps": 501, "loss": 0.4586, "learning_rate": 3.708848802876438e-05, "epoch": 0.33532934131736525, "percentage": 33.53, "elapsed_time": "0:07:07", "remaining_time": "0:14:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 169, "total_steps": 501, "loss": 0.4471, "learning_rate": 3.7131445076894564e-05, "epoch": 0.3373253493013972, "percentage": 33.73, "elapsed_time": "0:07:09", "remaining_time": "0:14:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 501, "loss": 0.3867, "learning_rate": 3.717414868963791e-05, "epoch": 0.3393213572854291, "percentage": 33.93, "elapsed_time": "0:07:11", "remaining_time": "0:14:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 171, "total_steps": 501, "loss": 0.4502, "learning_rate": 3.721660183986924e-05, "epoch": 0.3413173652694611, "percentage": 34.13, "elapsed_time": "0:07:14", "remaining_time": "0:13:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 172, "total_steps": 501, "loss": 0.3507, "learning_rate": 3.725880744845915e-05, "epoch": 0.34331337325349304, "percentage": 34.33, "elapsed_time": "0:07:16", "remaining_time": "0:13:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 173, "total_steps": 501, "loss": 0.3512, "learning_rate": 3.730076838547993e-05, "epoch": 0.34530938123752497, "percentage": 34.53, "elapsed_time": "0:07:18", "remaining_time": "0:13:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 174, "total_steps": 501, "loss": 0.4263, "learning_rate": 3.734248747137666e-05, "epoch": 0.3473053892215569, "percentage": 34.73, "elapsed_time": "0:07:21", "remaining_time": "0:13:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 175, "total_steps": 501, "loss": 0.3923, "learning_rate": 3.738396747810492e-05, "epoch": 0.34930139720558884, "percentage": 34.93, "elapsed_time": "0:07:23", "remaining_time": "0:13:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 176, "total_steps": 501, "loss": 0.3811, "learning_rate": 3.7425211130235834e-05, "epoch": 0.35129740518962077, "percentage": 35.13, "elapsed_time": "0:07:25", "remaining_time": "0:13:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 177, "total_steps": 501, "loss": 0.4152, "learning_rate": 3.7466221106030115e-05, "epoch": 0.3532934131736527, "percentage": 35.33, "elapsed_time": "0:07:28", "remaining_time": "0:13:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 178, "total_steps": 501, "loss": 0.3321, "learning_rate": 3.750700003848157e-05, "epoch": 0.35528942115768464, "percentage": 35.53, "elapsed_time": "0:07:30", "remaining_time": "0:13:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 179, "total_steps": 501, "loss": 0.4008, "learning_rate": 3.7547550516331555e-05, "epoch": 0.35728542914171657, "percentage": 35.73, "elapsed_time": "0:07:32", "remaining_time": "0:13:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 501, "loss": 0.408, "learning_rate": 3.75878750850551e-05, "epoch": 0.3592814371257485, "percentage": 35.93, "elapsed_time": "0:07:35", "remaining_time": "0:13:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 181, "total_steps": 501, "loss": 0.4076, "learning_rate": 3.7627976247819744e-05, "epoch": 0.36127744510978044, "percentage": 36.13, "elapsed_time": "0:07:37", "remaining_time": "0:13:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 182, "total_steps": 501, "loss": 0.4311, "learning_rate": 3.766785646641792e-05, "epoch": 0.36327345309381237, "percentage": 36.33, "elapsed_time": "0:07:39", "remaining_time": "0:13:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 183, "total_steps": 501, "loss": 0.422, "learning_rate": 3.770751816217383e-05, "epoch": 0.3652694610778443, "percentage": 36.53, "elapsed_time": "0:07:42", "remaining_time": "0:13:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 184, "total_steps": 501, "loss": 0.4475, "learning_rate": 3.7746963716825615e-05, "epoch": 0.36726546906187624, "percentage": 36.73, "elapsed_time": "0:07:44", "remaining_time": "0:13:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 185, "total_steps": 501, "loss": 0.3981, "learning_rate": 3.778619547338356e-05, "epoch": 0.36926147704590817, "percentage": 36.93, "elapsed_time": "0:07:46", "remaining_time": "0:13:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 186, "total_steps": 501, "loss": 0.4482, "learning_rate": 3.782521573696528e-05, "epoch": 0.3712574850299401, "percentage": 37.13, "elapsed_time": "0:07:49", "remaining_time": "0:13:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 187, "total_steps": 501, "loss": 0.3413, "learning_rate": 3.786402677560832e-05, "epoch": 0.37325349301397204, "percentage": 37.33, "elapsed_time": "0:07:51", "remaining_time": "0:13:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 188, "total_steps": 501, "loss": 0.4207, "learning_rate": 3.790263082106134e-05, "epoch": 0.37524950099800397, "percentage": 37.52, "elapsed_time": "0:07:53", "remaining_time": "0:13:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 189, "total_steps": 501, "loss": 0.4521, "learning_rate": 3.794103006955407e-05, "epoch": 0.3772455089820359, "percentage": 37.72, "elapsed_time": "0:07:56", "remaining_time": "0:13:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 501, "loss": 0.3653, "learning_rate": 3.797922668254715e-05, "epoch": 0.37924151696606784, "percentage": 37.92, "elapsed_time": "0:07:58", "remaining_time": "0:13:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 191, "total_steps": 501, "loss": 0.3662, "learning_rate": 3.801722278746213e-05, "epoch": 0.3812375249500998, "percentage": 38.12, "elapsed_time": "0:08:00", "remaining_time": "0:13:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 192, "total_steps": 501, "loss": 0.2939, "learning_rate": 3.8055020478392495e-05, "epoch": 0.38323353293413176, "percentage": 38.32, "elapsed_time": "0:08:03", "remaining_time": "0:12:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 193, "total_steps": 501, "loss": 0.4302, "learning_rate": 3.809262181679623e-05, "epoch": 0.3852295409181637, "percentage": 38.52, "elapsed_time": "0:08:05", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 194, "total_steps": 501, "loss": 0.3984, "learning_rate": 3.813002883217044e-05, "epoch": 0.3872255489021956, "percentage": 38.72, "elapsed_time": "0:08:07", "remaining_time": "0:12:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 195, "total_steps": 501, "loss": 0.3839, "learning_rate": 3.816724352270863e-05, "epoch": 0.38922155688622756, "percentage": 38.92, "elapsed_time": "0:08:10", "remaining_time": "0:12:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 196, "total_steps": 501, "loss": 0.4014, "learning_rate": 3.8204267855941266e-05, "epoch": 0.3912175648702595, "percentage": 39.12, "elapsed_time": "0:08:12", "remaining_time": "0:12:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 197, "total_steps": 501, "loss": 0.3791, "learning_rate": 3.824110376935989e-05, "epoch": 0.3932135728542914, "percentage": 39.32, "elapsed_time": "0:08:14", "remaining_time": "0:12:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 198, "total_steps": 501, "loss": 0.3904, "learning_rate": 3.827775317102552e-05, "epoch": 0.39520958083832336, "percentage": 39.52, "elapsed_time": "0:08:17", "remaining_time": "0:12:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 199, "total_steps": 501, "loss": 0.3933, "learning_rate": 3.831421794016178e-05, "epoch": 0.3972055888223553, "percentage": 39.72, "elapsed_time": "0:08:19", "remaining_time": "0:12:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 501, "loss": 0.439, "learning_rate": 3.835049992773302e-05, "epoch": 0.3992015968063872, "percentage": 39.92, "elapsed_time": "0:08:21", "remaining_time": "0:12:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 201, "total_steps": 501, "loss": 0.4462, "learning_rate": 3.838660095700815e-05, "epoch": 0.40119760479041916, "percentage": 40.12, "elapsed_time": "0:09:13", "remaining_time": "0:13:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 202, "total_steps": 501, "loss": 0.4621, "learning_rate": 3.84225228241104e-05, "epoch": 0.4031936127744511, "percentage": 40.32, "elapsed_time": "0:09:15", "remaining_time": "0:13:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 203, "total_steps": 501, "loss": 0.4888, "learning_rate": 3.8458267298553554e-05, "epoch": 0.405189620758483, "percentage": 40.52, "elapsed_time": "0:09:17", "remaining_time": "0:13:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 204, "total_steps": 501, "loss": 0.3836, "learning_rate": 3.8493836123764984e-05, "epoch": 0.40718562874251496, "percentage": 40.72, "elapsed_time": "0:09:20", "remaining_time": "0:13:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 205, "total_steps": 501, "loss": 0.3993, "learning_rate": 3.852923101759591e-05, "epoch": 0.4091816367265469, "percentage": 40.92, "elapsed_time": "0:09:22", "remaining_time": "0:13:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 206, "total_steps": 501, "loss": 0.3948, "learning_rate": 3.856445367281923e-05, "epoch": 0.4111776447105788, "percentage": 41.12, "elapsed_time": "0:09:24", "remaining_time": "0:13:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 207, "total_steps": 501, "loss": 0.4305, "learning_rate": 3.859950575761529e-05, "epoch": 0.41317365269461076, "percentage": 41.32, "elapsed_time": "0:09:27", "remaining_time": "0:13:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 208, "total_steps": 501, "loss": 0.4982, "learning_rate": 3.8634388916046025e-05, "epoch": 0.4151696606786427, "percentage": 41.52, "elapsed_time": "0:09:29", "remaining_time": "0:13:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 209, "total_steps": 501, "loss": 0.4147, "learning_rate": 3.866910476851757e-05, "epoch": 0.4171656686626746, "percentage": 41.72, "elapsed_time": "0:09:31", "remaining_time": "0:13:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 501, "loss": 0.4125, "learning_rate": 3.870365491223199e-05, "epoch": 0.41916167664670656, "percentage": 41.92, "elapsed_time": "0:09:34", "remaining_time": "0:13:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 211, "total_steps": 501, "loss": 0.3941, "learning_rate": 3.8738040921628215e-05, "epoch": 0.42115768463073855, "percentage": 42.12, "elapsed_time": "0:09:36", "remaining_time": "0:13:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 212, "total_steps": 501, "loss": 0.4327, "learning_rate": 3.877226434881253e-05, "epoch": 0.4231536926147705, "percentage": 42.32, "elapsed_time": "0:09:39", "remaining_time": "0:13:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 213, "total_steps": 501, "loss": 0.4303, "learning_rate": 3.880632672397897e-05, "epoch": 0.4251497005988024, "percentage": 42.51, "elapsed_time": "0:09:41", "remaining_time": "0:13:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 214, "total_steps": 501, "loss": 0.4301, "learning_rate": 3.884022955581985e-05, "epoch": 0.42714570858283435, "percentage": 42.71, "elapsed_time": "0:09:43", "remaining_time": "0:13:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 215, "total_steps": 501, "loss": 0.4208, "learning_rate": 3.887397433192676e-05, "epoch": 0.4291417165668663, "percentage": 42.91, "elapsed_time": "0:09:46", "remaining_time": "0:12:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 216, "total_steps": 501, "loss": 0.3384, "learning_rate": 3.890756251918219e-05, "epoch": 0.4311377245508982, "percentage": 43.11, "elapsed_time": "0:09:48", "remaining_time": "0:12:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 217, "total_steps": 501, "loss": 0.3797, "learning_rate": 3.894099556414216e-05, "epoch": 0.43313373253493015, "percentage": 43.31, "elapsed_time": "0:09:50", "remaining_time": "0:12:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 218, "total_steps": 501, "loss": 0.4325, "learning_rate": 3.897427489341009e-05, "epoch": 0.4351297405189621, "percentage": 43.51, "elapsed_time": "0:09:53", "remaining_time": "0:12:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 219, "total_steps": 501, "loss": 0.4466, "learning_rate": 3.900740191400198e-05, "epoch": 0.437125748502994, "percentage": 43.71, "elapsed_time": "0:09:55", "remaining_time": "0:12:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 501, "loss": 0.4355, "learning_rate": 3.904037801370344e-05, "epoch": 0.43912175648702595, "percentage": 43.91, "elapsed_time": "0:09:57", "remaining_time": "0:12:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 221, "total_steps": 501, "loss": 0.3465, "learning_rate": 3.9073204561418514e-05, "epoch": 0.4411177644710579, "percentage": 44.11, "elapsed_time": "0:10:00", "remaining_time": "0:12:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 222, "total_steps": 501, "loss": 0.4004, "learning_rate": 3.9105882907510644e-05, "epoch": 0.4431137724550898, "percentage": 44.31, "elapsed_time": "0:10:02", "remaining_time": "0:12:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 223, "total_steps": 501, "loss": 0.4261, "learning_rate": 3.913841438413601e-05, "epoch": 0.44510978043912175, "percentage": 44.51, "elapsed_time": "0:10:04", "remaining_time": "0:12:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 224, "total_steps": 501, "loss": 0.3192, "learning_rate": 3.917080030556938e-05, "epoch": 0.4471057884231537, "percentage": 44.71, "elapsed_time": "0:10:07", "remaining_time": "0:12:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 225, "total_steps": 501, "loss": 0.4663, "learning_rate": 3.9203041968522716e-05, "epoch": 0.4491017964071856, "percentage": 44.91, "elapsed_time": "0:10:09", "remaining_time": "0:12:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 226, "total_steps": 501, "loss": 0.4558, "learning_rate": 3.923514065245669e-05, "epoch": 0.45109780439121755, "percentage": 45.11, "elapsed_time": "0:10:11", "remaining_time": "0:12:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 227, "total_steps": 501, "loss": 0.4546, "learning_rate": 3.926709761988538e-05, "epoch": 0.4530938123752495, "percentage": 45.31, "elapsed_time": "0:10:14", "remaining_time": "0:12:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 228, "total_steps": 501, "loss": 0.3762, "learning_rate": 3.929891411667424e-05, "epoch": 0.4550898203592814, "percentage": 45.51, "elapsed_time": "0:10:16", "remaining_time": "0:12:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 229, "total_steps": 501, "loss": 0.4447, "learning_rate": 3.933059137233147e-05, "epoch": 0.45708582834331335, "percentage": 45.71, "elapsed_time": "0:10:18", "remaining_time": "0:12:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 501, "loss": 0.4366, "learning_rate": 3.9362130600293214e-05, "epoch": 0.4590818363273453, "percentage": 45.91, "elapsed_time": "0:10:21", "remaining_time": "0:12:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 231, "total_steps": 501, "loss": 0.4434, "learning_rate": 3.9393532998202405e-05, "epoch": 0.46107784431137727, "percentage": 46.11, "elapsed_time": "0:10:23", "remaining_time": "0:12:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 232, "total_steps": 501, "loss": 0.3755, "learning_rate": 3.942479974818166e-05, "epoch": 0.4630738522954092, "percentage": 46.31, "elapsed_time": "0:10:25", "remaining_time": "0:12:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 233, "total_steps": 501, "loss": 0.375, "learning_rate": 3.945593201710032e-05, "epoch": 0.46506986027944114, "percentage": 46.51, "elapsed_time": "0:10:28", "remaining_time": "0:12:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 234, "total_steps": 501, "loss": 0.3985, "learning_rate": 3.9486930956835724e-05, "epoch": 0.46706586826347307, "percentage": 46.71, "elapsed_time": "0:10:30", "remaining_time": "0:11:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 235, "total_steps": 501, "loss": 0.421, "learning_rate": 3.951779770452894e-05, "epoch": 0.469061876247505, "percentage": 46.91, "elapsed_time": "0:10:32", "remaining_time": "0:11:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 236, "total_steps": 501, "loss": 0.4592, "learning_rate": 3.954853338283512e-05, "epoch": 0.47105788423153694, "percentage": 47.11, "elapsed_time": "0:10:35", "remaining_time": "0:11:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 237, "total_steps": 501, "loss": 0.3732, "learning_rate": 3.9579139100168404e-05, "epoch": 0.47305389221556887, "percentage": 47.31, "elapsed_time": "0:10:37", "remaining_time": "0:11:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 238, "total_steps": 501, "loss": 0.4038, "learning_rate": 3.960961595094187e-05, "epoch": 0.4750499001996008, "percentage": 47.5, "elapsed_time": "0:10:39", "remaining_time": "0:11:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 239, "total_steps": 501, "loss": 0.4348, "learning_rate": 3.96399650158023e-05, "epoch": 0.47704590818363274, "percentage": 47.7, "elapsed_time": "0:10:42", "remaining_time": "0:11:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 501, "loss": 0.4704, "learning_rate": 3.96701873618601e-05, "epoch": 0.47904191616766467, "percentage": 47.9, "elapsed_time": "0:10:44", "remaining_time": "0:11:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 241, "total_steps": 501, "loss": 0.381, "learning_rate": 3.970028404291448e-05, "epoch": 0.4810379241516966, "percentage": 48.1, "elapsed_time": "0:10:46", "remaining_time": "0:11:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 242, "total_steps": 501, "loss": 0.3282, "learning_rate": 3.9730256099673865e-05, "epoch": 0.48303393213572854, "percentage": 48.3, "elapsed_time": "0:10:49", "remaining_time": "0:11:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 243, "total_steps": 501, "loss": 0.3794, "learning_rate": 3.976010455997187e-05, "epoch": 0.48502994011976047, "percentage": 48.5, "elapsed_time": "0:10:51", "remaining_time": "0:11:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 244, "total_steps": 501, "loss": 0.4222, "learning_rate": 3.978983043897883e-05, "epoch": 0.4870259481037924, "percentage": 48.7, "elapsed_time": "0:10:53", "remaining_time": "0:11:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 245, "total_steps": 501, "loss": 0.3682, "learning_rate": 3.981943473940888e-05, "epoch": 0.48902195608782434, "percentage": 48.9, "elapsed_time": "0:10:56", "remaining_time": "0:11:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 246, "total_steps": 501, "loss": 0.3546, "learning_rate": 3.984891845172299e-05, "epoch": 0.49101796407185627, "percentage": 49.1, "elapsed_time": "0:10:58", "remaining_time": "0:11:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 247, "total_steps": 501, "loss": 0.3764, "learning_rate": 3.987828255432777e-05, "epoch": 0.4930139720558882, "percentage": 49.3, "elapsed_time": "0:11:00", "remaining_time": "0:11:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 248, "total_steps": 501, "loss": 0.4436, "learning_rate": 3.9907528013770276e-05, "epoch": 0.49500998003992014, "percentage": 49.5, "elapsed_time": "0:11:03", "remaining_time": "0:11:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 249, "total_steps": 501, "loss": 0.4477, "learning_rate": 3.993665578492894e-05, "epoch": 0.49700598802395207, "percentage": 49.7, "elapsed_time": "0:11:05", "remaining_time": "0:11:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 501, "loss": 0.355, "learning_rate": 3.9965666811200624e-05, "epoch": 0.499001996007984, "percentage": 49.9, "elapsed_time": "0:11:07", "remaining_time": "0:11:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 251, "total_steps": 501, "loss": 0.4044, "learning_rate": 3.999456202468397e-05, "epoch": 0.500998003992016, "percentage": 50.1, "elapsed_time": "0:11:10", "remaining_time": "0:11:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 252, "total_steps": 501, "loss": 0.3515, "learning_rate": 4.002334234635907e-05, "epoch": 0.5029940119760479, "percentage": 50.3, "elapsed_time": "0:11:12", "remaining_time": "0:11:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 253, "total_steps": 501, "loss": 0.4055, "learning_rate": 4.005200868626364e-05, "epoch": 0.5049900199600799, "percentage": 50.5, "elapsed_time": "0:11:15", "remaining_time": "0:11:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 254, "total_steps": 501, "loss": 0.4327, "learning_rate": 4.008056194366564e-05, "epoch": 0.5069860279441117, "percentage": 50.7, "elapsed_time": "0:11:17", "remaining_time": "0:10:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 255, "total_steps": 501, "loss": 0.4187, "learning_rate": 4.010900300723259e-05, "epoch": 0.5089820359281437, "percentage": 50.9, "elapsed_time": "0:11:19", "remaining_time": "0:10:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 256, "total_steps": 501, "loss": 0.3947, "learning_rate": 4.013733275519749e-05, "epoch": 0.5109780439121756, "percentage": 51.1, "elapsed_time": "0:11:22", "remaining_time": "0:10:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 257, "total_steps": 501, "loss": 0.3808, "learning_rate": 4.016555205552158e-05, "epoch": 0.5129740518962076, "percentage": 51.3, "elapsed_time": "0:11:24", "remaining_time": "0:10:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 258, "total_steps": 501, "loss": 0.4408, "learning_rate": 4.0193661766053834e-05, "epoch": 0.5149700598802395, "percentage": 51.5, "elapsed_time": "0:11:26", "remaining_time": "0:10:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 259, "total_steps": 501, "loss": 0.3826, "learning_rate": 4.022166273468753e-05, "epoch": 0.5169660678642715, "percentage": 51.7, "elapsed_time": "0:11:29", "remaining_time": "0:10:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 501, "loss": 0.3403, "learning_rate": 4.024955579951363e-05, "epoch": 0.5189620758483033, "percentage": 51.9, "elapsed_time": "0:11:31", "remaining_time": "0:10:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 261, "total_steps": 501, "loss": 0.3927, "learning_rate": 4.027734178897136e-05, "epoch": 0.5209580838323353, "percentage": 52.1, "elapsed_time": "0:11:33", "remaining_time": "0:10:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 262, "total_steps": 501, "loss": 0.4247, "learning_rate": 4.030502152199576e-05, "epoch": 0.5229540918163673, "percentage": 52.3, "elapsed_time": "0:11:36", "remaining_time": "0:10:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 263, "total_steps": 501, "loss": 0.4284, "learning_rate": 4.033259580816264e-05, "epoch": 0.5249500998003992, "percentage": 52.5, "elapsed_time": "0:11:38", "remaining_time": "0:10:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 264, "total_steps": 501, "loss": 0.4534, "learning_rate": 4.036006544783052e-05, "epoch": 0.5269461077844312, "percentage": 52.69, "elapsed_time": "0:11:40", "remaining_time": "0:10:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 265, "total_steps": 501, "loss": 0.3404, "learning_rate": 4.0387431232280135e-05, "epoch": 0.5289421157684631, "percentage": 52.89, "elapsed_time": "0:11:43", "remaining_time": "0:10:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 266, "total_steps": 501, "loss": 0.4455, "learning_rate": 4.041469394385112e-05, "epoch": 0.530938123752495, "percentage": 53.09, "elapsed_time": "0:11:45", "remaining_time": "0:10:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 267, "total_steps": 501, "loss": 0.4636, "learning_rate": 4.0441854356076257e-05, "epoch": 0.5329341317365269, "percentage": 53.29, "elapsed_time": "0:11:47", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 268, "total_steps": 501, "loss": 0.3777, "learning_rate": 4.046891323381315e-05, "epoch": 0.5349301397205589, "percentage": 53.49, "elapsed_time": "0:11:50", "remaining_time": "0:10:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 269, "total_steps": 501, "loss": 0.4006, "learning_rate": 4.049587133337347e-05, "epoch": 0.5369261477045908, "percentage": 53.69, "elapsed_time": "0:11:52", "remaining_time": "0:10:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 501, "loss": 0.418, "learning_rate": 4.0522729402649793e-05, "epoch": 0.5389221556886228, "percentage": 53.89, "elapsed_time": "0:11:54", "remaining_time": "0:10:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 271, "total_steps": 501, "loss": 0.3358, "learning_rate": 4.0549488181240096e-05, "epoch": 0.5409181636726547, "percentage": 54.09, "elapsed_time": "0:11:57", "remaining_time": "0:10:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 272, "total_steps": 501, "loss": 0.4008, "learning_rate": 4.057614840056998e-05, "epoch": 0.5429141716566867, "percentage": 54.29, "elapsed_time": "0:11:59", "remaining_time": "0:10:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 273, "total_steps": 501, "loss": 0.3607, "learning_rate": 4.06027107840126e-05, "epoch": 0.5449101796407185, "percentage": 54.49, "elapsed_time": "0:12:01", "remaining_time": "0:10:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 274, "total_steps": 501, "loss": 0.3567, "learning_rate": 4.0629176047006474e-05, "epoch": 0.5469061876247505, "percentage": 54.69, "elapsed_time": "0:12:04", "remaining_time": "0:10:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 275, "total_steps": 501, "loss": 0.3528, "learning_rate": 4.065554489717105e-05, "epoch": 0.5489021956087824, "percentage": 54.89, "elapsed_time": "0:12:06", "remaining_time": "0:09:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 276, "total_steps": 501, "loss": 0.4062, "learning_rate": 4.068181803442029e-05, "epoch": 0.5508982035928144, "percentage": 55.09, "elapsed_time": "0:12:08", "remaining_time": "0:09:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 277, "total_steps": 501, "loss": 0.4374, "learning_rate": 4.0707996151074147e-05, "epoch": 0.5528942115768463, "percentage": 55.29, "elapsed_time": "0:12:11", "remaining_time": "0:09:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 278, "total_steps": 501, "loss": 0.4121, "learning_rate": 4.073407993196794e-05, "epoch": 0.5548902195608783, "percentage": 55.49, "elapsed_time": "0:12:13", "remaining_time": "0:09:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 279, "total_steps": 501, "loss": 0.4702, "learning_rate": 4.076007005455996e-05, "epoch": 0.5568862275449101, "percentage": 55.69, "elapsed_time": "0:12:16", "remaining_time": "0:09:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 501, "loss": 0.3581, "learning_rate": 4.0785967189036986e-05, "epoch": 0.5588822355289421, "percentage": 55.89, "elapsed_time": "0:12:18", "remaining_time": "0:09:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 281, "total_steps": 501, "loss": 0.414, "learning_rate": 4.0811771998418e-05, "epoch": 0.5608782435129741, "percentage": 56.09, "elapsed_time": "0:12:20", "remaining_time": "0:09:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 282, "total_steps": 501, "loss": 0.3549, "learning_rate": 4.083748513865602e-05, "epoch": 0.562874251497006, "percentage": 56.29, "elapsed_time": "0:12:23", "remaining_time": "0:09:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 283, "total_steps": 501, "loss": 0.4977, "learning_rate": 4.086310725873818e-05, "epoch": 0.564870259481038, "percentage": 56.49, "elapsed_time": "0:12:25", "remaining_time": "0:09:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 284, "total_steps": 501, "loss": 0.4646, "learning_rate": 4.0888639000783966e-05, "epoch": 0.5668662674650699, "percentage": 56.69, "elapsed_time": "0:12:27", "remaining_time": "0:09:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 285, "total_steps": 501, "loss": 0.4295, "learning_rate": 4.0914081000141844e-05, "epoch": 0.5688622754491018, "percentage": 56.89, "elapsed_time": "0:12:30", "remaining_time": "0:09:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 286, "total_steps": 501, "loss": 0.3168, "learning_rate": 4.0939433885484055e-05, "epoch": 0.5708582834331337, "percentage": 57.09, "elapsed_time": "0:12:32", "remaining_time": "0:09:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 287, "total_steps": 501, "loss": 0.3373, "learning_rate": 4.0964698278899874e-05, "epoch": 0.5728542914171657, "percentage": 57.29, "elapsed_time": "0:12:34", "remaining_time": "0:09:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 288, "total_steps": 501, "loss": 0.3705, "learning_rate": 4.0989874795987185e-05, "epoch": 0.5748502994011976, "percentage": 57.49, "elapsed_time": "0:12:37", "remaining_time": "0:09:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 289, "total_steps": 501, "loss": 0.366, "learning_rate": 4.1014964045942465e-05, "epoch": 0.5768463073852296, "percentage": 57.68, "elapsed_time": "0:12:39", "remaining_time": "0:09:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 501, "loss": 0.4435, "learning_rate": 4.103996663164927e-05, "epoch": 0.5788423153692615, "percentage": 57.88, "elapsed_time": "0:12:41", "remaining_time": "0:09:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 291, "total_steps": 501, "loss": 0.471, "learning_rate": 4.106488314976513e-05, "epoch": 0.5808383233532934, "percentage": 58.08, "elapsed_time": "0:12:44", "remaining_time": "0:09:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 292, "total_steps": 501, "loss": 0.3138, "learning_rate": 4.108971419080698e-05, "epoch": 0.5828343313373253, "percentage": 58.28, "elapsed_time": "0:12:46", "remaining_time": "0:09:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 293, "total_steps": 501, "loss": 0.4394, "learning_rate": 4.111446033923516e-05, "epoch": 0.5848303393213573, "percentage": 58.48, "elapsed_time": "0:12:48", "remaining_time": "0:09:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 294, "total_steps": 501, "loss": 0.3741, "learning_rate": 4.113912217353596e-05, "epoch": 0.5868263473053892, "percentage": 58.68, "elapsed_time": "0:12:51", "remaining_time": "0:09:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 295, "total_steps": 501, "loss": 0.3116, "learning_rate": 4.116370026630272e-05, "epoch": 0.5888223552894212, "percentage": 58.88, "elapsed_time": "0:12:53", "remaining_time": "0:09:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 296, "total_steps": 501, "loss": 0.4048, "learning_rate": 4.118819518431564e-05, "epoch": 0.590818363273453, "percentage": 59.08, "elapsed_time": "0:12:55", "remaining_time": "0:08:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 297, "total_steps": 501, "loss": 0.4346, "learning_rate": 4.121260748862021e-05, "epoch": 0.592814371257485, "percentage": 59.28, "elapsed_time": "0:12:58", "remaining_time": "0:08:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 298, "total_steps": 501, "loss": 0.3629, "learning_rate": 4.123693773460426e-05, "epoch": 0.5948103792415169, "percentage": 59.48, "elapsed_time": "0:13:00", "remaining_time": "0:08:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 299, "total_steps": 501, "loss": 0.4248, "learning_rate": 4.126118647207383e-05, "epoch": 0.5968063872255489, "percentage": 59.68, "elapsed_time": "0:13:02", "remaining_time": "0:08:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 501, "loss": 0.2834, "learning_rate": 4.1285354245327715e-05, "epoch": 0.5988023952095808, "percentage": 59.88, "elapsed_time": "0:13:05", "remaining_time": "0:08:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 301, "total_steps": 501, "loss": 0.4276, "learning_rate": 4.1309441593230726e-05, "epoch": 0.6007984031936128, "percentage": 60.08, "elapsed_time": "0:13:37", "remaining_time": "0:09:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 302, "total_steps": 501, "loss": 0.3925, "learning_rate": 4.133344904928585e-05, "epoch": 0.6027944111776448, "percentage": 60.28, "elapsed_time": "0:13:40", "remaining_time": "0:09:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 303, "total_steps": 501, "loss": 0.2589, "learning_rate": 4.1357377141705084e-05, "epoch": 0.6047904191616766, "percentage": 60.48, "elapsed_time": "0:13:42", "remaining_time": "0:08:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 304, "total_steps": 501, "loss": 0.3705, "learning_rate": 4.1381226393479236e-05, "epoch": 0.6067864271457086, "percentage": 60.68, "elapsed_time": "0:13:44", "remaining_time": "0:08:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 305, "total_steps": 501, "loss": 0.3637, "learning_rate": 4.1404997322446435e-05, "epoch": 0.6087824351297405, "percentage": 60.88, "elapsed_time": "0:13:47", "remaining_time": "0:08:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 306, "total_steps": 501, "loss": 0.477, "learning_rate": 4.142869044135967e-05, "epoch": 0.6107784431137725, "percentage": 61.08, "elapsed_time": "0:13:49", "remaining_time": "0:08:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 307, "total_steps": 501, "loss": 0.4123, "learning_rate": 4.145230625795311e-05, "epoch": 0.6127744510978044, "percentage": 61.28, "elapsed_time": "0:13:51", "remaining_time": "0:08:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 308, "total_steps": 501, "loss": 0.3382, "learning_rate": 4.14758452750074e-05, "epoch": 0.6147704590818364, "percentage": 61.48, "elapsed_time": "0:13:54", "remaining_time": "0:08:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 309, "total_steps": 501, "loss": 0.4246, "learning_rate": 4.149930799041392e-05, "epoch": 0.6167664670658682, "percentage": 61.68, "elapsed_time": "0:13:56", "remaining_time": "0:08:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 501, "loss": 0.4338, "learning_rate": 4.152269489723788e-05, "epoch": 0.6187624750499002, "percentage": 61.88, "elapsed_time": "0:13:58", "remaining_time": "0:08:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 311, "total_steps": 501, "loss": 0.3202, "learning_rate": 4.1546006483780626e-05, "epoch": 0.6207584830339321, "percentage": 62.08, "elapsed_time": "0:14:01", "remaining_time": "0:08:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 312, "total_steps": 501, "loss": 0.3778, "learning_rate": 4.156924323364072e-05, "epoch": 0.6227544910179641, "percentage": 62.28, "elapsed_time": "0:14:03", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 313, "total_steps": 501, "loss": 0.346, "learning_rate": 4.1592405625774144e-05, "epoch": 0.624750499001996, "percentage": 62.48, "elapsed_time": "0:14:05", "remaining_time": "0:08:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 314, "total_steps": 501, "loss": 0.3827, "learning_rate": 4.161549413455358e-05, "epoch": 0.626746506986028, "percentage": 62.67, "elapsed_time": "0:14:08", "remaining_time": "0:08:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 315, "total_steps": 501, "loss": 0.401, "learning_rate": 4.163850922982668e-05, "epoch": 0.6287425149700598, "percentage": 62.87, "elapsed_time": "0:14:10", "remaining_time": "0:08:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 316, "total_steps": 501, "loss": 0.376, "learning_rate": 4.16614513769734e-05, "epoch": 0.6307385229540918, "percentage": 63.07, "elapsed_time": "0:14:12", "remaining_time": "0:08:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 317, "total_steps": 501, "loss": 0.3638, "learning_rate": 4.1684321036962526e-05, "epoch": 0.6327345309381237, "percentage": 63.27, "elapsed_time": "0:14:15", "remaining_time": "0:08:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 318, "total_steps": 501, "loss": 0.3558, "learning_rate": 4.170711866640721e-05, "epoch": 0.6347305389221557, "percentage": 63.47, "elapsed_time": "0:14:17", "remaining_time": "0:08:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 319, "total_steps": 501, "loss": 0.4159, "learning_rate": 4.1729844717619684e-05, "epoch": 0.6367265469061876, "percentage": 63.67, "elapsed_time": "0:14:19", "remaining_time": "0:08:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 501, "loss": 0.3942, "learning_rate": 4.17524996386651e-05, "epoch": 0.6387225548902196, "percentage": 63.87, "elapsed_time": "0:14:22", "remaining_time": "0:08:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 321, "total_steps": 501, "loss": 0.3563, "learning_rate": 4.177508387341454e-05, "epoch": 0.6407185628742516, "percentage": 64.07, "elapsed_time": "0:14:24", "remaining_time": "0:08:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 322, "total_steps": 501, "loss": 0.4169, "learning_rate": 4.179759786159719e-05, "epoch": 0.6427145708582834, "percentage": 64.27, "elapsed_time": "0:14:26", "remaining_time": "0:08:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 323, "total_steps": 501, "loss": 0.3595, "learning_rate": 4.182004203885172e-05, "epoch": 0.6447105788423154, "percentage": 64.47, "elapsed_time": "0:14:29", "remaining_time": "0:07:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 324, "total_steps": 501, "loss": 0.3945, "learning_rate": 4.184241683677687e-05, "epoch": 0.6467065868263473, "percentage": 64.67, "elapsed_time": "0:14:31", "remaining_time": "0:07:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 325, "total_steps": 501, "loss": 0.3682, "learning_rate": 4.1864722682981245e-05, "epoch": 0.6487025948103793, "percentage": 64.87, "elapsed_time": "0:14:33", "remaining_time": "0:07:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 326, "total_steps": 501, "loss": 0.4012, "learning_rate": 4.188696000113232e-05, "epoch": 0.6506986027944112, "percentage": 65.07, "elapsed_time": "0:14:36", "remaining_time": "0:07:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 327, "total_steps": 501, "loss": 0.2982, "learning_rate": 4.190912921100477e-05, "epoch": 0.6526946107784432, "percentage": 65.27, "elapsed_time": "0:14:38", "remaining_time": "0:07:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 328, "total_steps": 501, "loss": 0.3767, "learning_rate": 4.1931230728527994e-05, "epoch": 0.654690618762475, "percentage": 65.47, "elapsed_time": "0:14:41", "remaining_time": "0:07:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 329, "total_steps": 501, "loss": 0.3918, "learning_rate": 4.195326496583291e-05, "epoch": 0.656686626746507, "percentage": 65.67, "elapsed_time": "0:14:43", "remaining_time": "0:07:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 501, "loss": 0.3727, "learning_rate": 4.1975232331298125e-05, "epoch": 0.6586826347305389, "percentage": 65.87, "elapsed_time": "0:14:45", "remaining_time": "0:07:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 331, "total_steps": 501, "loss": 0.4168, "learning_rate": 4.1997133229595316e-05, "epoch": 0.6606786427145709, "percentage": 66.07, "elapsed_time": "0:14:48", "remaining_time": "0:07:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 332, "total_steps": 501, "loss": 0.406, "learning_rate": 4.201896806173394e-05, "epoch": 0.6626746506986028, "percentage": 66.27, "elapsed_time": "0:14:50", "remaining_time": "0:07:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 333, "total_steps": 501, "loss": 0.3348, "learning_rate": 4.2040737225105335e-05, "epoch": 0.6646706586826348, "percentage": 66.47, "elapsed_time": "0:14:52", "remaining_time": "0:07:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 334, "total_steps": 501, "loss": 0.3134, "learning_rate": 4.206244111352608e-05, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:14:55", "remaining_time": "0:07:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 335, "total_steps": 501, "loss": 0.3855, "learning_rate": 4.2084080117280756e-05, "epoch": 0.6686626746506986, "percentage": 66.87, "elapsed_time": "0:14:57", "remaining_time": "0:07:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 336, "total_steps": 501, "loss": 0.4388, "learning_rate": 4.210565462316407e-05, "epoch": 0.6706586826347305, "percentage": 67.07, "elapsed_time": "0:14:59", "remaining_time": "0:07:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 337, "total_steps": 501, "loss": 0.4084, "learning_rate": 4.2127165014522315e-05, "epoch": 0.6726546906187625, "percentage": 67.27, "elapsed_time": "0:15:02", "remaining_time": "0:07:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 338, "total_steps": 501, "loss": 0.3971, "learning_rate": 4.214861167129425e-05, "epoch": 0.6746506986027944, "percentage": 67.47, "elapsed_time": "0:15:04", "remaining_time": "0:07:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 339, "total_steps": 501, "loss": 0.3184, "learning_rate": 4.2169994970051365e-05, "epoch": 0.6766467065868264, "percentage": 67.66, "elapsed_time": "0:15:06", "remaining_time": "0:07:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 501, "loss": 0.4085, "learning_rate": 4.219131528403759e-05, "epoch": 0.6786427145708582, "percentage": 67.86, "elapsed_time": "0:15:09", "remaining_time": "0:07:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 341, "total_steps": 501, "loss": 0.3799, "learning_rate": 4.22125729832083e-05, "epoch": 0.6806387225548902, "percentage": 68.06, "elapsed_time": "0:15:11", "remaining_time": "0:07:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 342, "total_steps": 501, "loss": 0.3615, "learning_rate": 4.2233768434268914e-05, "epoch": 0.6826347305389222, "percentage": 68.26, "elapsed_time": "0:15:13", "remaining_time": "0:07:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 343, "total_steps": 501, "loss": 0.397, "learning_rate": 4.225490200071284e-05, "epoch": 0.6846307385229541, "percentage": 68.46, "elapsed_time": "0:15:16", "remaining_time": "0:07:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 344, "total_steps": 501, "loss": 0.3192, "learning_rate": 4.227597404285883e-05, "epoch": 0.6866267465069861, "percentage": 68.66, "elapsed_time": "0:15:18", "remaining_time": "0:06:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 345, "total_steps": 501, "loss": 0.3409, "learning_rate": 4.229698491788791e-05, "epoch": 0.688622754491018, "percentage": 68.86, "elapsed_time": "0:15:20", "remaining_time": "0:06:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 346, "total_steps": 501, "loss": 0.3506, "learning_rate": 4.231793497987961e-05, "epoch": 0.6906187624750499, "percentage": 69.06, "elapsed_time": "0:15:23", "remaining_time": "0:06:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 347, "total_steps": 501, "loss": 0.3697, "learning_rate": 4.2338824579847904e-05, "epoch": 0.6926147704590818, "percentage": 69.26, "elapsed_time": "0:15:25", "remaining_time": "0:06:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 348, "total_steps": 501, "loss": 0.4179, "learning_rate": 4.235965406577636e-05, "epoch": 0.6946107784431138, "percentage": 69.46, "elapsed_time": "0:15:27", "remaining_time": "0:06:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 349, "total_steps": 501, "loss": 0.358, "learning_rate": 4.2380423782653e-05, "epoch": 0.6966067864271457, "percentage": 69.66, "elapsed_time": "0:15:30", "remaining_time": "0:06:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 501, "loss": 0.4223, "learning_rate": 4.240113407250459e-05, "epoch": 0.6986027944111777, "percentage": 69.86, "elapsed_time": "0:15:32", "remaining_time": "0:06:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 351, "total_steps": 501, "loss": 0.4283, "learning_rate": 4.24217852744304e-05, "epoch": 0.7005988023952096, "percentage": 70.06, "elapsed_time": "0:15:34", "remaining_time": "0:06:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 352, "total_steps": 501, "loss": 0.3277, "learning_rate": 4.244237772463552e-05, "epoch": 0.7025948103792415, "percentage": 70.26, "elapsed_time": "0:15:37", "remaining_time": "0:06:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 353, "total_steps": 501, "loss": 0.3153, "learning_rate": 4.246291175646371e-05, "epoch": 0.7045908183632734, "percentage": 70.46, "elapsed_time": "0:15:39", "remaining_time": "0:06:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 354, "total_steps": 501, "loss": 0.2934, "learning_rate": 4.24833877004298e-05, "epoch": 0.7065868263473054, "percentage": 70.66, "elapsed_time": "0:15:41", "remaining_time": "0:06:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 355, "total_steps": 501, "loss": 0.2647, "learning_rate": 4.250380588425157e-05, "epoch": 0.7085828343313373, "percentage": 70.86, "elapsed_time": "0:15:44", "remaining_time": "0:06:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 356, "total_steps": 501, "loss": 0.3777, "learning_rate": 4.2524166632881255e-05, "epoch": 0.7105788423153693, "percentage": 71.06, "elapsed_time": "0:15:46", "remaining_time": "0:06:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 357, "total_steps": 501, "loss": 0.2874, "learning_rate": 4.254447026853656e-05, "epoch": 0.7125748502994012, "percentage": 71.26, "elapsed_time": "0:15:48", "remaining_time": "0:06:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 358, "total_steps": 501, "loss": 0.3137, "learning_rate": 4.2564717110731244e-05, "epoch": 0.7145708582834331, "percentage": 71.46, "elapsed_time": "0:15:51", "remaining_time": "0:06:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 359, "total_steps": 501, "loss": 0.3366, "learning_rate": 4.258490747630532e-05, "epoch": 0.716566866267465, "percentage": 71.66, "elapsed_time": "0:15:53", "remaining_time": "0:06:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 501, "loss": 0.367, "learning_rate": 4.260504167945479e-05, "epoch": 0.718562874251497, "percentage": 71.86, "elapsed_time": "0:15:55", "remaining_time": "0:06:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 361, "total_steps": 501, "loss": 0.3473, "learning_rate": 4.2625120031760965e-05, "epoch": 0.720558882235529, "percentage": 72.06, "elapsed_time": "0:15:58", "remaining_time": "0:06:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 362, "total_steps": 501, "loss": 0.3477, "learning_rate": 4.264514284221944e-05, "epoch": 0.7225548902195609, "percentage": 72.26, "elapsed_time": "0:16:00", "remaining_time": "0:06:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 363, "total_steps": 501, "loss": 0.3818, "learning_rate": 4.266511041726854e-05, "epoch": 0.7245508982035929, "percentage": 72.46, "elapsed_time": "0:16:02", "remaining_time": "0:06:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 364, "total_steps": 501, "loss": 0.3959, "learning_rate": 4.26850230608176e-05, "epoch": 0.7265469061876247, "percentage": 72.65, "elapsed_time": "0:16:05", "remaining_time": "0:06:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 365, "total_steps": 501, "loss": 0.3484, "learning_rate": 4.2704881074274584e-05, "epoch": 0.7285429141716567, "percentage": 72.85, "elapsed_time": "0:16:07", "remaining_time": "0:06:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 366, "total_steps": 501, "loss": 0.3315, "learning_rate": 4.272468475657351e-05, "epoch": 0.7305389221556886, "percentage": 73.05, "elapsed_time": "0:16:09", "remaining_time": "0:05:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 367, "total_steps": 501, "loss": 0.3806, "learning_rate": 4.2744434404201497e-05, "epoch": 0.7325349301397206, "percentage": 73.25, "elapsed_time": "0:16:12", "remaining_time": "0:05:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 368, "total_steps": 501, "loss": 0.3889, "learning_rate": 4.27641303112253e-05, "epoch": 0.7345309381237525, "percentage": 73.45, "elapsed_time": "0:16:14", "remaining_time": "0:05:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 369, "total_steps": 501, "loss": 0.2647, "learning_rate": 4.278377276931767e-05, "epoch": 0.7365269461077845, "percentage": 73.65, "elapsed_time": "0:16:16", "remaining_time": "0:05:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 501, "loss": 0.3912, "learning_rate": 4.2803362067783256e-05, "epoch": 0.7385229540918163, "percentage": 73.85, "elapsed_time": "0:16:19", "remaining_time": "0:05:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 371, "total_steps": 501, "loss": 0.4216, "learning_rate": 4.2822898493584104e-05, "epoch": 0.7405189620758483, "percentage": 74.05, "elapsed_time": "0:16:21", "remaining_time": "0:05:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 372, "total_steps": 501, "loss": 0.395, "learning_rate": 4.284238233136496e-05, "epoch": 0.7425149700598802, "percentage": 74.25, "elapsed_time": "0:16:24", "remaining_time": "0:05:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 373, "total_steps": 501, "loss": 0.3683, "learning_rate": 4.286181386347813e-05, "epoch": 0.7445109780439122, "percentage": 74.45, "elapsed_time": "0:16:26", "remaining_time": "0:05:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 374, "total_steps": 501, "loss": 0.3518, "learning_rate": 4.288119337000801e-05, "epoch": 0.7465069860279441, "percentage": 74.65, "elapsed_time": "0:16:28", "remaining_time": "0:05:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 375, "total_steps": 501, "loss": 0.4018, "learning_rate": 4.2900521128795315e-05, "epoch": 0.7485029940119761, "percentage": 74.85, "elapsed_time": "0:16:31", "remaining_time": "0:05:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 376, "total_steps": 501, "loss": 0.3719, "learning_rate": 4.291979741546102e-05, "epoch": 0.7504990019960079, "percentage": 75.05, "elapsed_time": "0:16:33", "remaining_time": "0:05:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 377, "total_steps": 501, "loss": 0.3623, "learning_rate": 4.293902250342989e-05, "epoch": 0.7524950099800399, "percentage": 75.25, "elapsed_time": "0:16:35", "remaining_time": "0:05:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 378, "total_steps": 501, "loss": 0.3945, "learning_rate": 4.295819666395376e-05, "epoch": 0.7544910179640718, "percentage": 75.45, "elapsed_time": "0:16:38", "remaining_time": "0:05:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 379, "total_steps": 501, "loss": 0.4585, "learning_rate": 4.297732016613454e-05, "epoch": 0.7564870259481038, "percentage": 75.65, "elapsed_time": "0:16:40", "remaining_time": "0:05:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 501, "loss": 0.4261, "learning_rate": 4.299639327694684e-05, "epoch": 0.7584830339321357, "percentage": 75.85, "elapsed_time": "0:16:42", "remaining_time": "0:05:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 381, "total_steps": 501, "loss": 0.336, "learning_rate": 4.3015416261260325e-05, "epoch": 0.7604790419161677, "percentage": 76.05, "elapsed_time": "0:16:45", "remaining_time": "0:05:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 382, "total_steps": 501, "loss": 0.3949, "learning_rate": 4.303438938186182e-05, "epoch": 0.7624750499001997, "percentage": 76.25, "elapsed_time": "0:16:47", "remaining_time": "0:05:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 383, "total_steps": 501, "loss": 0.348, "learning_rate": 4.305331289947705e-05, "epoch": 0.7644710578842315, "percentage": 76.45, "elapsed_time": "0:16:49", "remaining_time": "0:05:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 384, "total_steps": 501, "loss": 0.3715, "learning_rate": 4.3072187072792184e-05, "epoch": 0.7664670658682635, "percentage": 76.65, "elapsed_time": "0:16:52", "remaining_time": "0:05:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 385, "total_steps": 501, "loss": 0.3471, "learning_rate": 4.309101215847502e-05, "epoch": 0.7684630738522954, "percentage": 76.85, "elapsed_time": "0:16:54", "remaining_time": "0:05:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 386, "total_steps": 501, "loss": 0.3721, "learning_rate": 4.3109788411195924e-05, "epoch": 0.7704590818363274, "percentage": 77.05, "elapsed_time": "0:16:56", "remaining_time": "0:05:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 387, "total_steps": 501, "loss": 0.3501, "learning_rate": 4.312851608364853e-05, "epoch": 0.7724550898203593, "percentage": 77.25, "elapsed_time": "0:16:59", "remaining_time": "0:05:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 388, "total_steps": 501, "loss": 0.3446, "learning_rate": 4.314719542657013e-05, "epoch": 0.7744510978043913, "percentage": 77.45, "elapsed_time": "0:17:01", "remaining_time": "0:04:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 389, "total_steps": 501, "loss": 0.31, "learning_rate": 4.3165826688761796e-05, "epoch": 0.7764471057884231, "percentage": 77.64, "elapsed_time": "0:17:03", "remaining_time": "0:04:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 501, "loss": 0.3356, "learning_rate": 4.318441011710833e-05, "epoch": 0.7784431137724551, "percentage": 77.84, "elapsed_time": "0:17:06", "remaining_time": "0:04:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 391, "total_steps": 501, "loss": 0.3543, "learning_rate": 4.3202945956597786e-05, "epoch": 0.780439121756487, "percentage": 78.04, "elapsed_time": "0:17:08", "remaining_time": "0:04:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 392, "total_steps": 501, "loss": 0.3157, "learning_rate": 4.3221434450340956e-05, "epoch": 0.782435129740519, "percentage": 78.24, "elapsed_time": "0:17:10", "remaining_time": "0:04:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 393, "total_steps": 501, "loss": 0.3533, "learning_rate": 4.323987583959045e-05, "epoch": 0.7844311377245509, "percentage": 78.44, "elapsed_time": "0:17:13", "remaining_time": "0:04:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 394, "total_steps": 501, "loss": 0.3742, "learning_rate": 4.325827036375957e-05, "epoch": 0.7864271457085829, "percentage": 78.64, "elapsed_time": "0:17:15", "remaining_time": "0:04:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 395, "total_steps": 501, "loss": 0.3472, "learning_rate": 4.327661826044101e-05, "epoch": 0.7884231536926147, "percentage": 78.84, "elapsed_time": "0:17:17", "remaining_time": "0:04:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 396, "total_steps": 501, "loss": 0.359, "learning_rate": 4.329491976542521e-05, "epoch": 0.7904191616766467, "percentage": 79.04, "elapsed_time": "0:17:20", "remaining_time": "0:04:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 397, "total_steps": 501, "loss": 0.4445, "learning_rate": 4.331317511271859e-05, "epoch": 0.7924151696606786, "percentage": 79.24, "elapsed_time": "0:17:22", "remaining_time": "0:04:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 398, "total_steps": 501, "loss": 0.3213, "learning_rate": 4.333138453456147e-05, "epoch": 0.7944111776447106, "percentage": 79.44, "elapsed_time": "0:17:24", "remaining_time": "0:04:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 399, "total_steps": 501, "loss": 0.3359, "learning_rate": 4.334954826144581e-05, "epoch": 0.7964071856287425, "percentage": 79.64, "elapsed_time": "0:17:27", "remaining_time": "0:04:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 501, "loss": 0.3542, "learning_rate": 4.336766652213271e-05, "epoch": 0.7984031936127745, "percentage": 79.84, "elapsed_time": "0:17:29", "remaining_time": "0:04:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 401, "total_steps": 501, "loss": 0.3642, "learning_rate": 4.338573954366971e-05, "epoch": 0.8003992015968064, "percentage": 80.04, "elapsed_time": "0:18:04", "remaining_time": "0:04:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 402, "total_steps": 501, "loss": 0.3603, "learning_rate": 4.340376755140784e-05, "epoch": 0.8023952095808383, "percentage": 80.24, "elapsed_time": "0:18:06", "remaining_time": "0:04:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 403, "total_steps": 501, "loss": 0.3817, "learning_rate": 4.342175076901849e-05, "epoch": 0.8043912175648703, "percentage": 80.44, "elapsed_time": "0:18:09", "remaining_time": "0:04:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 404, "total_steps": 501, "loss": 0.3017, "learning_rate": 4.343968941851009e-05, "epoch": 0.8063872255489022, "percentage": 80.64, "elapsed_time": "0:18:11", "remaining_time": "0:04:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 405, "total_steps": 501, "loss": 0.3949, "learning_rate": 4.345758372024448e-05, "epoch": 0.8083832335329342, "percentage": 80.84, "elapsed_time": "0:18:13", "remaining_time": "0:04:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 406, "total_steps": 501, "loss": 0.3668, "learning_rate": 4.347543389295324e-05, "epoch": 0.810379241516966, "percentage": 81.04, "elapsed_time": "0:18:16", "remaining_time": "0:04:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 407, "total_steps": 501, "loss": 0.3499, "learning_rate": 4.3493240153753666e-05, "epoch": 0.812375249500998, "percentage": 81.24, "elapsed_time": "0:18:18", "remaining_time": "0:04:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 408, "total_steps": 501, "loss": 0.3304, "learning_rate": 4.3511002718164666e-05, "epoch": 0.8143712574850299, "percentage": 81.44, "elapsed_time": "0:18:20", "remaining_time": "0:04:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 409, "total_steps": 501, "loss": 0.3337, "learning_rate": 4.352872180012237e-05, "epoch": 0.8163672654690619, "percentage": 81.64, "elapsed_time": "0:18:23", "remaining_time": "0:04:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 501, "loss": 0.4502, "learning_rate": 4.35463976119956e-05, "epoch": 0.8183632734530938, "percentage": 81.84, "elapsed_time": "0:18:25", "remaining_time": "0:04:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 411, "total_steps": 501, "loss": 0.4128, "learning_rate": 4.356403036460115e-05, "epoch": 0.8203592814371258, "percentage": 82.04, "elapsed_time": "0:18:27", "remaining_time": "0:04:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 412, "total_steps": 501, "loss": 0.3341, "learning_rate": 4.3581620267218916e-05, "epoch": 0.8223552894211577, "percentage": 82.24, "elapsed_time": "0:18:30", "remaining_time": "0:03:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 413, "total_steps": 501, "loss": 0.3498, "learning_rate": 4.359916752760669e-05, "epoch": 0.8243512974051896, "percentage": 82.44, "elapsed_time": "0:18:32", "remaining_time": "0:03:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 414, "total_steps": 501, "loss": 0.3796, "learning_rate": 4.361667235201499e-05, "epoch": 0.8263473053892215, "percentage": 82.63, "elapsed_time": "0:18:34", "remaining_time": "0:03:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 415, "total_steps": 501, "loss": 0.3911, "learning_rate": 4.363413494520154e-05, "epoch": 0.8283433133732535, "percentage": 82.83, "elapsed_time": "0:18:37", "remaining_time": "0:03:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 416, "total_steps": 501, "loss": 0.367, "learning_rate": 4.365155551044572e-05, "epoch": 0.8303393213572854, "percentage": 83.03, "elapsed_time": "0:18:39", "remaining_time": "0:03:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 417, "total_steps": 501, "loss": 0.289, "learning_rate": 4.366893424956263e-05, "epoch": 0.8323353293413174, "percentage": 83.23, "elapsed_time": "0:18:41", "remaining_time": "0:03:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 418, "total_steps": 501, "loss": 0.2747, "learning_rate": 4.368627136291726e-05, "epoch": 0.8343313373253493, "percentage": 83.43, "elapsed_time": "0:18:44", "remaining_time": "0:03:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 419, "total_steps": 501, "loss": 0.3435, "learning_rate": 4.370356704943825e-05, "epoch": 0.8363273453093812, "percentage": 83.63, "elapsed_time": "0:18:46", "remaining_time": "0:03:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 501, "loss": 0.3645, "learning_rate": 4.372082150663168e-05, "epoch": 0.8383233532934131, "percentage": 83.83, "elapsed_time": "0:18:48", "remaining_time": "0:03:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 421, "total_steps": 501, "loss": 0.3672, "learning_rate": 4.3738034930594475e-05, "epoch": 0.8403193612774451, "percentage": 84.03, "elapsed_time": "0:18:51", "remaining_time": "0:03:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 422, "total_steps": 501, "loss": 0.3806, "learning_rate": 4.3755207516027904e-05, "epoch": 0.8423153692614771, "percentage": 84.23, "elapsed_time": "0:18:53", "remaining_time": "0:03:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 423, "total_steps": 501, "loss": 0.4031, "learning_rate": 4.377233945625071e-05, "epoch": 0.844311377245509, "percentage": 84.43, "elapsed_time": "0:18:55", "remaining_time": "0:03:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 424, "total_steps": 501, "loss": 0.3628, "learning_rate": 4.378943094321221e-05, "epoch": 0.846307385229541, "percentage": 84.63, "elapsed_time": "0:18:58", "remaining_time": "0:03:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 425, "total_steps": 501, "loss": 0.3434, "learning_rate": 4.3806482167505196e-05, "epoch": 0.8483033932135728, "percentage": 84.83, "elapsed_time": "0:19:00", "remaining_time": "0:03:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 426, "total_steps": 501, "loss": 0.3803, "learning_rate": 4.382349331837866e-05, "epoch": 0.8502994011976048, "percentage": 85.03, "elapsed_time": "0:19:02", "remaining_time": "0:03:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 427, "total_steps": 501, "loss": 0.3627, "learning_rate": 4.3840464583750404e-05, "epoch": 0.8522954091816367, "percentage": 85.23, "elapsed_time": "0:19:05", "remaining_time": "0:03:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 428, "total_steps": 501, "loss": 0.395, "learning_rate": 4.385739615021954e-05, "epoch": 0.8542914171656687, "percentage": 85.43, "elapsed_time": "0:19:07", "remaining_time": "0:03:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 429, "total_steps": 501, "loss": 0.3627, "learning_rate": 4.387428820307874e-05, "epoch": 0.8562874251497006, "percentage": 85.63, "elapsed_time": "0:19:09", "remaining_time": "0:03:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 430, "total_steps": 501, "loss": 0.3166, "learning_rate": 4.3891140926326446e-05, "epoch": 0.8582834331337326, "percentage": 85.83, "elapsed_time": "0:19:12", "remaining_time": "0:03:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 431, "total_steps": 501, "loss": 0.3634, "learning_rate": 4.390795450267886e-05, "epoch": 0.8602794411177644, "percentage": 86.03, "elapsed_time": "0:19:14", "remaining_time": "0:03:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 432, "total_steps": 501, "loss": 0.3103, "learning_rate": 4.3924729113581876e-05, "epoch": 0.8622754491017964, "percentage": 86.23, "elapsed_time": "0:19:16", "remaining_time": "0:03:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 433, "total_steps": 501, "loss": 0.3551, "learning_rate": 4.394146493922276e-05, "epoch": 0.8642714570858283, "percentage": 86.43, "elapsed_time": "0:19:19", "remaining_time": "0:03:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 434, "total_steps": 501, "loss": 0.3433, "learning_rate": 4.395816215854185e-05, "epoch": 0.8662674650698603, "percentage": 86.63, "elapsed_time": "0:19:21", "remaining_time": "0:02:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 435, "total_steps": 501, "loss": 0.3748, "learning_rate": 4.397482094924396e-05, "epoch": 0.8682634730538922, "percentage": 86.83, "elapsed_time": "0:19:23", "remaining_time": "0:02:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 436, "total_steps": 501, "loss": 0.3988, "learning_rate": 4.399144148780977e-05, "epoch": 0.8702594810379242, "percentage": 87.03, "elapsed_time": "0:19:26", "remaining_time": "0:02:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 437, "total_steps": 501, "loss": 0.3821, "learning_rate": 4.400802394950703e-05, "epoch": 0.872255489021956, "percentage": 87.23, "elapsed_time": "0:19:28", "remaining_time": "0:02:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 438, "total_steps": 501, "loss": 0.3212, "learning_rate": 4.402456850840166e-05, "epoch": 0.874251497005988, "percentage": 87.43, "elapsed_time": "0:19:31", "remaining_time": "0:02:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 439, "total_steps": 501, "loss": 0.3014, "learning_rate": 4.4041075337368695e-05, "epoch": 0.8762475049900199, "percentage": 87.62, "elapsed_time": "0:19:33", "remaining_time": "0:02:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 440, "total_steps": 501, "loss": 0.3363, "learning_rate": 4.405754460810312e-05, "epoch": 0.8782435129740519, "percentage": 87.82, "elapsed_time": "0:19:35", "remaining_time": "0:02:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 441, "total_steps": 501, "loss": 0.3706, "learning_rate": 4.407397649113065e-05, "epoch": 0.8802395209580839, "percentage": 88.02, "elapsed_time": "0:19:38", "remaining_time": "0:02:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 442, "total_steps": 501, "loss": 0.3625, "learning_rate": 4.40903711558182e-05, "epoch": 0.8822355289421158, "percentage": 88.22, "elapsed_time": "0:19:40", "remaining_time": "0:02:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 443, "total_steps": 501, "loss": 0.3459, "learning_rate": 4.41067287703845e-05, "epoch": 0.8842315369261478, "percentage": 88.42, "elapsed_time": "0:19:42", "remaining_time": "0:02:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 444, "total_steps": 501, "loss": 0.3863, "learning_rate": 4.412304950191033e-05, "epoch": 0.8862275449101796, "percentage": 88.62, "elapsed_time": "0:19:45", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 445, "total_steps": 501, "loss": 0.3873, "learning_rate": 4.413933351634886e-05, "epoch": 0.8882235528942116, "percentage": 88.82, "elapsed_time": "0:19:47", "remaining_time": "0:02:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 446, "total_steps": 501, "loss": 0.3199, "learning_rate": 4.4155580978535707e-05, "epoch": 0.8902195608782435, "percentage": 89.02, "elapsed_time": "0:19:49", "remaining_time": "0:02:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 447, "total_steps": 501, "loss": 0.3679, "learning_rate": 4.417179205219895e-05, "epoch": 0.8922155688622755, "percentage": 89.22, "elapsed_time": "0:19:52", "remaining_time": "0:02:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 448, "total_steps": 501, "loss": 0.2962, "learning_rate": 4.418796689996907e-05, "epoch": 0.8942115768463074, "percentage": 89.42, "elapsed_time": "0:19:54", "remaining_time": "0:02:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 449, "total_steps": 501, "loss": 0.4021, "learning_rate": 4.420410568338872e-05, "epoch": 0.8962075848303394, "percentage": 89.62, "elapsed_time": "0:19:56", "remaining_time": "0:02:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 450, "total_steps": 501, "loss": 0.3129, "learning_rate": 4.42202085629224e-05, "epoch": 0.8982035928143712, "percentage": 89.82, "elapsed_time": "0:19:59", "remaining_time": "0:02:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 451, "total_steps": 501, "loss": 0.3672, "learning_rate": 4.423627569796601e-05, "epoch": 0.9001996007984032, "percentage": 90.02, "elapsed_time": "0:20:01", "remaining_time": "0:02:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 452, "total_steps": 501, "loss": 0.4024, "learning_rate": 4.425230724685638e-05, "epoch": 0.9021956087824351, "percentage": 90.22, "elapsed_time": "0:20:03", "remaining_time": "0:02:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 453, "total_steps": 501, "loss": 0.355, "learning_rate": 4.4268303366880536e-05, "epoch": 0.9041916167664671, "percentage": 90.42, "elapsed_time": "0:20:06", "remaining_time": "0:02:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 454, "total_steps": 501, "loss": 0.4207, "learning_rate": 4.428426421428507e-05, "epoch": 0.906187624750499, "percentage": 90.62, "elapsed_time": "0:20:08", "remaining_time": "0:02:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 455, "total_steps": 501, "loss": 0.3068, "learning_rate": 4.430018994428521e-05, "epoch": 0.908183632734531, "percentage": 90.82, "elapsed_time": "0:20:10", "remaining_time": "0:02:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 456, "total_steps": 501, "loss": 0.3828, "learning_rate": 4.431608071107392e-05, "epoch": 0.9101796407185628, "percentage": 91.02, "elapsed_time": "0:20:13", "remaining_time": "0:01:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 457, "total_steps": 501, "loss": 0.3921, "learning_rate": 4.433193666783084e-05, "epoch": 0.9121756487025948, "percentage": 91.22, "elapsed_time": "0:20:15", "remaining_time": "0:01:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 458, "total_steps": 501, "loss": 0.2997, "learning_rate": 4.4347757966731156e-05, "epoch": 0.9141716566866267, "percentage": 91.42, "elapsed_time": "0:20:17", "remaining_time": "0:01:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 459, "total_steps": 501, "loss": 0.3478, "learning_rate": 4.436354475895436e-05, "epoch": 0.9161676646706587, "percentage": 91.62, "elapsed_time": "0:20:20", "remaining_time": "0:01:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 460, "total_steps": 501, "loss": 0.317, "learning_rate": 4.437929719469291e-05, "epoch": 0.9181636726546906, "percentage": 91.82, "elapsed_time": "0:20:22", "remaining_time": "0:01:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 461, "total_steps": 501, "loss": 0.3268, "learning_rate": 4.4395015423160807e-05, "epoch": 0.9201596806387226, "percentage": 92.02, "elapsed_time": "0:20:24", "remaining_time": "0:01:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 462, "total_steps": 501, "loss": 0.3791, "learning_rate": 4.4410699592602094e-05, "epoch": 0.9221556886227545, "percentage": 92.22, "elapsed_time": "0:20:27", "remaining_time": "0:01:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 463, "total_steps": 501, "loss": 0.36, "learning_rate": 4.442634985029922e-05, "epoch": 0.9241516966067864, "percentage": 92.42, "elapsed_time": "0:20:29", "remaining_time": "0:01:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 464, "total_steps": 501, "loss": 0.379, "learning_rate": 4.444196634258136e-05, "epoch": 0.9261477045908184, "percentage": 92.61, "elapsed_time": "0:20:31", "remaining_time": "0:01:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 465, "total_steps": 501, "loss": 0.3696, "learning_rate": 4.4457549214832566e-05, "epoch": 0.9281437125748503, "percentage": 92.81, "elapsed_time": "0:20:34", "remaining_time": "0:01:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 466, "total_steps": 501, "loss": 0.345, "learning_rate": 4.44730986115e-05, "epoch": 0.9301397205588823, "percentage": 93.01, "elapsed_time": "0:20:36", "remaining_time": "0:01:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 467, "total_steps": 501, "loss": 0.4367, "learning_rate": 4.448861467610187e-05, "epoch": 0.9321357285429142, "percentage": 93.21, "elapsed_time": "0:20:38", "remaining_time": "0:01:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 468, "total_steps": 501, "loss": 0.3615, "learning_rate": 4.4504097551235406e-05, "epoch": 0.9341317365269461, "percentage": 93.41, "elapsed_time": "0:20:41", "remaining_time": "0:01:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 469, "total_steps": 501, "loss": 0.2511, "learning_rate": 4.4519547378584725e-05, "epoch": 0.936127744510978, "percentage": 93.61, "elapsed_time": "0:20:43", "remaining_time": "0:01:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 470, "total_steps": 501, "loss": 0.3438, "learning_rate": 4.453496429892863e-05, "epoch": 0.93812375249501, "percentage": 93.81, "elapsed_time": "0:20:45", "remaining_time": "0:01:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 471, "total_steps": 501, "loss": 0.4078, "learning_rate": 4.455034845214827e-05, "epoch": 0.9401197604790419, "percentage": 94.01, "elapsed_time": "0:20:48", "remaining_time": "0:01:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 472, "total_steps": 501, "loss": 0.3297, "learning_rate": 4.4565699977234796e-05, "epoch": 0.9421157684630739, "percentage": 94.21, "elapsed_time": "0:20:50", "remaining_time": "0:01:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 473, "total_steps": 501, "loss": 0.3305, "learning_rate": 4.458101901229686e-05, "epoch": 0.9441117764471058, "percentage": 94.41, "elapsed_time": "0:20:53", "remaining_time": "0:01:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 474, "total_steps": 501, "loss": 0.345, "learning_rate": 4.459630569456809e-05, "epoch": 0.9461077844311377, "percentage": 94.61, "elapsed_time": "0:20:55", "remaining_time": "0:01:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 475, "total_steps": 501, "loss": 0.4174, "learning_rate": 4.461156016041444e-05, "epoch": 0.9481037924151696, "percentage": 94.81, "elapsed_time": "0:20:57", "remaining_time": "0:01:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 476, "total_steps": 501, "loss": 0.3657, "learning_rate": 4.462678254534156e-05, "epoch": 0.9500998003992016, "percentage": 95.01, "elapsed_time": "0:21:00", "remaining_time": "0:01:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 477, "total_steps": 501, "loss": 0.3401, "learning_rate": 4.464197298400191e-05, "epoch": 0.9520958083832335, "percentage": 95.21, "elapsed_time": "0:21:02", "remaining_time": "0:01:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 478, "total_steps": 501, "loss": 0.316, "learning_rate": 4.4657131610201994e-05, "epoch": 0.9540918163672655, "percentage": 95.41, "elapsed_time": "0:21:04", "remaining_time": "0:01:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 479, "total_steps": 501, "loss": 0.4096, "learning_rate": 4.467225855690939e-05, "epoch": 0.9560878243512974, "percentage": 95.61, "elapsed_time": "0:21:07", "remaining_time": "0:00:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 480, "total_steps": 501, "loss": 0.4383, "learning_rate": 4.468735395625979e-05, "epoch": 0.9580838323353293, "percentage": 95.81, "elapsed_time": "0:21:09", "remaining_time": "0:00:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 481, "total_steps": 501, "loss": 0.3269, "learning_rate": 4.470241793956387e-05, "epoch": 0.9600798403193613, "percentage": 96.01, "elapsed_time": "0:21:11", "remaining_time": "0:00:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 482, "total_steps": 501, "loss": 0.338, "learning_rate": 4.471745063731416e-05, "epoch": 0.9620758483033932, "percentage": 96.21, "elapsed_time": "0:21:14", "remaining_time": "0:00:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 483, "total_steps": 501, "loss": 0.3583, "learning_rate": 4.473245217919187e-05, "epoch": 0.9640718562874252, "percentage": 96.41, "elapsed_time": "0:21:16", "remaining_time": "0:00:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 484, "total_steps": 501, "loss": 0.333, "learning_rate": 4.474742269407355e-05, "epoch": 0.9660678642714571, "percentage": 96.61, "elapsed_time": "0:21:18", "remaining_time": "0:00:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 485, "total_steps": 501, "loss": 0.388, "learning_rate": 4.476236231003773e-05, "epoch": 0.9680638722554891, "percentage": 96.81, "elapsed_time": "0:21:21", "remaining_time": "0:00:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 486, "total_steps": 501, "loss": 0.3867, "learning_rate": 4.477727115437156e-05, "epoch": 0.9700598802395209, "percentage": 97.01, "elapsed_time": "0:21:23", "remaining_time": "0:00:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 487, "total_steps": 501, "loss": 0.312, "learning_rate": 4.479214935357724e-05, "epoch": 0.9720558882235529, "percentage": 97.21, "elapsed_time": "0:21:25", "remaining_time": "0:00:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 488, "total_steps": 501, "loss": 0.4059, "learning_rate": 4.480699703337852e-05, "epoch": 0.9740518962075848, "percentage": 97.41, "elapsed_time": "0:21:28", "remaining_time": "0:00:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 489, "total_steps": 501, "loss": 0.3789, "learning_rate": 4.4821814318727016e-05, "epoch": 0.9760479041916168, "percentage": 97.6, "elapsed_time": "0:21:30", "remaining_time": "0:00:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 490, "total_steps": 501, "loss": 0.3354, "learning_rate": 4.483660133380856e-05, "epoch": 0.9780439121756487, "percentage": 97.8, "elapsed_time": "0:21:32", "remaining_time": "0:00:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 491, "total_steps": 501, "loss": 0.3842, "learning_rate": 4.485135820204948e-05, "epoch": 0.9800399201596807, "percentage": 98.0, "elapsed_time": "0:21:35", "remaining_time": "0:00:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 492, "total_steps": 501, "loss": 0.432, "learning_rate": 4.486608504612267e-05, "epoch": 0.9820359281437125, "percentage": 98.2, "elapsed_time": "0:21:37", "remaining_time": "0:00:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 493, "total_steps": 501, "loss": 0.3503, "learning_rate": 4.488078198795383e-05, "epoch": 0.9840319361277445, "percentage": 98.4, "elapsed_time": "0:21:39", "remaining_time": "0:00:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 494, "total_steps": 501, "loss": 0.354, "learning_rate": 4.489544914872745e-05, "epoch": 0.9860279441117764, "percentage": 98.6, "elapsed_time": "0:21:42", "remaining_time": "0:00:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 495, "total_steps": 501, "loss": 0.3528, "learning_rate": 4.4910086648892815e-05, "epoch": 0.9880239520958084, "percentage": 98.8, "elapsed_time": "0:21:44", "remaining_time": "0:00:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 496, "total_steps": 501, "loss": 0.3698, "learning_rate": 4.4924694608169965e-05, "epoch": 0.9900199600798403, "percentage": 99.0, "elapsed_time": "0:21:46", "remaining_time": "0:00:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 497, "total_steps": 501, "loss": 0.3878, "learning_rate": 4.4939273145555536e-05, "epoch": 0.9920159680638723, "percentage": 99.2, "elapsed_time": "0:21:49", "remaining_time": "0:00:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 498, "total_steps": 501, "loss": 0.3155, "learning_rate": 4.495382237932863e-05, "epoch": 0.9940119760479041, "percentage": 99.4, "elapsed_time": "0:21:51", "remaining_time": "0:00:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 499, "total_steps": 501, "loss": 0.3425, "learning_rate": 4.4968342427056505e-05, "epoch": 0.9960079840319361, "percentage": 99.6, "elapsed_time": "0:21:53", "remaining_time": "0:00:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 500, "total_steps": 501, "loss": 0.3599, "learning_rate": 4.498283340560031e-05, "epoch": 0.998003992015968, "percentage": 99.8, "elapsed_time": "0:21:56", "remaining_time": "0:00:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 501, "total_steps": 501, "loss": 0.3201, "learning_rate": 4.499729543112076e-05, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:22:35", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 501, "total_steps": 501, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:23:08", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}