File size: 50,961 Bytes
40e4c43
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1b0a94e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0de8233
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0635a2c
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
{"current_steps": 10, "total_steps": 2631, "loss": 0.7552, "learning_rate": 5e-06, "epoch": 0.011396011396011397, "percentage": 0.38, "elapsed_time": "0:04:26", "remaining_time": "19:26:07"}
{"current_steps": 20, "total_steps": 2631, "loss": 0.7051, "learning_rate": 5e-06, "epoch": 0.022792022792022793, "percentage": 0.76, "elapsed_time": "0:08:48", "remaining_time": "19:10:45"}
{"current_steps": 30, "total_steps": 2631, "loss": 0.6821, "learning_rate": 5e-06, "epoch": 0.03418803418803419, "percentage": 1.14, "elapsed_time": "0:13:11", "remaining_time": "19:03:46"}
{"current_steps": 40, "total_steps": 2631, "loss": 0.6856, "learning_rate": 5e-06, "epoch": 0.045584045584045586, "percentage": 1.52, "elapsed_time": "0:17:34", "remaining_time": "18:58:14"}
{"current_steps": 50, "total_steps": 2631, "loss": 0.6637, "learning_rate": 5e-06, "epoch": 0.05698005698005698, "percentage": 1.9, "elapsed_time": "0:21:57", "remaining_time": "18:53:22"}
{"current_steps": 60, "total_steps": 2631, "loss": 0.6622, "learning_rate": 5e-06, "epoch": 0.06837606837606838, "percentage": 2.28, "elapsed_time": "0:26:20", "remaining_time": "18:48:23"}
{"current_steps": 70, "total_steps": 2631, "loss": 0.6663, "learning_rate": 5e-06, "epoch": 0.07977207977207977, "percentage": 2.66, "elapsed_time": "0:30:42", "remaining_time": "18:43:35"}
{"current_steps": 80, "total_steps": 2631, "loss": 0.6571, "learning_rate": 5e-06, "epoch": 0.09116809116809117, "percentage": 3.04, "elapsed_time": "0:35:06", "remaining_time": "18:39:25"}
{"current_steps": 90, "total_steps": 2631, "loss": 0.6638, "learning_rate": 5e-06, "epoch": 0.10256410256410256, "percentage": 3.42, "elapsed_time": "0:39:28", "remaining_time": "18:34:43"}
{"current_steps": 100, "total_steps": 2631, "loss": 0.6579, "learning_rate": 5e-06, "epoch": 0.11396011396011396, "percentage": 3.8, "elapsed_time": "0:43:52", "remaining_time": "18:30:26"}
{"current_steps": 110, "total_steps": 2631, "loss": 0.6526, "learning_rate": 5e-06, "epoch": 0.12535612535612536, "percentage": 4.18, "elapsed_time": "0:48:15", "remaining_time": "18:26:10"}
{"current_steps": 120, "total_steps": 2631, "loss": 0.6369, "learning_rate": 5e-06, "epoch": 0.13675213675213677, "percentage": 4.56, "elapsed_time": "0:52:38", "remaining_time": "18:21:37"}
{"current_steps": 130, "total_steps": 2631, "loss": 0.6341, "learning_rate": 5e-06, "epoch": 0.14814814814814814, "percentage": 4.94, "elapsed_time": "0:57:01", "remaining_time": "18:16:58"}
{"current_steps": 140, "total_steps": 2631, "loss": 0.6573, "learning_rate": 5e-06, "epoch": 0.15954415954415954, "percentage": 5.32, "elapsed_time": "1:01:23", "remaining_time": "18:12:27"}
{"current_steps": 150, "total_steps": 2631, "loss": 0.6449, "learning_rate": 5e-06, "epoch": 0.17094017094017094, "percentage": 5.7, "elapsed_time": "1:05:46", "remaining_time": "18:08:00"}
{"current_steps": 160, "total_steps": 2631, "loss": 0.6558, "learning_rate": 5e-06, "epoch": 0.18233618233618235, "percentage": 6.08, "elapsed_time": "1:10:09", "remaining_time": "18:03:34"}
{"current_steps": 170, "total_steps": 2631, "loss": 0.6287, "learning_rate": 5e-06, "epoch": 0.19373219373219372, "percentage": 6.46, "elapsed_time": "1:14:32", "remaining_time": "17:59:07"}
{"current_steps": 180, "total_steps": 2631, "loss": 0.6439, "learning_rate": 5e-06, "epoch": 0.20512820512820512, "percentage": 6.84, "elapsed_time": "1:18:55", "remaining_time": "17:54:43"}
{"current_steps": 190, "total_steps": 2631, "loss": 0.6396, "learning_rate": 5e-06, "epoch": 0.21652421652421652, "percentage": 7.22, "elapsed_time": "1:23:18", "remaining_time": "17:50:18"}
{"current_steps": 200, "total_steps": 2631, "loss": 0.6356, "learning_rate": 5e-06, "epoch": 0.22792022792022792, "percentage": 7.6, "elapsed_time": "1:27:41", "remaining_time": "17:45:56"}
{"current_steps": 210, "total_steps": 2631, "loss": 0.6306, "learning_rate": 5e-06, "epoch": 0.23931623931623933, "percentage": 7.98, "elapsed_time": "1:32:04", "remaining_time": "17:41:34"}
{"current_steps": 220, "total_steps": 2631, "loss": 0.6277, "learning_rate": 5e-06, "epoch": 0.25071225071225073, "percentage": 8.36, "elapsed_time": "1:36:27", "remaining_time": "17:37:06"}
{"current_steps": 230, "total_steps": 2631, "loss": 0.6339, "learning_rate": 5e-06, "epoch": 0.2621082621082621, "percentage": 8.74, "elapsed_time": "1:40:50", "remaining_time": "17:32:41"}
{"current_steps": 240, "total_steps": 2631, "loss": 0.641, "learning_rate": 5e-06, "epoch": 0.27350427350427353, "percentage": 9.12, "elapsed_time": "1:45:13", "remaining_time": "17:28:17"}
{"current_steps": 250, "total_steps": 2631, "loss": 0.6372, "learning_rate": 5e-06, "epoch": 0.2849002849002849, "percentage": 9.5, "elapsed_time": "1:49:36", "remaining_time": "17:23:53"}
{"current_steps": 260, "total_steps": 2631, "loss": 0.6403, "learning_rate": 5e-06, "epoch": 0.2962962962962963, "percentage": 9.88, "elapsed_time": "1:53:58", "remaining_time": "17:19:25"}
{"current_steps": 270, "total_steps": 2631, "loss": 0.6415, "learning_rate": 5e-06, "epoch": 0.3076923076923077, "percentage": 10.26, "elapsed_time": "1:58:21", "remaining_time": "17:15:01"}
{"current_steps": 280, "total_steps": 2631, "loss": 0.6399, "learning_rate": 5e-06, "epoch": 0.3190883190883191, "percentage": 10.64, "elapsed_time": "2:02:43", "remaining_time": "17:10:30"}
{"current_steps": 290, "total_steps": 2631, "loss": 0.6336, "learning_rate": 5e-06, "epoch": 0.33048433048433046, "percentage": 11.02, "elapsed_time": "2:07:06", "remaining_time": "17:06:02"}
{"current_steps": 300, "total_steps": 2631, "loss": 0.6337, "learning_rate": 5e-06, "epoch": 0.3418803418803419, "percentage": 11.4, "elapsed_time": "2:11:29", "remaining_time": "17:01:40"}
{"current_steps": 310, "total_steps": 2631, "loss": 0.637, "learning_rate": 5e-06, "epoch": 0.35327635327635326, "percentage": 11.78, "elapsed_time": "2:15:51", "remaining_time": "16:57:14"}
{"current_steps": 320, "total_steps": 2631, "loss": 0.64, "learning_rate": 5e-06, "epoch": 0.3646723646723647, "percentage": 12.16, "elapsed_time": "2:20:15", "remaining_time": "16:52:52"}
{"current_steps": 330, "total_steps": 2631, "loss": 0.6252, "learning_rate": 5e-06, "epoch": 0.37606837606837606, "percentage": 12.54, "elapsed_time": "2:24:37", "remaining_time": "16:48:28"}
{"current_steps": 340, "total_steps": 2631, "loss": 0.636, "learning_rate": 5e-06, "epoch": 0.38746438746438744, "percentage": 12.92, "elapsed_time": "2:29:00", "remaining_time": "16:44:05"}
{"current_steps": 350, "total_steps": 2631, "loss": 0.6387, "learning_rate": 5e-06, "epoch": 0.39886039886039887, "percentage": 13.3, "elapsed_time": "2:33:23", "remaining_time": "16:39:41"}
{"current_steps": 360, "total_steps": 2631, "loss": 0.6338, "learning_rate": 5e-06, "epoch": 0.41025641025641024, "percentage": 13.68, "elapsed_time": "2:37:46", "remaining_time": "16:35:20"}
{"current_steps": 370, "total_steps": 2631, "loss": 0.6337, "learning_rate": 5e-06, "epoch": 0.42165242165242167, "percentage": 14.06, "elapsed_time": "2:42:10", "remaining_time": "16:30:59"}
{"current_steps": 380, "total_steps": 2631, "loss": 0.6235, "learning_rate": 5e-06, "epoch": 0.43304843304843305, "percentage": 14.44, "elapsed_time": "2:46:33", "remaining_time": "16:26:38"}
{"current_steps": 390, "total_steps": 2631, "loss": 0.6305, "learning_rate": 5e-06, "epoch": 0.4444444444444444, "percentage": 14.82, "elapsed_time": "2:50:56", "remaining_time": "16:22:16"}
{"current_steps": 400, "total_steps": 2631, "loss": 0.6424, "learning_rate": 5e-06, "epoch": 0.45584045584045585, "percentage": 15.2, "elapsed_time": "2:55:19", "remaining_time": "16:17:50"}
{"current_steps": 410, "total_steps": 2631, "loss": 0.6319, "learning_rate": 5e-06, "epoch": 0.4672364672364672, "percentage": 15.58, "elapsed_time": "2:59:42", "remaining_time": "16:13:27"}
{"current_steps": 420, "total_steps": 2631, "loss": 0.6332, "learning_rate": 5e-06, "epoch": 0.47863247863247865, "percentage": 15.96, "elapsed_time": "3:04:05", "remaining_time": "16:09:04"}
{"current_steps": 430, "total_steps": 2631, "loss": 0.6328, "learning_rate": 5e-06, "epoch": 0.49002849002849, "percentage": 16.34, "elapsed_time": "3:08:27", "remaining_time": "16:04:41"}
{"current_steps": 440, "total_steps": 2631, "loss": 0.6402, "learning_rate": 5e-06, "epoch": 0.5014245014245015, "percentage": 16.72, "elapsed_time": "3:12:50", "remaining_time": "16:00:18"}
{"current_steps": 450, "total_steps": 2631, "loss": 0.6306, "learning_rate": 5e-06, "epoch": 0.5128205128205128, "percentage": 17.1, "elapsed_time": "3:17:13", "remaining_time": "15:55:54"}
{"current_steps": 460, "total_steps": 2631, "loss": 0.6344, "learning_rate": 5e-06, "epoch": 0.5242165242165242, "percentage": 17.48, "elapsed_time": "3:21:36", "remaining_time": "15:51:31"}
{"current_steps": 470, "total_steps": 2631, "loss": 0.6231, "learning_rate": 5e-06, "epoch": 0.5356125356125356, "percentage": 17.86, "elapsed_time": "3:25:59", "remaining_time": "15:47:08"}
{"current_steps": 480, "total_steps": 2631, "loss": 0.6341, "learning_rate": 5e-06, "epoch": 0.5470085470085471, "percentage": 18.24, "elapsed_time": "3:30:22", "remaining_time": "15:42:44"}
{"current_steps": 490, "total_steps": 2631, "loss": 0.6351, "learning_rate": 5e-06, "epoch": 0.5584045584045584, "percentage": 18.62, "elapsed_time": "3:34:44", "remaining_time": "15:38:18"}
{"current_steps": 500, "total_steps": 2631, "loss": 0.6309, "learning_rate": 5e-06, "epoch": 0.5698005698005698, "percentage": 19.0, "elapsed_time": "3:39:07", "remaining_time": "15:33:54"}
{"current_steps": 510, "total_steps": 2631, "loss": 0.6331, "learning_rate": 5e-06, "epoch": 0.5811965811965812, "percentage": 19.38, "elapsed_time": "3:43:30", "remaining_time": "15:29:30"}
{"current_steps": 520, "total_steps": 2631, "loss": 0.6303, "learning_rate": 5e-06, "epoch": 0.5925925925925926, "percentage": 19.76, "elapsed_time": "3:47:53", "remaining_time": "15:25:08"}
{"current_steps": 530, "total_steps": 2631, "loss": 0.6295, "learning_rate": 5e-06, "epoch": 0.603988603988604, "percentage": 20.14, "elapsed_time": "3:52:16", "remaining_time": "15:20:45"}
{"current_steps": 540, "total_steps": 2631, "loss": 0.629, "learning_rate": 5e-06, "epoch": 0.6153846153846154, "percentage": 20.52, "elapsed_time": "3:56:39", "remaining_time": "15:16:23"}
{"current_steps": 550, "total_steps": 2631, "loss": 0.6418, "learning_rate": 5e-06, "epoch": 0.6267806267806267, "percentage": 20.9, "elapsed_time": "4:01:02", "remaining_time": "15:12:00"}
{"current_steps": 560, "total_steps": 2631, "loss": 0.6365, "learning_rate": 5e-06, "epoch": 0.6381766381766382, "percentage": 21.28, "elapsed_time": "4:05:25", "remaining_time": "15:07:38"}
{"current_steps": 570, "total_steps": 2631, "loss": 0.6298, "learning_rate": 5e-06, "epoch": 0.6495726495726496, "percentage": 21.66, "elapsed_time": "4:09:48", "remaining_time": "15:03:16"}
{"current_steps": 580, "total_steps": 2631, "loss": 0.6264, "learning_rate": 5e-06, "epoch": 0.6609686609686609, "percentage": 22.04, "elapsed_time": "4:14:11", "remaining_time": "14:58:54"}
{"current_steps": 590, "total_steps": 2631, "loss": 0.6338, "learning_rate": 5e-06, "epoch": 0.6723646723646723, "percentage": 22.42, "elapsed_time": "4:18:34", "remaining_time": "14:54:29"}
{"current_steps": 600, "total_steps": 2631, "loss": 0.6185, "learning_rate": 5e-06, "epoch": 0.6837606837606838, "percentage": 22.81, "elapsed_time": "4:22:57", "remaining_time": "14:50:07"}
{"current_steps": 610, "total_steps": 2631, "loss": 0.6285, "learning_rate": 5e-06, "epoch": 0.6951566951566952, "percentage": 23.19, "elapsed_time": "4:27:20", "remaining_time": "14:45:45"}
{"current_steps": 620, "total_steps": 2631, "loss": 0.6249, "learning_rate": 5e-06, "epoch": 0.7065527065527065, "percentage": 23.57, "elapsed_time": "4:31:44", "remaining_time": "14:41:23"}
{"current_steps": 630, "total_steps": 2631, "loss": 0.6297, "learning_rate": 5e-06, "epoch": 0.717948717948718, "percentage": 23.95, "elapsed_time": "4:36:06", "remaining_time": "14:36:59"}
{"current_steps": 640, "total_steps": 2631, "loss": 0.624, "learning_rate": 5e-06, "epoch": 0.7293447293447294, "percentage": 24.33, "elapsed_time": "4:40:29", "remaining_time": "14:32:37"}
{"current_steps": 650, "total_steps": 2631, "loss": 0.629, "learning_rate": 5e-06, "epoch": 0.7407407407407407, "percentage": 24.71, "elapsed_time": "4:44:53", "remaining_time": "14:28:15"}
{"current_steps": 660, "total_steps": 2631, "loss": 0.6177, "learning_rate": 5e-06, "epoch": 0.7521367521367521, "percentage": 25.09, "elapsed_time": "4:49:16", "remaining_time": "14:23:52"}
{"current_steps": 670, "total_steps": 2631, "loss": 0.6261, "learning_rate": 5e-06, "epoch": 0.7635327635327636, "percentage": 25.47, "elapsed_time": "4:53:38", "remaining_time": "14:19:28"}
{"current_steps": 680, "total_steps": 2631, "loss": 0.6304, "learning_rate": 5e-06, "epoch": 0.7749287749287749, "percentage": 25.85, "elapsed_time": "4:58:02", "remaining_time": "14:15:05"}
{"current_steps": 690, "total_steps": 2631, "loss": 0.6398, "learning_rate": 5e-06, "epoch": 0.7863247863247863, "percentage": 26.23, "elapsed_time": "5:02:25", "remaining_time": "14:10:42"}
{"current_steps": 700, "total_steps": 2631, "loss": 0.6319, "learning_rate": 5e-06, "epoch": 0.7977207977207977, "percentage": 26.61, "elapsed_time": "5:06:47", "remaining_time": "14:06:18"}
{"current_steps": 710, "total_steps": 2631, "loss": 0.6314, "learning_rate": 5e-06, "epoch": 0.8091168091168092, "percentage": 26.99, "elapsed_time": "5:11:11", "remaining_time": "14:01:57"}
{"current_steps": 720, "total_steps": 2631, "loss": 0.6243, "learning_rate": 5e-06, "epoch": 0.8205128205128205, "percentage": 27.37, "elapsed_time": "5:15:34", "remaining_time": "13:57:34"}
{"current_steps": 730, "total_steps": 2631, "loss": 0.6226, "learning_rate": 5e-06, "epoch": 0.8319088319088319, "percentage": 27.75, "elapsed_time": "5:19:57", "remaining_time": "13:53:11"}
{"current_steps": 740, "total_steps": 2631, "loss": 0.6208, "learning_rate": 5e-06, "epoch": 0.8433048433048433, "percentage": 28.13, "elapsed_time": "5:24:20", "remaining_time": "13:48:48"}
{"current_steps": 750, "total_steps": 2631, "loss": 0.6338, "learning_rate": 5e-06, "epoch": 0.8547008547008547, "percentage": 28.51, "elapsed_time": "5:28:43", "remaining_time": "13:44:26"}
{"current_steps": 760, "total_steps": 2631, "loss": 0.6337, "learning_rate": 5e-06, "epoch": 0.8660968660968661, "percentage": 28.89, "elapsed_time": "5:33:06", "remaining_time": "13:40:03"}
{"current_steps": 770, "total_steps": 2631, "loss": 0.6296, "learning_rate": 5e-06, "epoch": 0.8774928774928775, "percentage": 29.27, "elapsed_time": "5:37:28", "remaining_time": "13:35:38"}
{"current_steps": 780, "total_steps": 2631, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 0.8888888888888888, "percentage": 29.65, "elapsed_time": "5:41:51", "remaining_time": "13:31:14"}
{"current_steps": 790, "total_steps": 2631, "loss": 0.6333, "learning_rate": 5e-06, "epoch": 0.9002849002849003, "percentage": 30.03, "elapsed_time": "5:46:14", "remaining_time": "13:26:51"}
{"current_steps": 800, "total_steps": 2631, "loss": 0.6384, "learning_rate": 5e-06, "epoch": 0.9116809116809117, "percentage": 30.41, "elapsed_time": "5:50:36", "remaining_time": "13:22:27"}
{"current_steps": 810, "total_steps": 2631, "loss": 0.6309, "learning_rate": 5e-06, "epoch": 0.9230769230769231, "percentage": 30.79, "elapsed_time": "5:54:59", "remaining_time": "13:18:04"}
{"current_steps": 820, "total_steps": 2631, "loss": 0.6323, "learning_rate": 5e-06, "epoch": 0.9344729344729344, "percentage": 31.17, "elapsed_time": "5:59:23", "remaining_time": "13:13:42"}
{"current_steps": 830, "total_steps": 2631, "loss": 0.6117, "learning_rate": 5e-06, "epoch": 0.9458689458689459, "percentage": 31.55, "elapsed_time": "6:03:46", "remaining_time": "13:09:20"}
{"current_steps": 840, "total_steps": 2631, "loss": 0.6258, "learning_rate": 5e-06, "epoch": 0.9572649572649573, "percentage": 31.93, "elapsed_time": "6:08:09", "remaining_time": "13:04:58"}
{"current_steps": 850, "total_steps": 2631, "loss": 0.6334, "learning_rate": 5e-06, "epoch": 0.9686609686609686, "percentage": 32.31, "elapsed_time": "6:12:32", "remaining_time": "13:00:34"}
{"current_steps": 860, "total_steps": 2631, "loss": 0.6299, "learning_rate": 5e-06, "epoch": 0.98005698005698, "percentage": 32.69, "elapsed_time": "6:16:55", "remaining_time": "12:56:12"}
{"current_steps": 870, "total_steps": 2631, "loss": 0.6134, "learning_rate": 5e-06, "epoch": 0.9914529914529915, "percentage": 33.07, "elapsed_time": "6:21:18", "remaining_time": "12:51:49"}
{"current_steps": 877, "total_steps": 2631, "eval_loss": 0.622437059879303, "epoch": 0.9994301994301994, "percentage": 33.33, "elapsed_time": "6:31:57", "remaining_time": "13:03:55"}
{"current_steps": 880, "total_steps": 2631, "loss": 0.6384, "learning_rate": 5e-06, "epoch": 1.002849002849003, "percentage": 33.45, "elapsed_time": "6:34:09", "remaining_time": "13:04:17"}
{"current_steps": 890, "total_steps": 2631, "loss": 0.5855, "learning_rate": 5e-06, "epoch": 1.0142450142450143, "percentage": 33.83, "elapsed_time": "6:38:32", "remaining_time": "12:59:37"}
{"current_steps": 900, "total_steps": 2631, "loss": 0.5924, "learning_rate": 5e-06, "epoch": 1.0256410256410255, "percentage": 34.21, "elapsed_time": "6:42:56", "remaining_time": "12:54:58"}
{"current_steps": 910, "total_steps": 2631, "loss": 0.5882, "learning_rate": 5e-06, "epoch": 1.037037037037037, "percentage": 34.59, "elapsed_time": "6:47:19", "remaining_time": "12:50:19"}
{"current_steps": 920, "total_steps": 2631, "loss": 0.5834, "learning_rate": 5e-06, "epoch": 1.0484330484330484, "percentage": 34.97, "elapsed_time": "6:51:42", "remaining_time": "12:45:40"}
{"current_steps": 930, "total_steps": 2631, "loss": 0.5875, "learning_rate": 5e-06, "epoch": 1.0598290598290598, "percentage": 35.35, "elapsed_time": "6:56:05", "remaining_time": "12:41:02"}
{"current_steps": 940, "total_steps": 2631, "loss": 0.578, "learning_rate": 5e-06, "epoch": 1.0712250712250713, "percentage": 35.73, "elapsed_time": "7:00:28", "remaining_time": "12:36:24"}
{"current_steps": 950, "total_steps": 2631, "loss": 0.5945, "learning_rate": 5e-06, "epoch": 1.0826210826210827, "percentage": 36.11, "elapsed_time": "7:04:52", "remaining_time": "12:31:47"}
{"current_steps": 960, "total_steps": 2631, "loss": 0.591, "learning_rate": 5e-06, "epoch": 1.0940170940170941, "percentage": 36.49, "elapsed_time": "7:09:15", "remaining_time": "12:27:10"}
{"current_steps": 970, "total_steps": 2631, "loss": 0.5947, "learning_rate": 5e-06, "epoch": 1.1054131054131053, "percentage": 36.87, "elapsed_time": "7:13:39", "remaining_time": "12:22:34"}
{"current_steps": 980, "total_steps": 2631, "loss": 0.5989, "learning_rate": 5e-06, "epoch": 1.1168091168091168, "percentage": 37.25, "elapsed_time": "7:18:01", "remaining_time": "12:17:57"}
{"current_steps": 990, "total_steps": 2631, "loss": 0.5883, "learning_rate": 5e-06, "epoch": 1.1282051282051282, "percentage": 37.63, "elapsed_time": "7:22:25", "remaining_time": "12:13:20"}
{"current_steps": 1000, "total_steps": 2631, "loss": 0.5857, "learning_rate": 5e-06, "epoch": 1.1396011396011396, "percentage": 38.01, "elapsed_time": "7:26:48", "remaining_time": "12:08:45"}
{"current_steps": 1010, "total_steps": 2631, "loss": 0.5846, "learning_rate": 5e-06, "epoch": 1.150997150997151, "percentage": 38.39, "elapsed_time": "7:31:12", "remaining_time": "12:04:09"}
{"current_steps": 1020, "total_steps": 2631, "loss": 0.5862, "learning_rate": 5e-06, "epoch": 1.1623931623931625, "percentage": 38.77, "elapsed_time": "7:35:35", "remaining_time": "11:59:33"}
{"current_steps": 1030, "total_steps": 2631, "loss": 0.5828, "learning_rate": 5e-06, "epoch": 1.173789173789174, "percentage": 39.15, "elapsed_time": "7:39:58", "remaining_time": "11:54:58"}
{"current_steps": 1040, "total_steps": 2631, "loss": 0.5969, "learning_rate": 5e-06, "epoch": 1.1851851851851851, "percentage": 39.53, "elapsed_time": "7:44:21", "remaining_time": "11:50:22"}
{"current_steps": 1050, "total_steps": 2631, "loss": 0.5849, "learning_rate": 5e-06, "epoch": 1.1965811965811965, "percentage": 39.91, "elapsed_time": "7:48:43", "remaining_time": "11:45:46"}
{"current_steps": 1060, "total_steps": 2631, "loss": 0.5866, "learning_rate": 5e-06, "epoch": 1.207977207977208, "percentage": 40.29, "elapsed_time": "7:53:06", "remaining_time": "11:41:10"}
{"current_steps": 1070, "total_steps": 2631, "loss": 0.5963, "learning_rate": 5e-06, "epoch": 1.2193732193732194, "percentage": 40.67, "elapsed_time": "7:57:29", "remaining_time": "11:36:36"}
{"current_steps": 1080, "total_steps": 2631, "loss": 0.5872, "learning_rate": 5e-06, "epoch": 1.2307692307692308, "percentage": 41.05, "elapsed_time": "8:01:53", "remaining_time": "11:32:02"}
{"current_steps": 1090, "total_steps": 2631, "loss": 0.5952, "learning_rate": 5e-06, "epoch": 1.242165242165242, "percentage": 41.43, "elapsed_time": "8:06:16", "remaining_time": "11:27:28"}
{"current_steps": 1100, "total_steps": 2631, "loss": 0.5903, "learning_rate": 5e-06, "epoch": 1.2535612535612537, "percentage": 41.81, "elapsed_time": "8:10:39", "remaining_time": "11:22:54"}
{"current_steps": 1110, "total_steps": 2631, "loss": 0.5989, "learning_rate": 5e-06, "epoch": 1.264957264957265, "percentage": 42.19, "elapsed_time": "8:15:02", "remaining_time": "11:18:20"}
{"current_steps": 1120, "total_steps": 2631, "loss": 0.583, "learning_rate": 5e-06, "epoch": 1.2763532763532763, "percentage": 42.57, "elapsed_time": "8:19:25", "remaining_time": "11:13:47"}
{"current_steps": 1130, "total_steps": 2631, "loss": 0.5938, "learning_rate": 5e-06, "epoch": 1.2877492877492878, "percentage": 42.95, "elapsed_time": "8:23:49", "remaining_time": "11:09:14"}
{"current_steps": 1140, "total_steps": 2631, "loss": 0.5805, "learning_rate": 5e-06, "epoch": 1.2991452991452992, "percentage": 43.33, "elapsed_time": "8:28:12", "remaining_time": "11:04:41"}
{"current_steps": 1150, "total_steps": 2631, "loss": 0.5862, "learning_rate": 5e-06, "epoch": 1.3105413105413106, "percentage": 43.71, "elapsed_time": "8:32:36", "remaining_time": "11:00:08"}
{"current_steps": 1160, "total_steps": 2631, "loss": 0.5883, "learning_rate": 5e-06, "epoch": 1.3219373219373218, "percentage": 44.09, "elapsed_time": "8:36:59", "remaining_time": "10:55:36"}
{"current_steps": 1170, "total_steps": 2631, "loss": 0.5833, "learning_rate": 5e-06, "epoch": 1.3333333333333333, "percentage": 44.47, "elapsed_time": "8:41:23", "remaining_time": "10:51:03"}
{"current_steps": 1180, "total_steps": 2631, "loss": 0.5824, "learning_rate": 5e-06, "epoch": 1.3447293447293447, "percentage": 44.85, "elapsed_time": "8:45:46", "remaining_time": "10:46:31"}
{"current_steps": 1190, "total_steps": 2631, "loss": 0.6004, "learning_rate": 5e-06, "epoch": 1.3561253561253561, "percentage": 45.23, "elapsed_time": "8:50:09", "remaining_time": "10:41:58"}
{"current_steps": 1200, "total_steps": 2631, "loss": 0.5818, "learning_rate": 5e-06, "epoch": 1.3675213675213675, "percentage": 45.61, "elapsed_time": "8:54:32", "remaining_time": "10:37:26"}
{"current_steps": 1210, "total_steps": 2631, "loss": 0.5859, "learning_rate": 5e-06, "epoch": 1.378917378917379, "percentage": 45.99, "elapsed_time": "8:58:55", "remaining_time": "10:32:54"}
{"current_steps": 1220, "total_steps": 2631, "loss": 0.5906, "learning_rate": 5e-06, "epoch": 1.3903133903133904, "percentage": 46.37, "elapsed_time": "9:03:18", "remaining_time": "10:28:22"}
{"current_steps": 1230, "total_steps": 2631, "loss": 0.5927, "learning_rate": 5e-06, "epoch": 1.4017094017094016, "percentage": 46.75, "elapsed_time": "9:07:42", "remaining_time": "10:23:50"}
{"current_steps": 1240, "total_steps": 2631, "loss": 0.5956, "learning_rate": 5e-06, "epoch": 1.413105413105413, "percentage": 47.13, "elapsed_time": "9:12:05", "remaining_time": "10:19:19"}
{"current_steps": 1250, "total_steps": 2631, "loss": 0.6033, "learning_rate": 5e-06, "epoch": 1.4245014245014245, "percentage": 47.51, "elapsed_time": "9:16:28", "remaining_time": "10:14:48"}
{"current_steps": 1260, "total_steps": 2631, "loss": 0.5825, "learning_rate": 5e-06, "epoch": 1.435897435897436, "percentage": 47.89, "elapsed_time": "9:20:51", "remaining_time": "10:10:16"}
{"current_steps": 1270, "total_steps": 2631, "loss": 0.5842, "learning_rate": 5e-06, "epoch": 1.4472934472934473, "percentage": 48.27, "elapsed_time": "9:25:14", "remaining_time": "10:05:44"}
{"current_steps": 1280, "total_steps": 2631, "loss": 0.5851, "learning_rate": 5e-06, "epoch": 1.4586894586894588, "percentage": 48.65, "elapsed_time": "9:29:37", "remaining_time": "10:01:13"}
{"current_steps": 1290, "total_steps": 2631, "loss": 0.5815, "learning_rate": 5e-06, "epoch": 1.4700854700854702, "percentage": 49.03, "elapsed_time": "9:34:00", "remaining_time": "9:56:42"}
{"current_steps": 1300, "total_steps": 2631, "loss": 0.5893, "learning_rate": 5e-06, "epoch": 1.4814814814814814, "percentage": 49.41, "elapsed_time": "9:38:23", "remaining_time": "9:52:11"}
{"current_steps": 1310, "total_steps": 2631, "loss": 0.5812, "learning_rate": 5e-06, "epoch": 1.4928774928774928, "percentage": 49.79, "elapsed_time": "9:42:47", "remaining_time": "9:47:40"}
{"current_steps": 1320, "total_steps": 2631, "loss": 0.5872, "learning_rate": 5e-06, "epoch": 1.5042735042735043, "percentage": 50.17, "elapsed_time": "9:47:09", "remaining_time": "9:43:09"}
{"current_steps": 1330, "total_steps": 2631, "loss": 0.5894, "learning_rate": 5e-06, "epoch": 1.5156695156695157, "percentage": 50.55, "elapsed_time": "9:51:31", "remaining_time": "9:38:37"}
{"current_steps": 1340, "total_steps": 2631, "loss": 0.5948, "learning_rate": 5e-06, "epoch": 1.5270655270655271, "percentage": 50.93, "elapsed_time": "9:55:54", "remaining_time": "9:34:07"}
{"current_steps": 1350, "total_steps": 2631, "loss": 0.5755, "learning_rate": 5e-06, "epoch": 1.5384615384615383, "percentage": 51.31, "elapsed_time": "10:00:17", "remaining_time": "9:29:36"}
{"current_steps": 1360, "total_steps": 2631, "loss": 0.5892, "learning_rate": 5e-06, "epoch": 1.54985754985755, "percentage": 51.69, "elapsed_time": "10:04:41", "remaining_time": "9:25:06"}
{"current_steps": 1370, "total_steps": 2631, "loss": 0.5784, "learning_rate": 5e-06, "epoch": 1.5612535612535612, "percentage": 52.07, "elapsed_time": "10:09:03", "remaining_time": "9:20:35"}
{"current_steps": 1380, "total_steps": 2631, "loss": 0.5864, "learning_rate": 5e-06, "epoch": 1.5726495726495726, "percentage": 52.45, "elapsed_time": "10:13:26", "remaining_time": "9:16:05"}
{"current_steps": 1390, "total_steps": 2631, "loss": 0.6075, "learning_rate": 5e-06, "epoch": 1.584045584045584, "percentage": 52.83, "elapsed_time": "10:17:49", "remaining_time": "9:11:36"}
{"current_steps": 1400, "total_steps": 2631, "loss": 0.5944, "learning_rate": 5e-06, "epoch": 1.5954415954415955, "percentage": 53.21, "elapsed_time": "10:22:13", "remaining_time": "9:07:06"}
{"current_steps": 1410, "total_steps": 2631, "loss": 0.5915, "learning_rate": 5e-06, "epoch": 1.606837606837607, "percentage": 53.59, "elapsed_time": "10:26:37", "remaining_time": "9:02:37"}
{"current_steps": 1420, "total_steps": 2631, "loss": 0.5817, "learning_rate": 5e-06, "epoch": 1.618233618233618, "percentage": 53.97, "elapsed_time": "10:31:00", "remaining_time": "8:58:07"}
{"current_steps": 1430, "total_steps": 2631, "loss": 0.5983, "learning_rate": 5e-06, "epoch": 1.6296296296296298, "percentage": 54.35, "elapsed_time": "10:35:23", "remaining_time": "8:53:38"}
{"current_steps": 1440, "total_steps": 2631, "loss": 0.5826, "learning_rate": 5e-06, "epoch": 1.641025641025641, "percentage": 54.73, "elapsed_time": "10:39:47", "remaining_time": "8:49:09"}
{"current_steps": 1450, "total_steps": 2631, "loss": 0.5889, "learning_rate": 5e-06, "epoch": 1.6524216524216524, "percentage": 55.11, "elapsed_time": "10:44:10", "remaining_time": "8:44:40"}
{"current_steps": 1460, "total_steps": 2631, "loss": 0.5859, "learning_rate": 5e-06, "epoch": 1.6638176638176638, "percentage": 55.49, "elapsed_time": "10:48:34", "remaining_time": "8:40:11"}
{"current_steps": 1470, "total_steps": 2631, "loss": 0.5806, "learning_rate": 5e-06, "epoch": 1.6752136752136753, "percentage": 55.87, "elapsed_time": "10:52:57", "remaining_time": "8:35:42"}
{"current_steps": 1480, "total_steps": 2631, "loss": 0.5866, "learning_rate": 5e-06, "epoch": 1.6866096866096867, "percentage": 56.25, "elapsed_time": "10:57:21", "remaining_time": "8:31:13"}
{"current_steps": 1490, "total_steps": 2631, "loss": 0.5803, "learning_rate": 5e-06, "epoch": 1.698005698005698, "percentage": 56.63, "elapsed_time": "11:01:44", "remaining_time": "8:26:44"}
{"current_steps": 1500, "total_steps": 2631, "loss": 0.5913, "learning_rate": 5e-06, "epoch": 1.7094017094017095, "percentage": 57.01, "elapsed_time": "11:06:07", "remaining_time": "8:22:15"}
{"current_steps": 1510, "total_steps": 2631, "loss": 0.5795, "learning_rate": 5e-06, "epoch": 1.7207977207977208, "percentage": 57.39, "elapsed_time": "11:10:30", "remaining_time": "8:17:46"}
{"current_steps": 1520, "total_steps": 2631, "loss": 0.5888, "learning_rate": 5e-06, "epoch": 1.7321937321937322, "percentage": 57.77, "elapsed_time": "11:14:53", "remaining_time": "8:13:17"}
{"current_steps": 1530, "total_steps": 2631, "loss": 0.5865, "learning_rate": 5e-06, "epoch": 1.7435897435897436, "percentage": 58.15, "elapsed_time": "11:19:16", "remaining_time": "8:08:49"}
{"current_steps": 1540, "total_steps": 2631, "loss": 0.5816, "learning_rate": 5e-06, "epoch": 1.7549857549857548, "percentage": 58.53, "elapsed_time": "11:23:40", "remaining_time": "8:04:20"}
{"current_steps": 1550, "total_steps": 2631, "loss": 0.5952, "learning_rate": 5e-06, "epoch": 1.7663817663817665, "percentage": 58.91, "elapsed_time": "11:28:04", "remaining_time": "7:59:52"}
{"current_steps": 1560, "total_steps": 2631, "loss": 0.5879, "learning_rate": 5e-06, "epoch": 1.7777777777777777, "percentage": 59.29, "elapsed_time": "11:32:26", "remaining_time": "7:55:23"}
{"current_steps": 1570, "total_steps": 2631, "loss": 0.5907, "learning_rate": 5e-06, "epoch": 1.7891737891737893, "percentage": 59.67, "elapsed_time": "11:36:50", "remaining_time": "7:50:55"}
{"current_steps": 1580, "total_steps": 2631, "loss": 0.5841, "learning_rate": 5e-06, "epoch": 1.8005698005698005, "percentage": 60.05, "elapsed_time": "11:41:13", "remaining_time": "7:46:27"}
{"current_steps": 1590, "total_steps": 2631, "loss": 0.5849, "learning_rate": 5e-06, "epoch": 1.811965811965812, "percentage": 60.43, "elapsed_time": "11:45:36", "remaining_time": "7:41:58"}
{"current_steps": 1600, "total_steps": 2631, "loss": 0.5712, "learning_rate": 5e-06, "epoch": 1.8233618233618234, "percentage": 60.81, "elapsed_time": "11:49:59", "remaining_time": "7:37:29"}
{"current_steps": 1610, "total_steps": 2631, "loss": 0.5773, "learning_rate": 5e-06, "epoch": 1.8347578347578346, "percentage": 61.19, "elapsed_time": "11:54:22", "remaining_time": "7:33:01"}
{"current_steps": 1620, "total_steps": 2631, "loss": 0.5828, "learning_rate": 5e-06, "epoch": 1.8461538461538463, "percentage": 61.57, "elapsed_time": "11:58:46", "remaining_time": "7:28:33"}
{"current_steps": 1630, "total_steps": 2631, "loss": 0.577, "learning_rate": 5e-06, "epoch": 1.8575498575498575, "percentage": 61.95, "elapsed_time": "12:03:09", "remaining_time": "7:24:06"}
{"current_steps": 1640, "total_steps": 2631, "loss": 0.5852, "learning_rate": 5e-06, "epoch": 1.868945868945869, "percentage": 62.33, "elapsed_time": "12:07:32", "remaining_time": "7:19:38"}
{"current_steps": 1650, "total_steps": 2631, "loss": 0.5765, "learning_rate": 5e-06, "epoch": 1.8803418803418803, "percentage": 62.71, "elapsed_time": "12:11:56", "remaining_time": "7:15:10"}
{"current_steps": 1660, "total_steps": 2631, "loss": 0.5941, "learning_rate": 5e-06, "epoch": 1.8917378917378918, "percentage": 63.09, "elapsed_time": "12:16:19", "remaining_time": "7:10:42"}
{"current_steps": 1670, "total_steps": 2631, "loss": 0.5958, "learning_rate": 5e-06, "epoch": 1.9031339031339032, "percentage": 63.47, "elapsed_time": "12:20:42", "remaining_time": "7:06:14"}
{"current_steps": 1680, "total_steps": 2631, "loss": 0.5822, "learning_rate": 5e-06, "epoch": 1.9145299145299144, "percentage": 63.85, "elapsed_time": "12:25:06", "remaining_time": "7:01:46"}
{"current_steps": 1690, "total_steps": 2631, "loss": 0.591, "learning_rate": 5e-06, "epoch": 1.925925925925926, "percentage": 64.23, "elapsed_time": "12:29:29", "remaining_time": "6:57:19"}
{"current_steps": 1700, "total_steps": 2631, "loss": 0.5866, "learning_rate": 5e-06, "epoch": 1.9373219373219372, "percentage": 64.61, "elapsed_time": "12:33:51", "remaining_time": "6:52:50"}
{"current_steps": 1710, "total_steps": 2631, "loss": 0.5812, "learning_rate": 5e-06, "epoch": 1.9487179487179487, "percentage": 64.99, "elapsed_time": "12:38:14", "remaining_time": "6:48:23"}
{"current_steps": 1720, "total_steps": 2631, "loss": 0.5952, "learning_rate": 5e-06, "epoch": 1.96011396011396, "percentage": 65.37, "elapsed_time": "12:42:37", "remaining_time": "6:43:55"}
{"current_steps": 1730, "total_steps": 2631, "loss": 0.5905, "learning_rate": 5e-06, "epoch": 1.9715099715099715, "percentage": 65.75, "elapsed_time": "12:47:00", "remaining_time": "6:39:27"}
{"current_steps": 1740, "total_steps": 2631, "loss": 0.5835, "learning_rate": 5e-06, "epoch": 1.982905982905983, "percentage": 66.13, "elapsed_time": "12:51:23", "remaining_time": "6:35:00"}
{"current_steps": 1750, "total_steps": 2631, "loss": 0.5823, "learning_rate": 5e-06, "epoch": 1.9943019943019942, "percentage": 66.51, "elapsed_time": "12:55:47", "remaining_time": "6:30:33"}
{"current_steps": 1755, "total_steps": 2631, "eval_loss": 0.6174917817115784, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "13:05:18", "remaining_time": "6:31:59"}
{"current_steps": 1760, "total_steps": 2631, "loss": 0.6003, "learning_rate": 5e-06, "epoch": 2.005698005698006, "percentage": 66.89, "elapsed_time": "13:08:40", "remaining_time": "6:30:18"}
{"current_steps": 1770, "total_steps": 2631, "loss": 0.5295, "learning_rate": 5e-06, "epoch": 2.017094017094017, "percentage": 67.27, "elapsed_time": "13:13:03", "remaining_time": "6:25:46"}
{"current_steps": 1780, "total_steps": 2631, "loss": 0.5396, "learning_rate": 5e-06, "epoch": 2.0284900284900287, "percentage": 67.65, "elapsed_time": "13:17:26", "remaining_time": "6:21:14"}
{"current_steps": 1790, "total_steps": 2631, "loss": 0.5498, "learning_rate": 5e-06, "epoch": 2.03988603988604, "percentage": 68.03, "elapsed_time": "13:21:50", "remaining_time": "6:16:43"}
{"current_steps": 1800, "total_steps": 2631, "loss": 0.5485, "learning_rate": 5e-06, "epoch": 2.051282051282051, "percentage": 68.42, "elapsed_time": "13:26:12", "remaining_time": "6:12:12"}
{"current_steps": 1810, "total_steps": 2631, "loss": 0.5443, "learning_rate": 5e-06, "epoch": 2.0626780626780628, "percentage": 68.8, "elapsed_time": "13:30:36", "remaining_time": "6:07:40"}
{"current_steps": 1820, "total_steps": 2631, "loss": 0.5499, "learning_rate": 5e-06, "epoch": 2.074074074074074, "percentage": 69.18, "elapsed_time": "13:34:59", "remaining_time": "6:03:09"}
{"current_steps": 1830, "total_steps": 2631, "loss": 0.5472, "learning_rate": 5e-06, "epoch": 2.0854700854700856, "percentage": 69.56, "elapsed_time": "13:39:22", "remaining_time": "5:58:38"}
{"current_steps": 1840, "total_steps": 2631, "loss": 0.5557, "learning_rate": 5e-06, "epoch": 2.096866096866097, "percentage": 69.94, "elapsed_time": "13:43:46", "remaining_time": "5:54:07"}
{"current_steps": 1850, "total_steps": 2631, "loss": 0.5423, "learning_rate": 5e-06, "epoch": 2.1082621082621085, "percentage": 70.32, "elapsed_time": "13:48:09", "remaining_time": "5:49:37"}
{"current_steps": 1860, "total_steps": 2631, "loss": 0.5556, "learning_rate": 5e-06, "epoch": 2.1196581196581197, "percentage": 70.7, "elapsed_time": "13:52:32", "remaining_time": "5:45:06"}
{"current_steps": 1870, "total_steps": 2631, "loss": 0.5464, "learning_rate": 5e-06, "epoch": 2.131054131054131, "percentage": 71.08, "elapsed_time": "13:56:55", "remaining_time": "5:40:35"}
{"current_steps": 1880, "total_steps": 2631, "loss": 0.5459, "learning_rate": 5e-06, "epoch": 2.1424501424501425, "percentage": 71.46, "elapsed_time": "14:01:19", "remaining_time": "5:36:04"}
{"current_steps": 1890, "total_steps": 2631, "loss": 0.5432, "learning_rate": 5e-06, "epoch": 2.1538461538461537, "percentage": 71.84, "elapsed_time": "14:05:41", "remaining_time": "5:31:34"}
{"current_steps": 1900, "total_steps": 2631, "loss": 0.5434, "learning_rate": 5e-06, "epoch": 2.1652421652421654, "percentage": 72.22, "elapsed_time": "14:10:05", "remaining_time": "5:27:03"}
{"current_steps": 1910, "total_steps": 2631, "loss": 0.548, "learning_rate": 5e-06, "epoch": 2.1766381766381766, "percentage": 72.6, "elapsed_time": "14:14:28", "remaining_time": "5:22:33"}
{"current_steps": 1920, "total_steps": 2631, "loss": 0.551, "learning_rate": 5e-06, "epoch": 2.1880341880341883, "percentage": 72.98, "elapsed_time": "14:18:52", "remaining_time": "5:18:03"}
{"current_steps": 1930, "total_steps": 2631, "loss": 0.5487, "learning_rate": 5e-06, "epoch": 2.1994301994301995, "percentage": 73.36, "elapsed_time": "14:23:16", "remaining_time": "5:13:33"}
{"current_steps": 1940, "total_steps": 2631, "loss": 0.5518, "learning_rate": 5e-06, "epoch": 2.2108262108262107, "percentage": 73.74, "elapsed_time": "14:27:40", "remaining_time": "5:09:03"}
{"current_steps": 1950, "total_steps": 2631, "loss": 0.5455, "learning_rate": 5e-06, "epoch": 2.2222222222222223, "percentage": 74.12, "elapsed_time": "14:32:03", "remaining_time": "5:04:32"}
{"current_steps": 1960, "total_steps": 2631, "loss": 0.5371, "learning_rate": 5e-06, "epoch": 2.2336182336182335, "percentage": 74.5, "elapsed_time": "14:36:27", "remaining_time": "5:00:03"}
{"current_steps": 1970, "total_steps": 2631, "loss": 0.548, "learning_rate": 5e-06, "epoch": 2.245014245014245, "percentage": 74.88, "elapsed_time": "14:40:50", "remaining_time": "4:55:33"}
{"current_steps": 1980, "total_steps": 2631, "loss": 0.5489, "learning_rate": 5e-06, "epoch": 2.2564102564102564, "percentage": 75.26, "elapsed_time": "14:45:14", "remaining_time": "4:51:03"}
{"current_steps": 1990, "total_steps": 2631, "loss": 0.5452, "learning_rate": 5e-06, "epoch": 2.267806267806268, "percentage": 75.64, "elapsed_time": "14:49:36", "remaining_time": "4:46:33"}
{"current_steps": 2000, "total_steps": 2631, "loss": 0.5506, "learning_rate": 5e-06, "epoch": 2.2792022792022792, "percentage": 76.02, "elapsed_time": "14:53:59", "remaining_time": "4:42:03"}
{"current_steps": 2010, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.2905982905982905, "percentage": 76.4, "elapsed_time": "14:58:23", "remaining_time": "4:37:33"}
{"current_steps": 2020, "total_steps": 2631, "loss": 0.5447, "learning_rate": 5e-06, "epoch": 2.301994301994302, "percentage": 76.78, "elapsed_time": "15:02:47", "remaining_time": "4:33:04"}
{"current_steps": 2030, "total_steps": 2631, "loss": 0.5533, "learning_rate": 5e-06, "epoch": 2.3133903133903133, "percentage": 77.16, "elapsed_time": "15:07:09", "remaining_time": "4:28:34"}
{"current_steps": 2040, "total_steps": 2631, "loss": 0.5493, "learning_rate": 5e-06, "epoch": 2.324786324786325, "percentage": 77.54, "elapsed_time": "15:11:32", "remaining_time": "4:24:04"}
{"current_steps": 2050, "total_steps": 2631, "loss": 0.5484, "learning_rate": 5e-06, "epoch": 2.336182336182336, "percentage": 77.92, "elapsed_time": "15:15:55", "remaining_time": "4:19:35"}
{"current_steps": 2060, "total_steps": 2631, "loss": 0.5561, "learning_rate": 5e-06, "epoch": 2.347578347578348, "percentage": 78.3, "elapsed_time": "15:20:19", "remaining_time": "4:15:05"}
{"current_steps": 2070, "total_steps": 2631, "loss": 0.5479, "learning_rate": 5e-06, "epoch": 2.358974358974359, "percentage": 78.68, "elapsed_time": "15:24:41", "remaining_time": "4:10:36"}
{"current_steps": 2080, "total_steps": 2631, "loss": 0.5482, "learning_rate": 5e-06, "epoch": 2.3703703703703702, "percentage": 79.06, "elapsed_time": "15:29:04", "remaining_time": "4:06:06"}
{"current_steps": 2090, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.381766381766382, "percentage": 79.44, "elapsed_time": "15:33:27", "remaining_time": "4:01:37"}
{"current_steps": 2100, "total_steps": 2631, "loss": 0.5475, "learning_rate": 5e-06, "epoch": 2.393162393162393, "percentage": 79.82, "elapsed_time": "15:37:50", "remaining_time": "3:57:08"}
{"current_steps": 2110, "total_steps": 2631, "loss": 0.564, "learning_rate": 5e-06, "epoch": 2.4045584045584047, "percentage": 80.2, "elapsed_time": "15:42:12", "remaining_time": "3:52:39"}
{"current_steps": 2120, "total_steps": 2631, "loss": 0.5495, "learning_rate": 5e-06, "epoch": 2.415954415954416, "percentage": 80.58, "elapsed_time": "15:46:36", "remaining_time": "3:48:10"}
{"current_steps": 2130, "total_steps": 2631, "loss": 0.56, "learning_rate": 5e-06, "epoch": 2.427350427350427, "percentage": 80.96, "elapsed_time": "15:50:59", "remaining_time": "3:43:41"}
{"current_steps": 2140, "total_steps": 2631, "loss": 0.5592, "learning_rate": 5e-06, "epoch": 2.438746438746439, "percentage": 81.34, "elapsed_time": "15:55:23", "remaining_time": "3:39:12"}
{"current_steps": 2150, "total_steps": 2631, "loss": 0.5633, "learning_rate": 5e-06, "epoch": 2.45014245014245, "percentage": 81.72, "elapsed_time": "15:59:47", "remaining_time": "3:34:43"}
{"current_steps": 2160, "total_steps": 2631, "loss": 0.5488, "learning_rate": 5e-06, "epoch": 2.4615384615384617, "percentage": 82.1, "elapsed_time": "16:04:11", "remaining_time": "3:30:14"}
{"current_steps": 2170, "total_steps": 2631, "loss": 0.5513, "learning_rate": 5e-06, "epoch": 2.472934472934473, "percentage": 82.48, "elapsed_time": "16:08:35", "remaining_time": "3:25:46"}
{"current_steps": 2180, "total_steps": 2631, "loss": 0.5554, "learning_rate": 5e-06, "epoch": 2.484330484330484, "percentage": 82.86, "elapsed_time": "16:12:59", "remaining_time": "3:21:17"}
{"current_steps": 2190, "total_steps": 2631, "loss": 0.5574, "learning_rate": 5e-06, "epoch": 2.4957264957264957, "percentage": 83.24, "elapsed_time": "16:17:23", "remaining_time": "3:16:49"}
{"current_steps": 2200, "total_steps": 2631, "loss": 0.5629, "learning_rate": 5e-06, "epoch": 2.5071225071225074, "percentage": 83.62, "elapsed_time": "16:21:46", "remaining_time": "3:12:20"}
{"current_steps": 2210, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.5185185185185186, "percentage": 84.0, "elapsed_time": "16:26:09", "remaining_time": "3:07:51"}
{"current_steps": 2220, "total_steps": 2631, "loss": 0.5591, "learning_rate": 5e-06, "epoch": 2.52991452991453, "percentage": 84.38, "elapsed_time": "16:30:33", "remaining_time": "3:03:23"}
{"current_steps": 2230, "total_steps": 2631, "loss": 0.5513, "learning_rate": 5e-06, "epoch": 2.5413105413105415, "percentage": 84.76, "elapsed_time": "16:34:57", "remaining_time": "2:58:54"}
{"current_steps": 2240, "total_steps": 2631, "loss": 0.5501, "learning_rate": 5e-06, "epoch": 2.5527065527065527, "percentage": 85.14, "elapsed_time": "16:39:20", "remaining_time": "2:54:26"}
{"current_steps": 2250, "total_steps": 2631, "loss": 0.5488, "learning_rate": 5e-06, "epoch": 2.564102564102564, "percentage": 85.52, "elapsed_time": "16:43:44", "remaining_time": "2:49:58"}
{"current_steps": 2260, "total_steps": 2631, "loss": 0.5534, "learning_rate": 5e-06, "epoch": 2.5754985754985755, "percentage": 85.9, "elapsed_time": "16:48:07", "remaining_time": "2:45:29"}
{"current_steps": 2270, "total_steps": 2631, "loss": 0.5509, "learning_rate": 5e-06, "epoch": 2.5868945868945867, "percentage": 86.28, "elapsed_time": "16:52:30", "remaining_time": "2:41:01"}
{"current_steps": 2280, "total_steps": 2631, "loss": 0.5515, "learning_rate": 5e-06, "epoch": 2.5982905982905984, "percentage": 86.66, "elapsed_time": "16:56:54", "remaining_time": "2:36:33"}
{"current_steps": 2290, "total_steps": 2631, "loss": 0.5567, "learning_rate": 5e-06, "epoch": 2.6096866096866096, "percentage": 87.04, "elapsed_time": "17:01:18", "remaining_time": "2:32:04"}
{"current_steps": 2300, "total_steps": 2631, "loss": 0.5429, "learning_rate": 5e-06, "epoch": 2.6210826210826212, "percentage": 87.42, "elapsed_time": "17:05:40", "remaining_time": "2:27:36"}
{"current_steps": 2310, "total_steps": 2631, "loss": 0.553, "learning_rate": 5e-06, "epoch": 2.6324786324786325, "percentage": 87.8, "elapsed_time": "17:10:03", "remaining_time": "2:23:08"}
{"current_steps": 2320, "total_steps": 2631, "loss": 0.5524, "learning_rate": 5e-06, "epoch": 2.6438746438746437, "percentage": 88.18, "elapsed_time": "17:14:27", "remaining_time": "2:18:40"}
{"current_steps": 2330, "total_steps": 2631, "loss": 0.5552, "learning_rate": 5e-06, "epoch": 2.6552706552706553, "percentage": 88.56, "elapsed_time": "17:18:51", "remaining_time": "2:14:12"}
{"current_steps": 2340, "total_steps": 2631, "loss": 0.5534, "learning_rate": 5e-06, "epoch": 2.6666666666666665, "percentage": 88.94, "elapsed_time": "17:23:14", "remaining_time": "2:09:44"}
{"current_steps": 2350, "total_steps": 2631, "loss": 0.5467, "learning_rate": 5e-06, "epoch": 2.678062678062678, "percentage": 89.32, "elapsed_time": "17:27:37", "remaining_time": "2:05:16"}
{"current_steps": 2360, "total_steps": 2631, "loss": 0.5565, "learning_rate": 5e-06, "epoch": 2.6894586894586894, "percentage": 89.7, "elapsed_time": "17:32:00", "remaining_time": "2:00:48"}
{"current_steps": 2370, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.700854700854701, "percentage": 90.08, "elapsed_time": "17:36:24", "remaining_time": "1:56:20"}
{"current_steps": 2380, "total_steps": 2631, "loss": 0.5563, "learning_rate": 5e-06, "epoch": 2.7122507122507122, "percentage": 90.46, "elapsed_time": "17:40:48", "remaining_time": "1:51:52"}
{"current_steps": 2390, "total_steps": 2631, "loss": 0.5551, "learning_rate": 5e-06, "epoch": 2.7236467236467234, "percentage": 90.84, "elapsed_time": "17:45:11", "remaining_time": "1:47:24"}
{"current_steps": 2400, "total_steps": 2631, "loss": 0.5539, "learning_rate": 5e-06, "epoch": 2.735042735042735, "percentage": 91.22, "elapsed_time": "17:49:34", "remaining_time": "1:42:56"}
{"current_steps": 2410, "total_steps": 2631, "loss": 0.5588, "learning_rate": 5e-06, "epoch": 2.7464387464387463, "percentage": 91.6, "elapsed_time": "17:53:57", "remaining_time": "1:38:28"}
{"current_steps": 2420, "total_steps": 2631, "loss": 0.5575, "learning_rate": 5e-06, "epoch": 2.757834757834758, "percentage": 91.98, "elapsed_time": "17:58:20", "remaining_time": "1:34:01"}
{"current_steps": 2430, "total_steps": 2631, "loss": 0.5471, "learning_rate": 5e-06, "epoch": 2.769230769230769, "percentage": 92.36, "elapsed_time": "18:02:43", "remaining_time": "1:29:33"}
{"current_steps": 2440, "total_steps": 2631, "loss": 0.5468, "learning_rate": 5e-06, "epoch": 2.780626780626781, "percentage": 92.74, "elapsed_time": "18:07:05", "remaining_time": "1:25:05"}
{"current_steps": 2450, "total_steps": 2631, "loss": 0.5501, "learning_rate": 5e-06, "epoch": 2.792022792022792, "percentage": 93.12, "elapsed_time": "18:11:29", "remaining_time": "1:20:38"}
{"current_steps": 2460, "total_steps": 2631, "loss": 0.5444, "learning_rate": 5e-06, "epoch": 2.8034188034188032, "percentage": 93.5, "elapsed_time": "18:15:53", "remaining_time": "1:16:10"}
{"current_steps": 2470, "total_steps": 2631, "loss": 0.5601, "learning_rate": 5e-06, "epoch": 2.814814814814815, "percentage": 93.88, "elapsed_time": "18:20:16", "remaining_time": "1:11:43"}
{"current_steps": 2480, "total_steps": 2631, "loss": 0.5623, "learning_rate": 5e-06, "epoch": 2.826210826210826, "percentage": 94.26, "elapsed_time": "18:24:38", "remaining_time": "1:07:15"}
{"current_steps": 2490, "total_steps": 2631, "loss": 0.5543, "learning_rate": 5e-06, "epoch": 2.8376068376068377, "percentage": 94.64, "elapsed_time": "18:29:02", "remaining_time": "1:02:48"}
{"current_steps": 2500, "total_steps": 2631, "loss": 0.562, "learning_rate": 5e-06, "epoch": 2.849002849002849, "percentage": 95.02, "elapsed_time": "18:33:25", "remaining_time": "0:58:20"}
{"current_steps": 2510, "total_steps": 2631, "loss": 0.5536, "learning_rate": 5e-06, "epoch": 2.8603988603988606, "percentage": 95.4, "elapsed_time": "18:37:48", "remaining_time": "0:53:53"}
{"current_steps": 2520, "total_steps": 2631, "loss": 0.5539, "learning_rate": 5e-06, "epoch": 2.871794871794872, "percentage": 95.78, "elapsed_time": "18:42:12", "remaining_time": "0:49:25"}
{"current_steps": 2530, "total_steps": 2631, "loss": 0.5601, "learning_rate": 5e-06, "epoch": 2.883190883190883, "percentage": 96.16, "elapsed_time": "18:46:36", "remaining_time": "0:44:58"}
{"current_steps": 2540, "total_steps": 2631, "loss": 0.5557, "learning_rate": 5e-06, "epoch": 2.8945868945868947, "percentage": 96.54, "elapsed_time": "18:50:59", "remaining_time": "0:40:31"}
{"current_steps": 2550, "total_steps": 2631, "loss": 0.5528, "learning_rate": 5e-06, "epoch": 2.905982905982906, "percentage": 96.92, "elapsed_time": "18:55:22", "remaining_time": "0:36:03"}
{"current_steps": 2560, "total_steps": 2631, "loss": 0.5416, "learning_rate": 5e-06, "epoch": 2.9173789173789175, "percentage": 97.3, "elapsed_time": "18:59:45", "remaining_time": "0:31:36"}
{"current_steps": 2570, "total_steps": 2631, "loss": 0.5471, "learning_rate": 5e-06, "epoch": 2.9287749287749287, "percentage": 97.68, "elapsed_time": "19:04:09", "remaining_time": "0:27:09"}
{"current_steps": 2580, "total_steps": 2631, "loss": 0.5438, "learning_rate": 5e-06, "epoch": 2.9401709401709404, "percentage": 98.06, "elapsed_time": "19:08:33", "remaining_time": "0:22:42"}
{"current_steps": 2590, "total_steps": 2631, "loss": 0.5533, "learning_rate": 5e-06, "epoch": 2.9515669515669516, "percentage": 98.44, "elapsed_time": "19:12:56", "remaining_time": "0:18:15"}
{"current_steps": 2600, "total_steps": 2631, "loss": 0.5446, "learning_rate": 5e-06, "epoch": 2.962962962962963, "percentage": 98.82, "elapsed_time": "19:17:19", "remaining_time": "0:13:47"}
{"current_steps": 2610, "total_steps": 2631, "loss": 0.556, "learning_rate": 5e-06, "epoch": 2.9743589743589745, "percentage": 99.2, "elapsed_time": "19:21:43", "remaining_time": "0:09:20"}
{"current_steps": 2620, "total_steps": 2631, "loss": 0.5571, "learning_rate": 5e-06, "epoch": 2.9857549857549857, "percentage": 99.58, "elapsed_time": "19:26:07", "remaining_time": "0:04:53"}
{"current_steps": 2630, "total_steps": 2631, "loss": 0.5443, "learning_rate": 5e-06, "epoch": 2.9971509971509973, "percentage": 99.96, "elapsed_time": "19:30:29", "remaining_time": "0:00:26"}
{"current_steps": 2631, "total_steps": 2631, "eval_loss": 0.6213015913963318, "epoch": 2.9982905982905983, "percentage": 100.0, "elapsed_time": "19:39:26", "remaining_time": "0:00:00"}
{"current_steps": 2631, "total_steps": 2631, "epoch": 2.9982905982905983, "percentage": 100.0, "elapsed_time": "19:40:49", "remaining_time": "0:00:00"}