charsiu committed on
Commit
bfe312e
1 Parent(s): 4f10a92

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +271 -0
trainer_state.json ADDED
@@ -0,0 +1,271 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0.9947774185525988,
5
+ "global_step": 8500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.06,
12
+ "learning_rate": 0.00015,
13
+ "loss": 2.3077,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.06,
18
+ "eval_loss": 0.9413899183273315,
19
+ "eval_phone_accuracy": 0.7518319068307362,
20
+ "eval_runtime": 12.1406,
21
+ "eval_samples_per_second": 16.474,
22
+ "eval_steps_per_second": 4.118,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 0.12,
27
+ "learning_rate": 0.0003,
28
+ "loss": 1.1762,
29
+ "step": 1000
30
+ },
31
+ {
32
+ "epoch": 0.12,
33
+ "eval_loss": 0.6205331683158875,
34
+ "eval_phone_accuracy": 0.8215267480076658,
35
+ "eval_runtime": 10.7397,
36
+ "eval_samples_per_second": 18.623,
37
+ "eval_steps_per_second": 4.656,
38
+ "step": 1000
39
+ },
40
+ {
41
+ "epoch": 0.18,
42
+ "learning_rate": 0.00028011664899257687,
43
+ "loss": 0.8235,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 0.18,
48
+ "eval_loss": 0.4551730751991272,
49
+ "eval_phone_accuracy": 0.8648594743186174,
50
+ "eval_runtime": 10.6304,
51
+ "eval_samples_per_second": 18.814,
52
+ "eval_steps_per_second": 4.703,
53
+ "step": 1500
54
+ },
55
+ {
56
+ "epoch": 0.23,
57
+ "learning_rate": 0.0002602332979851537,
58
+ "loss": 0.6647,
59
+ "step": 2000
60
+ },
61
+ {
62
+ "epoch": 0.23,
63
+ "eval_loss": 0.3814973533153534,
64
+ "eval_phone_accuracy": 0.8815525898176332,
65
+ "eval_runtime": 11.7606,
66
+ "eval_samples_per_second": 17.006,
67
+ "eval_steps_per_second": 4.251,
68
+ "step": 2000
69
+ },
70
+ {
71
+ "epoch": 0.29,
72
+ "learning_rate": 0.0002403499469777306,
73
+ "loss": 0.5809,
74
+ "step": 2500
75
+ },
76
+ {
77
+ "epoch": 0.29,
78
+ "eval_loss": 0.3442990481853485,
79
+ "eval_phone_accuracy": 0.8922361837370032,
80
+ "eval_runtime": 11.2643,
81
+ "eval_samples_per_second": 17.755,
82
+ "eval_steps_per_second": 4.439,
83
+ "step": 2500
84
+ },
85
+ {
86
+ "epoch": 0.35,
87
+ "learning_rate": 0.00022046659597030753,
88
+ "loss": 0.5289,
89
+ "step": 3000
90
+ },
91
+ {
92
+ "epoch": 0.35,
93
+ "eval_loss": 0.314848929643631,
94
+ "eval_phone_accuracy": 0.9002575509248419,
95
+ "eval_runtime": 11.2871,
96
+ "eval_samples_per_second": 17.719,
97
+ "eval_steps_per_second": 4.43,
98
+ "step": 3000
99
+ },
100
+ {
101
+ "epoch": 0.41,
102
+ "learning_rate": 0.0002005832449628844,
103
+ "loss": 0.4896,
104
+ "step": 3500
105
+ },
106
+ {
107
+ "epoch": 0.41,
108
+ "eval_loss": 0.30238407850265503,
109
+ "eval_phone_accuracy": 0.9030845408742857,
110
+ "eval_runtime": 11.2397,
111
+ "eval_samples_per_second": 17.794,
112
+ "eval_steps_per_second": 4.449,
113
+ "step": 3500
114
+ },
115
+ {
116
+ "epoch": 0.47,
117
+ "learning_rate": 0.0001806998939554613,
118
+ "loss": 0.4622,
119
+ "step": 4000
120
+ },
121
+ {
122
+ "epoch": 0.47,
123
+ "eval_loss": 0.2689047157764435,
124
+ "eval_phone_accuracy": 0.9141496917193476,
125
+ "eval_runtime": 12.0191,
126
+ "eval_samples_per_second": 16.64,
127
+ "eval_steps_per_second": 4.16,
128
+ "step": 4000
129
+ },
130
+ {
131
+ "epoch": 0.53,
132
+ "learning_rate": 0.00016081654294803816,
133
+ "loss": 0.4386,
134
+ "step": 4500
135
+ },
136
+ {
137
+ "epoch": 0.53,
138
+ "eval_loss": 0.2747265696525574,
139
+ "eval_phone_accuracy": 0.9112533277834144,
140
+ "eval_runtime": 11.09,
141
+ "eval_samples_per_second": 18.034,
142
+ "eval_steps_per_second": 4.509,
143
+ "step": 4500
144
+ },
145
+ {
146
+ "epoch": 0.59,
147
+ "learning_rate": 0.00014093319194061505,
148
+ "loss": 0.419,
149
+ "step": 5000
150
+ },
151
+ {
152
+ "epoch": 0.59,
153
+ "eval_loss": 0.2555970251560211,
154
+ "eval_phone_accuracy": 0.9181213524458666,
155
+ "eval_runtime": 11.6344,
156
+ "eval_samples_per_second": 17.19,
157
+ "eval_steps_per_second": 4.298,
158
+ "step": 5000
159
+ },
160
+ {
161
+ "epoch": 0.64,
162
+ "learning_rate": 0.00012104984093319194,
163
+ "loss": 0.4032,
164
+ "step": 5500
165
+ },
166
+ {
167
+ "epoch": 0.64,
168
+ "eval_loss": 0.2447209358215332,
169
+ "eval_phone_accuracy": 0.920003121829392,
170
+ "eval_runtime": 10.8148,
171
+ "eval_samples_per_second": 18.493,
172
+ "eval_steps_per_second": 4.623,
173
+ "step": 5500
174
+ },
175
+ {
176
+ "epoch": 0.7,
177
+ "learning_rate": 0.00010116648992576882,
178
+ "loss": 0.3892,
179
+ "step": 6000
180
+ },
181
+ {
182
+ "epoch": 0.7,
183
+ "eval_loss": 0.23665592074394226,
184
+ "eval_phone_accuracy": 0.9239054085694217,
185
+ "eval_runtime": 10.9341,
186
+ "eval_samples_per_second": 18.291,
187
+ "eval_steps_per_second": 4.573,
188
+ "step": 6000
189
+ },
190
+ {
191
+ "epoch": 0.76,
192
+ "learning_rate": 8.12831389183457e-05,
193
+ "loss": 0.3786,
194
+ "step": 6500
195
+ },
196
+ {
197
+ "epoch": 0.76,
198
+ "eval_loss": 0.2295096516609192,
199
+ "eval_phone_accuracy": 0.9251801555711647,
200
+ "eval_runtime": 10.8468,
201
+ "eval_samples_per_second": 18.439,
202
+ "eval_steps_per_second": 4.61,
203
+ "step": 6500
204
+ },
205
+ {
206
+ "epoch": 0.82,
207
+ "learning_rate": 6.139978791092258e-05,
208
+ "loss": 0.3701,
209
+ "step": 7000
210
+ },
211
+ {
212
+ "epoch": 0.82,
213
+ "eval_loss": 0.22638411819934845,
214
+ "eval_phone_accuracy": 0.9254229645238776,
215
+ "eval_runtime": 10.8611,
216
+ "eval_samples_per_second": 18.414,
217
+ "eval_steps_per_second": 4.604,
218
+ "step": 7000
219
+ },
220
+ {
221
+ "epoch": 0.88,
222
+ "learning_rate": 4.151643690349946e-05,
223
+ "loss": 0.3592,
224
+ "step": 7500
225
+ },
226
+ {
227
+ "epoch": 0.88,
228
+ "eval_loss": 0.2183924913406372,
229
+ "eval_phone_accuracy": 0.9286401831473243,
230
+ "eval_runtime": 11.5166,
231
+ "eval_samples_per_second": 17.366,
232
+ "eval_steps_per_second": 4.342,
233
+ "step": 7500
234
+ },
235
+ {
236
+ "epoch": 0.94,
237
+ "learning_rate": 2.163308589607635e-05,
238
+ "loss": 0.3511,
239
+ "step": 8000
240
+ },
241
+ {
242
+ "epoch": 0.94,
243
+ "eval_loss": 0.2142486721277237,
244
+ "eval_phone_accuracy": 0.9288309616101702,
245
+ "eval_runtime": 11.0635,
246
+ "eval_samples_per_second": 18.077,
247
+ "eval_steps_per_second": 4.519,
248
+ "step": 8000
249
+ },
250
+ {
251
+ "epoch": 0.99,
252
+ "learning_rate": 1.7497348886532342e-06,
253
+ "loss": 0.3459,
254
+ "step": 8500
255
+ },
256
+ {
257
+ "epoch": 0.99,
258
+ "eval_loss": 0.2112182378768921,
259
+ "eval_phone_accuracy": 0.9303051588230703,
260
+ "eval_runtime": 10.7118,
261
+ "eval_samples_per_second": 18.671,
262
+ "eval_steps_per_second": 4.668,
263
+ "step": 8500
264
+ }
265
+ ],
266
+ "max_steps": 8544,
267
+ "num_train_epochs": 1,
268
+ "total_flos": 1.2317797842209997e+19,
269
+ "trial_name": null,
270
+ "trial_params": null
271
+ }