kurosekurose committed on
Commit
0605546
1 Parent(s): 1f5b79b

End of training

Browse files
Files changed (3) hide show
  1. pytorch_model.bin +1 -1
  2. trainer_state.json +193 -118
  3. training_args.bin +1 -1
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:348ab06f94fbbb9a4199388bb3e4280f3c923b86ec82c2428d19d8ce781444bd
3
  size 379933779
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb729785e010720003468bbd578129098f1d9623cf3713742d472e8e9688714a
3
  size 379933779
trainer_state.json CHANGED
@@ -1,250 +1,325 @@
1
  {
2
- "best_metric": 0.7735137939453125,
3
- "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-348",
4
- "epoch": 14.994285714285715,
5
- "global_step": 870,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.99,
12
- "learning_rate": 1.9333333333333336e-06,
13
- "loss": 1.3867,
14
  "step": 58
15
  },
16
  {
17
  "epoch": 0.99,
18
- "eval_accuracy": 0.3285714387893677,
19
- "eval_loss": 1.3517659902572632,
20
- "eval_runtime": 46.5999,
21
- "eval_samples_per_second": 1.502,
22
- "eval_steps_per_second": 0.386,
23
  "step": 58
24
  },
25
  {
26
  "epoch": 1.99,
27
- "learning_rate": 3.866666666666667e-06,
28
- "loss": 1.2842,
29
  "step": 116
30
  },
31
  {
32
  "epoch": 1.99,
33
- "eval_accuracy": 0.4571428596973419,
34
- "eval_loss": 1.18719482421875,
35
- "eval_runtime": 46.74,
36
- "eval_samples_per_second": 1.498,
37
- "eval_steps_per_second": 0.385,
38
  "step": 116
39
  },
40
  {
41
  "epoch": 2.99,
42
- "learning_rate": 5.8e-06,
43
- "loss": 1.0725,
44
  "step": 174
45
  },
46
  {
47
  "epoch": 2.99,
48
- "eval_accuracy": 0.5571428537368774,
49
- "eval_loss": 1.0476346015930176,
50
- "eval_runtime": 46.9576,
51
- "eval_samples_per_second": 1.491,
52
- "eval_steps_per_second": 0.383,
53
  "step": 174
54
  },
55
  {
56
  "epoch": 3.99,
57
- "learning_rate": 7.733333333333334e-06,
58
- "loss": 0.9343,
59
  "step": 232
60
  },
61
  {
62
  "epoch": 3.99,
63
- "eval_accuracy": 0.5714285969734192,
64
- "eval_loss": 0.9676682949066162,
65
- "eval_runtime": 46.68,
66
- "eval_samples_per_second": 1.5,
67
- "eval_steps_per_second": 0.386,
68
  "step": 232
69
  },
70
  {
71
  "epoch": 4.99,
72
- "learning_rate": 9.666666666666667e-06,
73
- "loss": 0.8053,
74
  "step": 290
75
  },
76
  {
77
  "epoch": 4.99,
78
- "eval_accuracy": 0.6142857074737549,
79
- "eval_loss": 0.9524909257888794,
80
- "eval_runtime": 46.7102,
81
- "eval_samples_per_second": 1.499,
82
- "eval_steps_per_second": 0.385,
83
  "step": 290
84
  },
85
  {
86
  "epoch": 5.99,
87
- "learning_rate": 9.157894736842105e-06,
88
- "loss": 0.7895,
89
  "step": 348
90
  },
91
  {
92
  "epoch": 5.99,
93
- "eval_accuracy": 0.6857143044471741,
94
- "eval_loss": 0.7735137939453125,
95
- "eval_runtime": 46.9896,
96
- "eval_samples_per_second": 1.49,
97
- "eval_steps_per_second": 0.383,
98
  "step": 348
99
  },
100
  {
101
  "epoch": 6.99,
102
- "learning_rate": 8.140350877192983e-06,
103
- "loss": 0.6867,
104
  "step": 406
105
  },
106
  {
107
  "epoch": 6.99,
108
- "eval_accuracy": 0.6428571343421936,
109
- "eval_loss": 0.8555552363395691,
110
- "eval_runtime": 46.718,
111
- "eval_samples_per_second": 1.498,
112
- "eval_steps_per_second": 0.385,
113
  "step": 406
114
  },
115
  {
116
  "epoch": 7.99,
117
- "learning_rate": 7.140350877192983e-06,
118
- "loss": 0.6218,
119
  "step": 464
120
  },
121
  {
122
  "epoch": 7.99,
123
- "eval_accuracy": 0.6714285612106323,
124
- "eval_loss": 0.8454030156135559,
125
- "eval_runtime": 46.4466,
126
- "eval_samples_per_second": 1.507,
127
- "eval_steps_per_second": 0.388,
128
  "step": 464
129
  },
130
  {
131
  "epoch": 8.99,
132
- "learning_rate": 6.140350877192983e-06,
133
- "loss": 0.558,
134
  "step": 522
135
  },
136
  {
137
  "epoch": 8.99,
138
- "eval_accuracy": 0.6571428775787354,
139
- "eval_loss": 0.8404667973518372,
140
- "eval_runtime": 46.7611,
141
- "eval_samples_per_second": 1.497,
142
- "eval_steps_per_second": 0.385,
143
  "step": 522
144
  },
145
  {
146
  "epoch": 9.99,
147
- "learning_rate": 5.12280701754386e-06,
148
- "loss": 0.5033,
149
  "step": 580
150
  },
151
  {
152
  "epoch": 9.99,
153
- "eval_accuracy": 0.6285714507102966,
154
- "eval_loss": 1.0190438032150269,
155
- "eval_runtime": 47.1353,
156
- "eval_samples_per_second": 1.485,
157
- "eval_steps_per_second": 0.382,
158
  "step": 580
159
  },
160
  {
161
  "epoch": 10.99,
162
- "learning_rate": 4.105263157894737e-06,
163
- "loss": 0.4403,
164
  "step": 638
165
  },
166
  {
167
  "epoch": 10.99,
168
- "eval_accuracy": 0.699999988079071,
169
- "eval_loss": 0.82489013671875,
170
- "eval_runtime": 46.7633,
171
- "eval_samples_per_second": 1.497,
172
- "eval_steps_per_second": 0.385,
173
  "step": 638
174
  },
175
  {
176
  "epoch": 11.99,
177
- "learning_rate": 3.0877192982456146e-06,
178
- "loss": 0.3995,
179
  "step": 696
180
  },
181
  {
182
  "epoch": 11.99,
183
- "eval_accuracy": 0.7142857313156128,
184
- "eval_loss": 0.8996997475624084,
185
- "eval_runtime": 46.7333,
186
- "eval_samples_per_second": 1.498,
187
- "eval_steps_per_second": 0.385,
188
  "step": 696
189
  },
190
  {
191
  "epoch": 12.99,
192
- "learning_rate": 2.0701754385964913e-06,
193
- "loss": 0.3534,
194
  "step": 754
195
  },
196
  {
197
  "epoch": 12.99,
198
- "eval_accuracy": 0.699999988079071,
199
- "eval_loss": 0.9177280068397522,
200
- "eval_runtime": 46.7502,
201
- "eval_samples_per_second": 1.497,
202
- "eval_steps_per_second": 0.385,
203
  "step": 754
204
  },
205
  {
206
  "epoch": 13.99,
207
- "learning_rate": 1.0526315789473685e-06,
208
- "loss": 0.3023,
209
  "step": 812
210
  },
211
  {
212
  "epoch": 13.99,
213
- "eval_accuracy": 0.6571428775787354,
214
- "eval_loss": 0.9544177651405334,
215
- "eval_runtime": 46.7592,
216
- "eval_samples_per_second": 1.497,
217
- "eval_steps_per_second": 0.385,
218
  "step": 812
219
  },
220
  {
221
  "epoch": 14.99,
222
- "learning_rate": 3.508771929824562e-08,
223
- "loss": 0.2752,
224
  "step": 870
225
  },
226
  {
227
  "epoch": 14.99,
228
- "eval_accuracy": 0.699999988079071,
229
- "eval_loss": 0.9346058964729309,
230
- "eval_runtime": 46.4397,
231
- "eval_samples_per_second": 1.507,
232
- "eval_steps_per_second": 0.388,
233
  "step": 870
234
  },
235
  {
236
- "epoch": 14.99,
237
- "step": 870,
238
- "total_flos": 4.99147314409986e+18,
239
- "train_loss": 0.6941862314596944,
240
- "train_runtime": 20182.4464,
241
- "train_samples_per_second": 0.52,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
242
  "train_steps_per_second": 0.043
243
  }
244
  ],
245
- "max_steps": 870,
246
- "num_train_epochs": 15,
247
- "total_flos": 4.99147314409986e+18,
248
  "trial_name": null,
249
  "trial_params": null
250
  }
 
1
  {
2
+ "best_metric": 0.7888200283050537,
3
+ "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-812",
4
+ "epoch": 19.994285714285713,
5
+ "global_step": 1160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.99,
12
+ "learning_rate": 1.1600000000000001e-06,
13
+ "loss": 1.393,
14
  "step": 58
15
  },
16
  {
17
  "epoch": 0.99,
18
+ "eval_accuracy": 0.5285714268684387,
19
+ "eval_loss": 1.3617215156555176,
20
+ "eval_runtime": 48.0313,
21
+ "eval_samples_per_second": 1.457,
22
+ "eval_steps_per_second": 0.375,
23
  "step": 58
24
  },
25
  {
26
  "epoch": 1.99,
27
+ "learning_rate": 2.3200000000000002e-06,
28
+ "loss": 1.3257,
29
  "step": 116
30
  },
31
  {
32
  "epoch": 1.99,
33
+ "eval_accuracy": 0.4000000059604645,
34
+ "eval_loss": 1.2633056640625,
35
+ "eval_runtime": 48.3007,
36
+ "eval_samples_per_second": 1.449,
37
+ "eval_steps_per_second": 0.373,
38
  "step": 116
39
  },
40
  {
41
  "epoch": 2.99,
42
+ "learning_rate": 3.48e-06,
43
+ "loss": 1.175,
44
  "step": 174
45
  },
46
  {
47
  "epoch": 2.99,
48
+ "eval_accuracy": 0.4000000059604645,
49
+ "eval_loss": 1.11065673828125,
50
+ "eval_runtime": 48.0736,
51
+ "eval_samples_per_second": 1.456,
52
+ "eval_steps_per_second": 0.374,
53
  "step": 174
54
  },
55
  {
56
  "epoch": 3.99,
57
+ "learning_rate": 4.6400000000000005e-06,
58
+ "loss": 1.0229,
59
  "step": 232
60
  },
61
  {
62
  "epoch": 3.99,
63
+ "eval_accuracy": 0.4285714328289032,
64
+ "eval_loss": 1.0352715253829956,
65
+ "eval_runtime": 48.1873,
66
+ "eval_samples_per_second": 1.453,
67
+ "eval_steps_per_second": 0.374,
68
  "step": 232
69
  },
70
  {
71
  "epoch": 4.99,
72
+ "learning_rate": 5.8e-06,
73
+ "loss": 0.9276,
74
  "step": 290
75
  },
76
  {
77
  "epoch": 4.99,
78
+ "eval_accuracy": 0.37142857909202576,
79
+ "eval_loss": 1.0740830898284912,
80
+ "eval_runtime": 48.3346,
81
+ "eval_samples_per_second": 1.448,
82
+ "eval_steps_per_second": 0.372,
83
  "step": 290
84
  },
85
  {
86
  "epoch": 5.99,
87
+ "learning_rate": 6.96e-06,
88
+ "loss": 0.8505,
89
  "step": 348
90
  },
91
  {
92
  "epoch": 5.99,
93
+ "eval_accuracy": 0.6285714507102966,
94
+ "eval_loss": 0.9529690146446228,
95
+ "eval_runtime": 48.6491,
96
+ "eval_samples_per_second": 1.439,
97
+ "eval_steps_per_second": 0.37,
98
  "step": 348
99
  },
100
  {
101
  "epoch": 6.99,
102
+ "learning_rate": 8.120000000000002e-06,
103
+ "loss": 0.7713,
104
  "step": 406
105
  },
106
  {
107
  "epoch": 6.99,
108
+ "eval_accuracy": 0.6142857074737549,
109
+ "eval_loss": 0.9922705888748169,
110
+ "eval_runtime": 48.6353,
111
+ "eval_samples_per_second": 1.439,
112
+ "eval_steps_per_second": 0.37,
113
  "step": 406
114
  },
115
  {
116
  "epoch": 7.99,
117
+ "learning_rate": 9.280000000000001e-06,
118
+ "loss": 0.7208,
119
  "step": 464
120
  },
121
  {
122
  "epoch": 7.99,
123
+ "eval_accuracy": 0.6142857074737549,
124
+ "eval_loss": 0.8938446044921875,
125
+ "eval_runtime": 48.2669,
126
+ "eval_samples_per_second": 1.45,
127
+ "eval_steps_per_second": 0.373,
128
  "step": 464
129
  },
130
  {
131
  "epoch": 8.99,
132
+ "learning_rate": 9.666666666666667e-06,
133
+ "loss": 0.6573,
134
  "step": 522
135
  },
136
  {
137
  "epoch": 8.99,
138
+ "eval_accuracy": 0.6142857074737549,
139
+ "eval_loss": 1.0785200595855713,
140
+ "eval_runtime": 47.8068,
141
+ "eval_samples_per_second": 1.464,
142
+ "eval_steps_per_second": 0.377,
143
  "step": 522
144
  },
145
  {
146
  "epoch": 9.99,
147
+ "learning_rate": 8.787878787878788e-06,
148
+ "loss": 0.6134,
149
  "step": 580
150
  },
151
  {
152
  "epoch": 9.99,
153
+ "eval_accuracy": 0.6428571343421936,
154
+ "eval_loss": 0.9662051796913147,
155
+ "eval_runtime": 48.1596,
156
+ "eval_samples_per_second": 1.454,
157
+ "eval_steps_per_second": 0.374,
158
  "step": 580
159
  },
160
  {
161
  "epoch": 10.99,
162
+ "learning_rate": 7.909090909090909e-06,
163
+ "loss": 0.5514,
164
  "step": 638
165
  },
166
  {
167
  "epoch": 10.99,
168
+ "eval_accuracy": 0.6571428775787354,
169
+ "eval_loss": 0.9189529418945312,
170
+ "eval_runtime": 48.0311,
171
+ "eval_samples_per_second": 1.457,
172
+ "eval_steps_per_second": 0.375,
173
  "step": 638
174
  },
175
  {
176
  "epoch": 11.99,
177
+ "learning_rate": 7.030303030303031e-06,
178
+ "loss": 0.4643,
179
  "step": 696
180
  },
181
  {
182
  "epoch": 11.99,
183
+ "eval_accuracy": 0.6857143044471741,
184
+ "eval_loss": 0.8748092651367188,
185
+ "eval_runtime": 48.3032,
186
+ "eval_samples_per_second": 1.449,
187
+ "eval_steps_per_second": 0.373,
188
  "step": 696
189
  },
190
  {
191
  "epoch": 12.99,
192
+ "learning_rate": 6.166666666666667e-06,
193
+ "loss": 0.3946,
194
  "step": 754
195
  },
196
  {
197
  "epoch": 12.99,
198
+ "eval_accuracy": 0.6571428775787354,
199
+ "eval_loss": 0.9243893027305603,
200
+ "eval_runtime": 48.1936,
201
+ "eval_samples_per_second": 1.452,
202
+ "eval_steps_per_second": 0.373,
203
  "step": 754
204
  },
205
  {
206
  "epoch": 13.99,
207
+ "learning_rate": 5.287878787878788e-06,
208
+ "loss": 0.3875,
209
  "step": 812
210
  },
211
  {
212
  "epoch": 13.99,
213
+ "eval_accuracy": 0.7285714149475098,
214
+ "eval_loss": 0.7888200283050537,
215
+ "eval_runtime": 47.9295,
216
+ "eval_samples_per_second": 1.46,
217
+ "eval_steps_per_second": 0.376,
218
  "step": 812
219
  },
220
  {
221
  "epoch": 14.99,
222
+ "learning_rate": 4.409090909090909e-06,
223
+ "loss": 0.3044,
224
  "step": 870
225
  },
226
  {
227
  "epoch": 14.99,
228
+ "eval_accuracy": 0.6714285612106323,
229
+ "eval_loss": 0.8981361389160156,
230
+ "eval_runtime": 47.9952,
231
+ "eval_samples_per_second": 1.458,
232
+ "eval_steps_per_second": 0.375,
233
  "step": 870
234
  },
235
  {
236
+ "epoch": 15.99,
237
+ "learning_rate": 3.5303030303030304e-06,
238
+ "loss": 0.2794,
239
+ "step": 928
240
+ },
241
+ {
242
+ "epoch": 15.99,
243
+ "eval_accuracy": 0.6714285612106323,
244
+ "eval_loss": 0.8927078247070312,
245
+ "eval_runtime": 47.849,
246
+ "eval_samples_per_second": 1.463,
247
+ "eval_steps_per_second": 0.376,
248
+ "step": 928
249
+ },
250
+ {
251
+ "epoch": 16.99,
252
+ "learning_rate": 2.6515151515151514e-06,
253
+ "loss": 0.2307,
254
+ "step": 986
255
+ },
256
+ {
257
+ "epoch": 16.99,
258
+ "eval_accuracy": 0.6714285612106323,
259
+ "eval_loss": 0.9921481013298035,
260
+ "eval_runtime": 48.0049,
261
+ "eval_samples_per_second": 1.458,
262
+ "eval_steps_per_second": 0.375,
263
+ "step": 986
264
+ },
265
+ {
266
+ "epoch": 17.99,
267
+ "learning_rate": 1.7727272727272729e-06,
268
+ "loss": 0.2153,
269
+ "step": 1044
270
+ },
271
+ {
272
+ "epoch": 17.99,
273
+ "eval_accuracy": 0.6714285612106323,
274
+ "eval_loss": 0.979206919670105,
275
+ "eval_runtime": 47.8808,
276
+ "eval_samples_per_second": 1.462,
277
+ "eval_steps_per_second": 0.376,
278
+ "step": 1044
279
+ },
280
+ {
281
+ "epoch": 18.99,
282
+ "learning_rate": 8.93939393939394e-07,
283
+ "loss": 0.1805,
284
+ "step": 1102
285
+ },
286
+ {
287
+ "epoch": 18.99,
288
+ "eval_accuracy": 0.6714285612106323,
289
+ "eval_loss": 1.1085455417633057,
290
+ "eval_runtime": 48.1686,
291
+ "eval_samples_per_second": 1.453,
292
+ "eval_steps_per_second": 0.374,
293
+ "step": 1102
294
+ },
295
+ {
296
+ "epoch": 19.99,
297
+ "learning_rate": 3.0303030303030305e-08,
298
+ "loss": 0.1625,
299
+ "step": 1160
300
+ },
301
+ {
302
+ "epoch": 19.99,
303
+ "eval_accuracy": 0.6571428775787354,
304
+ "eval_loss": 1.0330772399902344,
305
+ "eval_runtime": 48.6,
306
+ "eval_samples_per_second": 1.44,
307
+ "eval_steps_per_second": 0.37,
308
+ "step": 1160
309
+ },
310
+ {
311
+ "epoch": 19.99,
312
+ "step": 1160,
313
+ "total_flos": 6.655036715585741e+18,
314
+ "train_loss": 0.6313976797564277,
315
+ "train_runtime": 27101.5799,
316
+ "train_samples_per_second": 0.517,
317
  "train_steps_per_second": 0.043
318
  }
319
  ],
320
+ "max_steps": 1160,
321
+ "num_train_epochs": 20,
322
+ "total_flos": 6.655036715585741e+18,
323
  "trial_name": null,
324
  "trial_params": null
325
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:129989de89a833eb0c8d9e960516ce76d7fddab79482e76bde4c7c1f16fb577e
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7928bd3831d9778b904dbb74e2262a29e5f3356eebda42137796d84d8e0c2218
3
  size 3055