kurosekurose committed on
Commit
7e763e1
1 Parent(s): 57ab6ba

End of training

Browse files
Files changed (3) hide show
  1. pytorch_model.bin +1 -1
  2. trainer_state.json +127 -277
  3. training_args.bin +1 -1
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbd58cd935301cd872d7f66acefe198815b34137c7737f8630f292d3366423a4
3
  size 379933779
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7457c6eea8ce91eb1e913e2bdae191fa9f401dce20c54b7f58078596e6ecc698
3
  size 379933779
trainer_state.json CHANGED
@@ -1,325 +1,175 @@
1
  {
2
- "best_metric": 0.8695746660232544,
3
- "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-522",
4
- "epoch": 19.994285714285713,
5
- "global_step": 1160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.99,
12
- "learning_rate": 1.1600000000000001e-06,
13
- "loss": 1.3846,
14
- "step": 58
15
  },
16
  {
17
- "epoch": 0.99,
18
- "eval_accuracy": 0.41428571939468384,
19
- "eval_loss": 1.3525933027267456,
20
- "eval_runtime": 48.4658,
21
- "eval_samples_per_second": 1.444,
22
- "eval_steps_per_second": 0.371,
23
- "step": 58
24
  },
25
  {
26
- "epoch": 1.99,
27
- "learning_rate": 2.3200000000000002e-06,
28
- "loss": 1.3182,
29
- "step": 116
30
  },
31
  {
32
- "epoch": 1.99,
33
- "eval_accuracy": 0.48571428656578064,
34
- "eval_loss": 1.2529839277267456,
35
- "eval_runtime": 48.2009,
36
- "eval_samples_per_second": 1.452,
37
- "eval_steps_per_second": 0.373,
38
- "step": 116
39
  },
40
  {
41
- "epoch": 2.99,
42
- "learning_rate": 3.48e-06,
43
- "loss": 1.1606,
44
- "step": 174
45
  },
46
  {
47
- "epoch": 2.99,
48
- "eval_accuracy": 0.4000000059604645,
49
- "eval_loss": 1.0961982011795044,
50
- "eval_runtime": 48.4788,
51
- "eval_samples_per_second": 1.444,
52
- "eval_steps_per_second": 0.371,
53
- "step": 174
54
  },
55
  {
56
- "epoch": 3.99,
57
- "learning_rate": 4.6400000000000005e-06,
58
- "loss": 1.0104,
59
- "step": 232
60
  },
61
  {
62
- "epoch": 3.99,
63
- "eval_accuracy": 0.44285714626312256,
64
- "eval_loss": 1.0213487148284912,
65
- "eval_runtime": 48.0421,
66
- "eval_samples_per_second": 1.457,
67
- "eval_steps_per_second": 0.375,
68
- "step": 232
69
  },
70
  {
71
- "epoch": 4.99,
72
- "learning_rate": 5.8e-06,
73
- "loss": 0.9127,
74
- "step": 290
75
  },
76
  {
77
- "epoch": 4.99,
78
- "eval_accuracy": 0.48571428656578064,
79
- "eval_loss": 0.9955207109451294,
80
- "eval_runtime": 48.3011,
81
- "eval_samples_per_second": 1.449,
82
- "eval_steps_per_second": 0.373,
83
- "step": 290
84
- },
85
- {
86
- "epoch": 5.99,
87
- "learning_rate": 6.96e-06,
88
- "loss": 0.8464,
89
- "step": 348
90
- },
91
- {
92
- "epoch": 5.99,
93
- "eval_accuracy": 0.5857142806053162,
94
- "eval_loss": 0.9400736689567566,
95
- "eval_runtime": 48.3878,
96
- "eval_samples_per_second": 1.447,
97
- "eval_steps_per_second": 0.372,
98
- "step": 348
99
- },
100
- {
101
- "epoch": 6.99,
102
- "learning_rate": 8.120000000000002e-06,
103
- "loss": 0.787,
104
- "step": 406
105
- },
106
- {
107
- "epoch": 6.99,
108
- "eval_accuracy": 0.6571428775787354,
109
- "eval_loss": 0.9043138027191162,
110
- "eval_runtime": 48.4438,
111
- "eval_samples_per_second": 1.445,
112
- "eval_steps_per_second": 0.372,
113
- "step": 406
114
- },
115
- {
116
- "epoch": 7.99,
117
- "learning_rate": 9.260000000000001e-06,
118
- "loss": 0.7181,
119
- "step": 464
120
- },
121
- {
122
- "epoch": 7.99,
123
- "eval_accuracy": 0.6000000238418579,
124
- "eval_loss": 0.9584859013557434,
125
- "eval_runtime": 48.0745,
126
- "eval_samples_per_second": 1.456,
127
- "eval_steps_per_second": 0.374,
128
- "step": 464
129
- },
130
- {
131
- "epoch": 8.99,
132
- "learning_rate": 9.681818181818182e-06,
133
- "loss": 0.6804,
134
- "step": 522
135
- },
136
- {
137
- "epoch": 8.99,
138
- "eval_accuracy": 0.6285714507102966,
139
- "eval_loss": 0.8695746660232544,
140
- "eval_runtime": 48.2058,
141
- "eval_samples_per_second": 1.452,
142
- "eval_steps_per_second": 0.373,
143
- "step": 522
144
- },
145
- {
146
- "epoch": 9.99,
147
- "learning_rate": 8.818181818181819e-06,
148
- "loss": 0.6065,
149
- "step": 580
150
- },
151
- {
152
- "epoch": 9.99,
153
- "eval_accuracy": 0.6285714507102966,
154
- "eval_loss": 0.9474284052848816,
155
- "eval_runtime": 48.413,
156
- "eval_samples_per_second": 1.446,
157
- "eval_steps_per_second": 0.372,
158
- "step": 580
159
  },
160
  {
161
- "epoch": 10.99,
162
- "learning_rate": 7.93939393939394e-06,
163
- "loss": 0.6316,
164
- "step": 638
165
  },
166
  {
167
- "epoch": 10.99,
168
  "eval_accuracy": 0.6857143044471741,
169
- "eval_loss": 0.9475699663162231,
170
- "eval_runtime": 47.8485,
171
- "eval_samples_per_second": 1.463,
172
- "eval_steps_per_second": 0.376,
173
- "step": 638
174
- },
175
- {
176
- "epoch": 11.99,
177
- "learning_rate": 7.060606060606061e-06,
178
- "loss": 0.517,
179
- "step": 696
180
  },
181
  {
182
- "epoch": 11.99,
183
- "eval_accuracy": 0.6571428775787354,
184
- "eval_loss": 0.9657440185546875,
185
- "eval_runtime": 48.3215,
186
- "eval_samples_per_second": 1.449,
187
- "eval_steps_per_second": 0.373,
188
- "step": 696
189
  },
190
  {
191
- "epoch": 12.99,
192
- "learning_rate": 6.181818181818182e-06,
193
- "loss": 0.4487,
194
- "step": 754
195
- },
196
- {
197
- "epoch": 12.99,
198
- "eval_accuracy": 0.6428571343421936,
199
- "eval_loss": 1.0147874355316162,
200
- "eval_runtime": 48.212,
201
- "eval_samples_per_second": 1.452,
202
- "eval_steps_per_second": 0.373,
203
- "step": 754
204
- },
205
- {
206
- "epoch": 13.99,
207
- "learning_rate": 5.303030303030303e-06,
208
- "loss": 0.4093,
209
- "step": 812
210
- },
211
- {
212
- "epoch": 13.99,
213
  "eval_accuracy": 0.6714285612106323,
214
- "eval_loss": 0.9352009892463684,
215
- "eval_runtime": 47.9193,
216
- "eval_samples_per_second": 1.461,
217
- "eval_steps_per_second": 0.376,
218
- "step": 812
219
- },
220
- {
221
- "epoch": 14.99,
222
- "learning_rate": 4.424242424242425e-06,
223
- "loss": 0.3458,
224
- "step": 870
225
- },
226
- {
227
- "epoch": 14.99,
228
- "eval_accuracy": 0.6571428775787354,
229
- "eval_loss": 1.01514732837677,
230
- "eval_runtime": 47.8767,
231
- "eval_samples_per_second": 1.462,
232
- "eval_steps_per_second": 0.376,
233
- "step": 870
234
- },
235
- {
236
- "epoch": 15.99,
237
- "learning_rate": 3.5454545454545458e-06,
238
- "loss": 0.3082,
239
- "step": 928
240
  },
241
  {
242
- "epoch": 15.99,
243
- "eval_accuracy": 0.6571428775787354,
244
- "eval_loss": 1.0875554084777832,
245
- "eval_runtime": 47.9039,
246
- "eval_samples_per_second": 1.461,
247
- "eval_steps_per_second": 0.376,
248
- "step": 928
249
  },
250
  {
251
- "epoch": 16.99,
252
- "learning_rate": 2.666666666666667e-06,
253
- "loss": 0.2619,
254
- "step": 986
255
- },
256
- {
257
- "epoch": 16.99,
258
- "eval_accuracy": 0.699999988079071,
259
- "eval_loss": 0.9961318969726562,
260
- "eval_runtime": 47.6669,
261
- "eval_samples_per_second": 1.469,
262
- "eval_steps_per_second": 0.378,
263
- "step": 986
264
- },
265
- {
266
- "epoch": 17.99,
267
- "learning_rate": 1.787878787878788e-06,
268
- "loss": 0.2332,
269
- "step": 1044
270
- },
271
- {
272
- "epoch": 17.99,
273
  "eval_accuracy": 0.6714285612106323,
274
- "eval_loss": 1.15262770652771,
275
- "eval_runtime": 48.0091,
276
- "eval_samples_per_second": 1.458,
277
- "eval_steps_per_second": 0.375,
278
- "step": 1044
279
  },
280
  {
281
- "epoch": 18.99,
282
- "learning_rate": 9.090909090909091e-07,
283
- "loss": 0.2029,
284
- "step": 1102
285
  },
286
  {
287
- "epoch": 18.99,
288
- "eval_accuracy": 0.699999988079071,
289
- "eval_loss": 1.0439351797103882,
290
- "eval_runtime": 47.7114,
291
- "eval_samples_per_second": 1.467,
292
- "eval_steps_per_second": 0.377,
293
- "step": 1102
294
- },
295
- {
296
- "epoch": 19.99,
297
- "learning_rate": 3.0303030303030305e-08,
298
- "loss": 0.1781,
299
- "step": 1160
300
- },
301
- {
302
- "epoch": 19.99,
303
- "eval_accuracy": 0.6857143044471741,
304
- "eval_loss": 1.0611016750335693,
305
- "eval_runtime": 47.5705,
306
- "eval_samples_per_second": 1.472,
307
- "eval_steps_per_second": 0.378,
308
- "step": 1160
309
- },
310
- {
311
- "epoch": 19.99,
312
- "step": 1160,
313
- "total_flos": 6.655036715585741e+18,
314
- "train_loss": 0.6480823286648454,
315
- "train_runtime": 27204.8,
316
- "train_samples_per_second": 0.515,
317
- "train_steps_per_second": 0.043
318
  }
319
  ],
320
- "max_steps": 1160,
321
- "num_train_epochs": 20,
322
- "total_flos": 6.655036715585741e+18,
323
  "trial_name": null,
324
  "trial_params": null
325
  }
 
1
  {
2
+ "best_metric": 0.9727444052696228,
3
+ "best_model_checkpoint": "kurosekurose/wav2vec2-base-EMOPIA/checkpoint-525",
4
+ "epoch": 10.0,
5
+ "global_step": 1750,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.0,
12
+ "learning_rate": 3.5e-06,
13
+ "loss": 1.3252,
14
+ "step": 175
15
  },
16
  {
17
+ "epoch": 1.0,
18
+ "eval_accuracy": 0.4285714328289032,
19
+ "eval_loss": 1.2177598476409912,
20
+ "eval_runtime": 47.4346,
21
+ "eval_samples_per_second": 1.476,
22
+ "eval_steps_per_second": 0.379,
23
+ "step": 175
24
  },
25
  {
26
+ "epoch": 2.0,
27
+ "learning_rate": 6.98e-06,
28
+ "loss": 1.039,
29
+ "step": 350
30
  },
31
  {
32
+ "epoch": 2.0,
33
+ "eval_accuracy": 0.5714285969734192,
34
+ "eval_loss": 1.0262044668197632,
35
+ "eval_runtime": 47.2654,
36
+ "eval_samples_per_second": 1.481,
37
+ "eval_steps_per_second": 0.381,
38
+ "step": 350
39
  },
40
  {
41
+ "epoch": 3.0,
42
+ "learning_rate": 9.808000000000002e-06,
43
+ "loss": 0.9232,
44
+ "step": 525
45
  },
46
  {
47
+ "epoch": 3.0,
48
+ "eval_accuracy": 0.5714285969734192,
49
+ "eval_loss": 0.9727444052696228,
50
+ "eval_runtime": 47.5019,
51
+ "eval_samples_per_second": 1.474,
52
+ "eval_steps_per_second": 0.379,
53
+ "step": 525
54
  },
55
  {
56
+ "epoch": 4.0,
57
+ "learning_rate": 8.408e-06,
58
+ "loss": 0.8248,
59
+ "step": 700
60
  },
61
  {
62
+ "epoch": 4.0,
63
+ "eval_accuracy": 0.5142857432365417,
64
+ "eval_loss": 1.0024999380111694,
65
+ "eval_runtime": 47.3119,
66
+ "eval_samples_per_second": 1.48,
67
+ "eval_steps_per_second": 0.38,
68
+ "step": 700
69
  },
70
  {
71
+ "epoch": 5.0,
72
+ "learning_rate": 7.0080000000000005e-06,
73
+ "loss": 0.7389,
74
+ "step": 875
75
  },
76
  {
77
+ "epoch": 5.0,
78
+ "eval_accuracy": 0.6428571343421936,
79
+ "eval_loss": 0.9947425127029419,
80
+ "eval_runtime": 47.6424,
81
+ "eval_samples_per_second": 1.469,
82
+ "eval_steps_per_second": 0.378,
83
+ "step": 875
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84
  },
85
  {
86
+ "epoch": 6.0,
87
+ "learning_rate": 5.616e-06,
88
+ "loss": 0.6253,
89
+ "step": 1050
90
  },
91
  {
92
+ "epoch": 6.0,
93
  "eval_accuracy": 0.6857143044471741,
94
+ "eval_loss": 1.0144152641296387,
95
+ "eval_runtime": 47.3265,
96
+ "eval_samples_per_second": 1.479,
97
+ "eval_steps_per_second": 0.38,
98
+ "step": 1050
 
 
 
 
 
 
99
  },
100
  {
101
+ "epoch": 7.0,
102
+ "learning_rate": 4.216e-06,
103
+ "loss": 0.5691,
104
+ "step": 1225
 
 
 
105
  },
106
  {
107
+ "epoch": 7.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
108
  "eval_accuracy": 0.6714285612106323,
109
+ "eval_loss": 1.0645909309387207,
110
+ "eval_runtime": 47.3515,
111
+ "eval_samples_per_second": 1.478,
112
+ "eval_steps_per_second": 0.38,
113
+ "step": 1225
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
114
  },
115
  {
116
+ "epoch": 8.0,
117
+ "learning_rate": 2.824e-06,
118
+ "loss": 0.5264,
119
+ "step": 1400
 
 
 
120
  },
121
  {
122
+ "epoch": 8.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  "eval_accuracy": 0.6714285612106323,
124
+ "eval_loss": 1.2786132097244263,
125
+ "eval_runtime": 47.1262,
126
+ "eval_samples_per_second": 1.485,
127
+ "eval_steps_per_second": 0.382,
128
+ "step": 1400
129
  },
130
  {
131
+ "epoch": 9.0,
132
+ "learning_rate": 1.424e-06,
133
+ "loss": 0.4535,
134
+ "step": 1575
135
  },
136
  {
137
+ "epoch": 9.0,
138
+ "eval_accuracy": 0.6428571343421936,
139
+ "eval_loss": 1.353231430053711,
140
+ "eval_runtime": 47.1844,
141
+ "eval_samples_per_second": 1.484,
142
+ "eval_steps_per_second": 0.381,
143
+ "step": 1575
144
+ },
145
+ {
146
+ "epoch": 10.0,
147
+ "learning_rate": 2.4e-08,
148
+ "loss": 0.4008,
149
+ "step": 1750
150
+ },
151
+ {
152
+ "epoch": 10.0,
153
+ "eval_accuracy": 0.7285714149475098,
154
+ "eval_loss": 1.1368242502212524,
155
+ "eval_runtime": 47.4087,
156
+ "eval_samples_per_second": 1.477,
157
+ "eval_steps_per_second": 0.38,
158
+ "step": 1750
159
+ },
160
+ {
161
+ "epoch": 10.0,
162
+ "step": 1750,
163
+ "total_flos": 3.328882796061573e+18,
164
+ "train_loss": 0.7426296255929129,
165
+ "train_runtime": 13563.0274,
166
+ "train_samples_per_second": 0.516,
167
+ "train_steps_per_second": 0.129
168
  }
169
  ],
170
+ "max_steps": 1750,
171
+ "num_train_epochs": 10,
172
+ "total_flos": 3.328882796061573e+18,
173
  "trial_name": null,
174
  "trial_params": null
175
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:990634455712da4e6301f173f9ebb709ca13e2946d99da7b5ffd9662eec3717f
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cda600d7e556b18aa0b24e2e84fec73d5e94563f380c420560e3b34a61273f9
3
  size 3055