hafidber committed on
Commit
cd48e2a
1 Parent(s): ce79fe9

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +6 -6
  2. test_results.json +6 -6
  3. trainer_state.json +76 -373
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.25,
3
- "eval_accuracy": 0.8838709677419355,
4
- "eval_loss": 0.39101719856262207,
5
- "eval_runtime": 43.5539,
6
- "eval_samples_per_second": 3.559,
7
- "eval_steps_per_second": 1.791
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.5290322580645161,
4
+ "eval_loss": 1.4294496774673462,
5
+ "eval_runtime": 45.3757,
6
+ "eval_samples_per_second": 3.416,
7
+ "eval_steps_per_second": 1.719
8
  }
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.25,
3
- "eval_accuracy": 0.8838709677419355,
4
- "eval_loss": 0.39101719856262207,
5
- "eval_runtime": 43.5539,
6
- "eval_samples_per_second": 3.559,
7
- "eval_steps_per_second": 1.791
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.5290322580645161,
4
+ "eval_loss": 1.4294496774673462,
5
+ "eval_runtime": 45.3757,
6
+ "eval_samples_per_second": 3.416,
7
+ "eval_steps_per_second": 1.719
8
  }
trainer_state.json CHANGED
@@ -1,442 +1,145 @@
1
  {
2
- "best_metric": 0.9857142857142858,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-600",
4
- "epoch": 3.25,
5
  "eval_steps": 500,
6
- "global_step": 600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.02,
13
- "learning_rate": 8.333333333333334e-06,
14
- "loss": 2.3171,
15
- "step": 10
16
- },
17
- {
18
- "epoch": 0.03,
19
- "learning_rate": 1.6666666666666667e-05,
20
- "loss": 2.252,
21
- "step": 20
22
- },
23
- {
24
- "epoch": 0.05,
25
- "learning_rate": 2.5e-05,
26
- "loss": 2.1918,
27
- "step": 30
28
- },
29
  {
30
  "epoch": 0.07,
31
  "learning_rate": 3.3333333333333335e-05,
32
- "loss": 2.2038,
33
- "step": 40
34
- },
35
- {
36
- "epoch": 0.08,
37
- "learning_rate": 4.166666666666667e-05,
38
- "loss": 2.1914,
39
- "step": 50
40
- },
41
- {
42
- "epoch": 0.1,
43
- "learning_rate": 5e-05,
44
- "loss": 2.2023,
45
- "step": 60
46
- },
47
- {
48
- "epoch": 0.12,
49
- "learning_rate": 4.9074074074074075e-05,
50
- "loss": 2.206,
51
- "step": 70
52
  },
53
  {
54
  "epoch": 0.13,
55
  "learning_rate": 4.814814814814815e-05,
56
- "loss": 1.8991,
57
- "step": 80
58
- },
59
- {
60
- "epoch": 0.15,
61
- "learning_rate": 4.722222222222222e-05,
62
- "loss": 2.0264,
63
- "step": 90
64
- },
65
- {
66
- "epoch": 0.17,
67
- "learning_rate": 4.62962962962963e-05,
68
- "loss": 1.8314,
69
- "step": 100
70
- },
71
- {
72
- "epoch": 0.18,
73
- "learning_rate": 4.5370370370370374e-05,
74
- "loss": 1.7088,
75
- "step": 110
76
  },
77
  {
78
  "epoch": 0.2,
79
  "learning_rate": 4.4444444444444447e-05,
80
- "loss": 1.6541,
81
- "step": 120
82
- },
83
- {
84
- "epoch": 0.22,
85
- "learning_rate": 4.351851851851852e-05,
86
- "loss": 1.6237,
87
- "step": 130
88
- },
89
- {
90
- "epoch": 0.23,
91
- "learning_rate": 4.259259259259259e-05,
92
- "loss": 1.3924,
93
- "step": 140
94
- },
95
- {
96
- "epoch": 0.25,
97
- "learning_rate": 4.166666666666667e-05,
98
- "loss": 1.2544,
99
- "step": 150
100
- },
101
- {
102
- "epoch": 0.25,
103
- "eval_accuracy": 0.44285714285714284,
104
- "eval_loss": 1.370309829711914,
105
- "eval_runtime": 19.2054,
106
- "eval_samples_per_second": 3.645,
107
- "eval_steps_per_second": 1.822,
108
- "step": 150
109
  },
110
  {
111
- "epoch": 1.02,
112
  "learning_rate": 4.074074074074074e-05,
113
- "loss": 1.1833,
114
- "step": 160
115
- },
116
- {
117
- "epoch": 1.03,
118
- "learning_rate": 3.981481481481482e-05,
119
- "loss": 1.1287,
120
- "step": 170
121
- },
122
- {
123
- "epoch": 1.05,
124
- "learning_rate": 3.888888888888889e-05,
125
- "loss": 0.9832,
126
- "step": 180
127
- },
128
- {
129
- "epoch": 1.07,
130
- "learning_rate": 3.7962962962962964e-05,
131
- "loss": 0.9388,
132
- "step": 190
133
  },
134
  {
135
- "epoch": 1.08,
136
  "learning_rate": 3.7037037037037037e-05,
137
- "loss": 1.2162,
138
- "step": 200
139
- },
140
- {
141
- "epoch": 1.1,
142
- "learning_rate": 3.611111111111111e-05,
143
- "loss": 0.826,
144
- "step": 210
145
- },
146
- {
147
- "epoch": 1.12,
148
- "learning_rate": 3.518518518518519e-05,
149
- "loss": 0.9838,
150
- "step": 220
151
- },
152
- {
153
- "epoch": 1.13,
154
- "learning_rate": 3.425925925925926e-05,
155
- "loss": 0.8888,
156
- "step": 230
157
  },
158
  {
159
- "epoch": 1.15,
160
  "learning_rate": 3.3333333333333335e-05,
161
- "loss": 0.6393,
162
- "step": 240
163
- },
164
- {
165
- "epoch": 1.17,
166
- "learning_rate": 3.240740740740741e-05,
167
- "loss": 0.5864,
168
- "step": 250
169
- },
170
- {
171
- "epoch": 1.18,
172
- "learning_rate": 3.148148148148148e-05,
173
- "loss": 0.5376,
174
- "step": 260
175
- },
176
- {
177
- "epoch": 1.2,
178
- "learning_rate": 3.055555555555556e-05,
179
- "loss": 0.8571,
180
- "step": 270
181
  },
182
  {
183
- "epoch": 1.22,
184
  "learning_rate": 2.962962962962963e-05,
185
- "loss": 0.3683,
186
- "step": 280
187
- },
188
- {
189
- "epoch": 1.23,
190
- "learning_rate": 2.8703703703703706e-05,
191
- "loss": 1.1622,
192
- "step": 290
193
- },
194
- {
195
- "epoch": 1.25,
196
- "learning_rate": 2.777777777777778e-05,
197
- "loss": 1.0825,
198
- "step": 300
199
- },
200
- {
201
- "epoch": 1.25,
202
- "eval_accuracy": 0.7428571428571429,
203
- "eval_loss": 0.6761045455932617,
204
- "eval_runtime": 19.331,
205
- "eval_samples_per_second": 3.621,
206
- "eval_steps_per_second": 1.811,
207
- "step": 300
208
- },
209
- {
210
- "epoch": 2.02,
211
- "learning_rate": 2.6851851851851855e-05,
212
- "loss": 0.478,
213
- "step": 310
214
  },
215
  {
216
- "epoch": 2.03,
217
  "learning_rate": 2.5925925925925925e-05,
218
- "loss": 0.2416,
219
- "step": 320
220
- },
221
- {
222
- "epoch": 2.05,
223
- "learning_rate": 2.5e-05,
224
- "loss": 0.333,
225
- "step": 330
226
- },
227
- {
228
- "epoch": 2.07,
229
- "learning_rate": 2.4074074074074074e-05,
230
- "loss": 0.2037,
231
- "step": 340
232
- },
233
- {
234
- "epoch": 2.08,
235
- "learning_rate": 2.314814814814815e-05,
236
- "loss": 0.34,
237
- "step": 350
238
  },
239
  {
240
- "epoch": 2.1,
241
  "learning_rate": 2.2222222222222223e-05,
242
- "loss": 0.669,
243
- "step": 360
244
- },
245
- {
246
- "epoch": 2.12,
247
- "learning_rate": 2.1296296296296296e-05,
248
- "loss": 0.3737,
249
- "step": 370
250
- },
251
- {
252
- "epoch": 2.13,
253
- "learning_rate": 2.037037037037037e-05,
254
- "loss": 0.1322,
255
- "step": 380
256
- },
257
- {
258
- "epoch": 2.15,
259
- "learning_rate": 1.9444444444444445e-05,
260
- "loss": 0.2662,
261
- "step": 390
262
  },
263
  {
264
- "epoch": 2.17,
265
  "learning_rate": 1.8518518518518518e-05,
266
- "loss": 0.318,
267
- "step": 400
268
- },
269
- {
270
- "epoch": 2.18,
271
- "learning_rate": 1.7592592592592595e-05,
272
- "loss": 0.1596,
273
- "step": 410
274
- },
275
- {
276
- "epoch": 2.2,
277
- "learning_rate": 1.6666666666666667e-05,
278
- "loss": 0.0874,
279
- "step": 420
280
- },
281
- {
282
- "epoch": 2.22,
283
- "learning_rate": 1.574074074074074e-05,
284
- "loss": 0.2727,
285
- "step": 430
286
  },
287
  {
288
- "epoch": 2.23,
289
  "learning_rate": 1.4814814814814815e-05,
290
- "loss": 0.0459,
291
- "step": 440
292
- },
293
- {
294
- "epoch": 2.25,
295
- "learning_rate": 1.388888888888889e-05,
296
- "loss": 0.2885,
297
- "step": 450
298
- },
299
- {
300
- "epoch": 2.25,
301
- "eval_accuracy": 0.8285714285714286,
302
- "eval_loss": 0.6104217767715454,
303
- "eval_runtime": 20.1055,
304
- "eval_samples_per_second": 3.482,
305
- "eval_steps_per_second": 1.741,
306
- "step": 450
307
- },
308
- {
309
- "epoch": 3.02,
310
- "learning_rate": 1.2962962962962962e-05,
311
- "loss": 0.2173,
312
- "step": 460
313
- },
314
- {
315
- "epoch": 3.03,
316
- "learning_rate": 1.2037037037037037e-05,
317
- "loss": 0.1313,
318
- "step": 470
319
  },
320
  {
321
- "epoch": 3.05,
322
  "learning_rate": 1.1111111111111112e-05,
323
- "loss": 0.0252,
324
- "step": 480
325
- },
326
- {
327
- "epoch": 3.07,
328
- "learning_rate": 1.0185185185185185e-05,
329
- "loss": 0.035,
330
- "step": 490
331
- },
332
- {
333
- "epoch": 3.08,
334
- "learning_rate": 9.259259259259259e-06,
335
- "loss": 0.025,
336
- "step": 500
337
- },
338
- {
339
- "epoch": 3.1,
340
- "learning_rate": 8.333333333333334e-06,
341
- "loss": 0.1221,
342
- "step": 510
343
  },
344
  {
345
- "epoch": 3.12,
346
  "learning_rate": 7.4074074074074075e-06,
347
- "loss": 0.1264,
348
- "step": 520
349
- },
350
- {
351
- "epoch": 3.13,
352
- "learning_rate": 6.481481481481481e-06,
353
- "loss": 0.036,
354
- "step": 530
355
- },
356
- {
357
- "epoch": 3.15,
358
- "learning_rate": 5.555555555555556e-06,
359
- "loss": 0.0544,
360
- "step": 540
361
- },
362
- {
363
- "epoch": 3.17,
364
- "learning_rate": 4.6296296296296296e-06,
365
- "loss": 0.2549,
366
- "step": 550
367
  },
368
  {
369
- "epoch": 3.18,
370
  "learning_rate": 3.7037037037037037e-06,
371
- "loss": 0.2963,
372
- "step": 560
373
- },
374
- {
375
- "epoch": 3.2,
376
- "learning_rate": 2.777777777777778e-06,
377
- "loss": 0.1269,
378
- "step": 570
379
- },
380
- {
381
- "epoch": 3.22,
382
- "learning_rate": 1.8518518518518519e-06,
383
- "loss": 0.1344,
384
- "step": 580
385
- },
386
- {
387
- "epoch": 3.23,
388
- "learning_rate": 9.259259259259259e-07,
389
- "loss": 0.4507,
390
- "step": 590
391
  },
392
  {
393
- "epoch": 3.25,
394
  "learning_rate": 0.0,
395
- "loss": 0.262,
396
- "step": 600
397
  },
398
  {
399
- "epoch": 3.25,
400
- "eval_accuracy": 0.9857142857142858,
401
- "eval_loss": 0.093513622879982,
402
- "eval_runtime": 20.2313,
403
- "eval_samples_per_second": 3.46,
404
- "eval_steps_per_second": 1.73,
405
- "step": 600
406
  },
407
  {
408
- "epoch": 3.25,
409
- "step": 600,
410
- "total_flos": 1.495384188125184e+18,
411
- "train_loss": 0.8140682246039311,
412
- "train_runtime": 787.3727,
413
- "train_samples_per_second": 1.524,
414
- "train_steps_per_second": 0.762
415
  },
416
  {
417
- "epoch": 3.25,
418
- "eval_accuracy": 0.8838709677419355,
419
- "eval_loss": 0.39101719856262207,
420
- "eval_runtime": 43.7237,
421
- "eval_samples_per_second": 3.545,
422
- "eval_steps_per_second": 1.784,
423
- "step": 600
424
  },
425
  {
426
- "epoch": 3.25,
427
- "eval_accuracy": 0.8838709677419355,
428
- "eval_loss": 0.39101719856262207,
429
- "eval_runtime": 43.5539,
430
- "eval_samples_per_second": 3.559,
431
- "eval_steps_per_second": 1.791,
432
- "step": 600
433
  }
434
  ],
435
  "logging_steps": 10,
436
- "max_steps": 600,
437
  "num_train_epochs": 9223372036854775807,
438
  "save_steps": 500,
439
- "total_flos": 1.495384188125184e+18,
440
  "trial_name": null,
441
  "trial_params": null
442
  }
 
1
  {
2
+ "best_metric": 0.6285714285714286,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-150",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 0.07,
13
  "learning_rate": 3.3333333333333335e-05,
14
+ "loss": 2.3672,
15
+ "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  },
17
  {
18
  "epoch": 0.13,
19
  "learning_rate": 4.814814814814815e-05,
20
+ "loss": 2.5654,
21
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  },
23
  {
24
  "epoch": 0.2,
25
  "learning_rate": 4.4444444444444447e-05,
26
+ "loss": 2.3019,
27
+ "step": 30
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  },
29
  {
30
+ "epoch": 0.27,
31
  "learning_rate": 4.074074074074074e-05,
32
+ "loss": 2.1634,
33
+ "step": 40
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  },
35
  {
36
+ "epoch": 0.33,
37
  "learning_rate": 3.7037037037037037e-05,
38
+ "loss": 1.9889,
39
+ "step": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  },
41
  {
42
+ "epoch": 0.4,
43
  "learning_rate": 3.3333333333333335e-05,
44
+ "loss": 2.0758,
45
+ "step": 60
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  },
47
  {
48
+ "epoch": 0.47,
49
  "learning_rate": 2.962962962962963e-05,
50
+ "loss": 2.0439,
51
+ "step": 70
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  },
53
  {
54
+ "epoch": 0.53,
55
  "learning_rate": 2.5925925925925925e-05,
56
+ "loss": 1.6312,
57
+ "step": 80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
58
  },
59
  {
60
+ "epoch": 0.6,
61
  "learning_rate": 2.2222222222222223e-05,
62
+ "loss": 1.905,
63
+ "step": 90
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  },
65
  {
66
+ "epoch": 0.67,
67
  "learning_rate": 1.8518518518518518e-05,
68
+ "loss": 1.6742,
69
+ "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  },
71
  {
72
+ "epoch": 0.73,
73
  "learning_rate": 1.4814814814814815e-05,
74
+ "loss": 1.6093,
75
+ "step": 110
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
76
  },
77
  {
78
+ "epoch": 0.8,
79
  "learning_rate": 1.1111111111111112e-05,
80
+ "loss": 1.5733,
81
+ "step": 120
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
82
  },
83
  {
84
+ "epoch": 0.87,
85
  "learning_rate": 7.4074074074074075e-06,
86
+ "loss": 1.6627,
87
+ "step": 130
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
  },
89
  {
90
+ "epoch": 0.93,
91
  "learning_rate": 3.7037037037037037e-06,
92
+ "loss": 1.6796,
93
+ "step": 140
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  },
95
  {
96
+ "epoch": 1.0,
97
  "learning_rate": 0.0,
98
+ "loss": 1.3265,
99
+ "step": 150
100
  },
101
  {
102
+ "epoch": 1.0,
103
+ "eval_accuracy": 0.6285714285714286,
104
+ "eval_loss": 1.2609246969223022,
105
+ "eval_runtime": 20.5848,
106
+ "eval_samples_per_second": 3.401,
107
+ "eval_steps_per_second": 1.7,
108
+ "step": 150
109
  },
110
  {
111
+ "epoch": 1.0,
112
+ "step": 150,
113
+ "total_flos": 3.73846047031296e+17,
114
+ "train_loss": 1.9045542653401693,
115
+ "train_runtime": 220.7068,
116
+ "train_samples_per_second": 1.359,
117
+ "train_steps_per_second": 0.68
118
  },
119
  {
120
+ "epoch": 1.0,
121
+ "eval_accuracy": 0.5290322580645161,
122
+ "eval_loss": 1.429449439048767,
123
+ "eval_runtime": 43.1887,
124
+ "eval_samples_per_second": 3.589,
125
+ "eval_steps_per_second": 1.806,
126
+ "step": 150
127
  },
128
  {
129
+ "epoch": 1.0,
130
+ "eval_accuracy": 0.5290322580645161,
131
+ "eval_loss": 1.4294496774673462,
132
+ "eval_runtime": 45.3757,
133
+ "eval_samples_per_second": 3.416,
134
+ "eval_steps_per_second": 1.719,
135
+ "step": 150
136
  }
137
  ],
138
  "logging_steps": 10,
139
+ "max_steps": 150,
140
  "num_train_epochs": 9223372036854775807,
141
  "save_steps": 500,
142
+ "total_flos": 3.73846047031296e+17,
143
  "trial_name": null,
144
  "trial_params": null
145
  }