shenben committed on
Commit
796df09
·
verified ·
1 Parent(s): 975b8a7

End of training

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. all_results.json +6 -6
  3. test_results.json +6 -6
  4. trainer_state.json +174 -131
README.md CHANGED
@@ -17,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3127
21
  - Accuracy: 0.8903
22
 
23
  ## Model description
 
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.3143
21
  - Accuracy: 0.8903
22
 
23
  ## Model description
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 11.03,
3
- "eval_accuracy": 0.967741935483871,
4
- "eval_loss": 0.16526122391223907,
5
- "eval_runtime": 12.1682,
6
- "eval_samples_per_second": 12.738,
7
- "eval_steps_per_second": 0.575
8
  }
 
1
  {
2
+ "epoch": 14.05,
3
+ "eval_accuracy": 0.8903225806451613,
4
+ "eval_loss": 0.314290851354599,
5
+ "eval_runtime": 7.0489,
6
+ "eval_samples_per_second": 21.989,
7
+ "eval_steps_per_second": 0.709
8
  }
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 11.03,
3
- "eval_accuracy": 0.967741935483871,
4
- "eval_loss": 0.16526122391223907,
5
- "eval_runtime": 12.1682,
6
- "eval_samples_per_second": 12.738,
7
- "eval_steps_per_second": 0.575
8
  }
 
1
  {
2
+ "epoch": 14.05,
3
+ "eval_accuracy": 0.8903225806451613,
4
+ "eval_loss": 0.314290851354599,
5
+ "eval_runtime": 7.0489,
6
+ "eval_samples_per_second": 21.989,
7
+ "eval_steps_per_second": 0.709
8
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.9571428571428572,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-130",
4
- "epoch": 11.033783783783784,
5
  "eval_steps": 500,
6
  "global_step": 148,
7
  "is_hyper_param_search": false,
@@ -10,229 +10,272 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.07,
 
13
  "learning_rate": 3.3333333333333335e-05,
14
- "loss": 2.3293,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 0.09,
19
- "eval_accuracy": 0.2714285714285714,
20
- "eval_loss": 2.157376527786255,
21
- "eval_runtime": 5.476,
22
- "eval_samples_per_second": 12.783,
23
- "eval_steps_per_second": 0.548,
24
- "step": 13
25
  },
26
  {
27
- "epoch": 1.05,
 
28
  "learning_rate": 4.81203007518797e-05,
29
- "loss": 2.1579,
30
  "step": 20
31
  },
32
  {
33
- "epoch": 1.09,
34
- "eval_accuracy": 0.4714285714285714,
35
- "eval_loss": 1.7585737705230713,
36
- "eval_runtime": 5.8808,
37
- "eval_samples_per_second": 11.903,
38
- "eval_steps_per_second": 0.51,
39
- "step": 26
40
  },
41
  {
42
- "epoch": 2.03,
 
43
  "learning_rate": 4.43609022556391e-05,
44
- "loss": 1.816,
45
  "step": 30
46
  },
47
  {
48
- "epoch": 2.09,
49
- "eval_accuracy": 0.5571428571428572,
50
- "eval_loss": 1.1273804903030396,
51
- "eval_runtime": 5.3271,
52
- "eval_samples_per_second": 13.14,
53
- "eval_steps_per_second": 0.563,
54
- "step": 39
55
  },
56
  {
57
- "epoch": 3.01,
 
58
  "learning_rate": 4.0601503759398494e-05,
59
- "loss": 1.2189,
60
  "step": 40
61
  },
62
  {
63
  "epoch": 3.07,
 
 
 
 
 
 
 
 
 
 
64
  "learning_rate": 3.6842105263157895e-05,
65
- "loss": 0.7528,
66
  "step": 50
67
  },
68
  {
69
- "epoch": 3.09,
70
- "eval_accuracy": 0.7857142857142857,
71
- "eval_loss": 0.7276753187179565,
72
- "eval_runtime": 5.3035,
73
- "eval_samples_per_second": 13.199,
74
- "eval_steps_per_second": 0.566,
75
- "step": 52
76
  },
77
  {
78
- "epoch": 4.05,
 
79
  "learning_rate": 3.3082706766917295e-05,
80
- "loss": 0.4973,
81
  "step": 60
82
  },
83
  {
84
- "epoch": 4.09,
85
  "eval_accuracy": 0.8571428571428571,
86
- "eval_loss": 0.4263572096824646,
87
- "eval_runtime": 5.6644,
88
- "eval_samples_per_second": 12.358,
89
- "eval_steps_per_second": 0.53,
90
- "step": 65
91
  },
92
  {
93
- "epoch": 5.03,
 
94
  "learning_rate": 2.9323308270676693e-05,
95
- "loss": 0.3713,
96
  "step": 70
97
  },
98
  {
99
- "epoch": 5.09,
100
- "eval_accuracy": 0.8571428571428571,
101
- "eval_loss": 0.37758442759513855,
102
- "eval_runtime": 5.2354,
103
- "eval_samples_per_second": 13.371,
104
- "eval_steps_per_second": 0.573,
105
- "step": 78
106
  },
107
  {
108
- "epoch": 6.01,
 
109
  "learning_rate": 2.556390977443609e-05,
110
- "loss": 0.2834,
111
  "step": 80
112
  },
113
  {
114
- "epoch": 6.08,
 
 
 
 
 
 
 
 
 
 
115
  "learning_rate": 2.1804511278195487e-05,
116
- "loss": 0.1453,
117
  "step": 90
118
  },
119
  {
120
- "epoch": 6.09,
121
- "eval_accuracy": 0.9285714285714286,
122
- "eval_loss": 0.25342079997062683,
123
- "eval_runtime": 5.8596,
124
- "eval_samples_per_second": 11.946,
125
- "eval_steps_per_second": 0.512,
126
- "step": 91
127
  },
128
  {
129
- "epoch": 7.06,
 
130
  "learning_rate": 1.8045112781954888e-05,
131
- "loss": 0.1148,
132
  "step": 100
133
  },
134
  {
135
- "epoch": 7.09,
136
- "eval_accuracy": 0.8428571428571429,
137
- "eval_loss": 0.3897377550601959,
138
- "eval_runtime": 5.4916,
139
- "eval_samples_per_second": 12.747,
140
- "eval_steps_per_second": 0.546,
141
- "step": 104
142
  },
143
  {
144
- "epoch": 8.04,
 
145
  "learning_rate": 1.4285714285714285e-05,
146
- "loss": 0.0763,
147
  "step": 110
148
  },
149
  {
150
- "epoch": 8.09,
151
- "eval_accuracy": 0.9428571428571428,
152
- "eval_loss": 0.2183365374803543,
153
- "eval_runtime": 5.214,
154
- "eval_samples_per_second": 13.425,
155
- "eval_steps_per_second": 0.575,
156
- "step": 117
157
  },
158
  {
159
- "epoch": 9.02,
 
160
  "learning_rate": 1.0526315789473684e-05,
161
- "loss": 0.0744,
 
 
 
 
 
 
 
 
 
162
  "step": 120
163
  },
164
  {
165
- "epoch": 9.09,
 
166
  "learning_rate": 6.766917293233083e-06,
167
- "loss": 0.0521,
168
  "step": 130
169
  },
170
  {
171
- "epoch": 9.09,
172
- "eval_accuracy": 0.9571428571428572,
173
- "eval_loss": 0.14351557195186615,
174
- "eval_runtime": 5.6806,
175
- "eval_samples_per_second": 12.323,
176
- "eval_steps_per_second": 0.528,
177
  "step": 130
178
  },
179
  {
180
- "epoch": 10.07,
 
181
  "learning_rate": 3.007518796992481e-06,
182
- "loss": 0.0323,
183
  "step": 140
184
  },
185
  {
186
- "epoch": 10.09,
187
- "eval_accuracy": 0.9285714285714286,
188
- "eval_loss": 0.2716424763202667,
189
- "eval_runtime": 5.6339,
190
- "eval_samples_per_second": 12.425,
191
- "eval_steps_per_second": 0.532,
192
- "step": 143
193
  },
194
  {
195
- "epoch": 11.03,
196
- "eval_accuracy": 0.9285714285714286,
197
- "eval_loss": 0.26677000522613525,
198
- "eval_runtime": 5.0922,
199
- "eval_samples_per_second": 13.747,
200
- "eval_steps_per_second": 0.589,
201
  "step": 148
202
  },
203
  {
204
- "epoch": 11.03,
205
  "step": 148,
206
- "total_flos": 4.2618449361567744e+18,
207
- "train_loss": 0.6719480277718725,
208
- "train_runtime": 453.1919,
209
- "train_samples_per_second": 7.838,
210
- "train_steps_per_second": 0.327
211
- },
212
- {
213
- "epoch": 11.03,
214
- "eval_accuracy": 0.967741935483871,
215
- "eval_loss": 0.16224287450313568,
216
- "eval_runtime": 11.3629,
217
- "eval_samples_per_second": 13.641,
218
- "eval_steps_per_second": 0.616,
219
  "step": 148
220
  },
221
  {
222
- "epoch": 11.03,
223
- "eval_accuracy": 0.967741935483871,
224
- "eval_loss": 0.16526122391223907,
225
- "eval_runtime": 12.1682,
226
- "eval_samples_per_second": 12.738,
227
- "eval_steps_per_second": 0.575,
228
  "step": 148
229
  }
230
  ],
231
  "logging_steps": 10,
232
  "max_steps": 148,
 
233
  "num_train_epochs": 9223372036854775807,
234
  "save_steps": 500,
235
- "total_flos": 4.2618449361567744e+18,
 
236
  "trial_name": null,
237
  "trial_params": null
238
  }
 
1
  {
2
+ "best_metric": 0.9428571428571428,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-140",
4
+ "epoch": 14.054054054054054,
5
  "eval_steps": 500,
6
  "global_step": 148,
7
  "is_hyper_param_search": false,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.07,
13
+ "grad_norm": 9.659797668457031,
14
  "learning_rate": 3.3333333333333335e-05,
15
+ "loss": 2.3172,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.07,
20
+ "eval_accuracy": 0.08571428571428572,
21
+ "eval_loss": 2.2181172370910645,
22
+ "eval_runtime": 3.9506,
23
+ "eval_samples_per_second": 17.719,
24
+ "eval_steps_per_second": 0.759,
25
+ "step": 10
26
  },
27
  {
28
+ "epoch": 1.07,
29
+ "grad_norm": 6.882665157318115,
30
  "learning_rate": 4.81203007518797e-05,
31
+ "loss": 2.1343,
32
  "step": 20
33
  },
34
  {
35
+ "epoch": 1.07,
36
+ "eval_accuracy": 0.37142857142857144,
37
+ "eval_loss": 1.9744230508804321,
38
+ "eval_runtime": 3.5795,
39
+ "eval_samples_per_second": 19.556,
40
+ "eval_steps_per_second": 0.838,
41
+ "step": 20
42
  },
43
  {
44
+ "epoch": 2.07,
45
+ "grad_norm": 8.149250030517578,
46
  "learning_rate": 4.43609022556391e-05,
47
+ "loss": 1.6727,
48
  "step": 30
49
  },
50
  {
51
+ "epoch": 2.07,
52
+ "eval_accuracy": 0.5142857142857142,
53
+ "eval_loss": 1.4526900053024292,
54
+ "eval_runtime": 3.1928,
55
+ "eval_samples_per_second": 21.925,
56
+ "eval_steps_per_second": 0.94,
57
+ "step": 30
58
  },
59
  {
60
+ "epoch": 3.07,
61
+ "grad_norm": 6.3829803466796875,
62
  "learning_rate": 4.0601503759398494e-05,
63
+ "loss": 0.9704,
64
  "step": 40
65
  },
66
  {
67
  "epoch": 3.07,
68
+ "eval_accuracy": 0.8142857142857143,
69
+ "eval_loss": 0.846143364906311,
70
+ "eval_runtime": 4.1102,
71
+ "eval_samples_per_second": 17.031,
72
+ "eval_steps_per_second": 0.73,
73
+ "step": 40
74
+ },
75
+ {
76
+ "epoch": 4.07,
77
+ "grad_norm": 6.794018268585205,
78
  "learning_rate": 3.6842105263157895e-05,
79
+ "loss": 0.5427,
80
  "step": 50
81
  },
82
  {
83
+ "epoch": 4.07,
84
+ "eval_accuracy": 0.8142857142857143,
85
+ "eval_loss": 0.5360450744628906,
86
+ "eval_runtime": 3.2207,
87
+ "eval_samples_per_second": 21.734,
88
+ "eval_steps_per_second": 0.931,
89
+ "step": 50
90
  },
91
  {
92
+ "epoch": 5.07,
93
+ "grad_norm": 6.470229625701904,
94
  "learning_rate": 3.3082706766917295e-05,
95
+ "loss": 0.3584,
96
  "step": 60
97
  },
98
  {
99
+ "epoch": 5.07,
100
  "eval_accuracy": 0.8571428571428571,
101
+ "eval_loss": 0.472709983587265,
102
+ "eval_runtime": 3.1462,
103
+ "eval_samples_per_second": 22.249,
104
+ "eval_steps_per_second": 0.954,
105
+ "step": 60
106
  },
107
  {
108
+ "epoch": 6.07,
109
+ "grad_norm": 10.196860313415527,
110
  "learning_rate": 2.9323308270676693e-05,
111
+ "loss": 0.2445,
112
  "step": 70
113
  },
114
  {
115
+ "epoch": 6.07,
116
+ "eval_accuracy": 0.9,
117
+ "eval_loss": 0.34089064598083496,
118
+ "eval_runtime": 3.5346,
119
+ "eval_samples_per_second": 19.804,
120
+ "eval_steps_per_second": 0.849,
121
+ "step": 70
122
  },
123
  {
124
+ "epoch": 7.07,
125
+ "grad_norm": 1.1203614473342896,
126
  "learning_rate": 2.556390977443609e-05,
127
+ "loss": 0.1351,
128
  "step": 80
129
  },
130
  {
131
+ "epoch": 7.07,
132
+ "eval_accuracy": 0.8428571428571429,
133
+ "eval_loss": 0.3564361035823822,
134
+ "eval_runtime": 3.1969,
135
+ "eval_samples_per_second": 21.896,
136
+ "eval_steps_per_second": 0.938,
137
+ "step": 80
138
+ },
139
+ {
140
+ "epoch": 8.07,
141
+ "grad_norm": 1.755305528640747,
142
  "learning_rate": 2.1804511278195487e-05,
143
+ "loss": 0.1238,
144
  "step": 90
145
  },
146
  {
147
+ "epoch": 8.07,
148
+ "eval_accuracy": 0.8714285714285714,
149
+ "eval_loss": 0.37149137258529663,
150
+ "eval_runtime": 3.4534,
151
+ "eval_samples_per_second": 20.27,
152
+ "eval_steps_per_second": 0.869,
153
+ "step": 90
154
  },
155
  {
156
+ "epoch": 9.07,
157
+ "grad_norm": 13.847707748413086,
158
  "learning_rate": 1.8045112781954888e-05,
159
+ "loss": 0.1064,
160
  "step": 100
161
  },
162
  {
163
+ "epoch": 9.07,
164
+ "eval_accuracy": 0.8714285714285714,
165
+ "eval_loss": 0.3149915933609009,
166
+ "eval_runtime": 3.5769,
167
+ "eval_samples_per_second": 19.57,
168
+ "eval_steps_per_second": 0.839,
169
+ "step": 100
170
  },
171
  {
172
+ "epoch": 10.07,
173
+ "grad_norm": 8.086627006530762,
174
  "learning_rate": 1.4285714285714285e-05,
175
+ "loss": 0.0839,
176
  "step": 110
177
  },
178
  {
179
+ "epoch": 10.07,
180
+ "eval_accuracy": 0.8,
181
+ "eval_loss": 0.4098597466945648,
182
+ "eval_runtime": 3.3642,
183
+ "eval_samples_per_second": 20.807,
184
+ "eval_steps_per_second": 0.892,
185
+ "step": 110
186
  },
187
  {
188
+ "epoch": 11.07,
189
+ "grad_norm": 5.879390239715576,
190
  "learning_rate": 1.0526315789473684e-05,
191
+ "loss": 0.0575,
192
+ "step": 120
193
+ },
194
+ {
195
+ "epoch": 11.07,
196
+ "eval_accuracy": 0.9,
197
+ "eval_loss": 0.3028772175312042,
198
+ "eval_runtime": 3.2332,
199
+ "eval_samples_per_second": 21.65,
200
+ "eval_steps_per_second": 0.928,
201
  "step": 120
202
  },
203
  {
204
+ "epoch": 12.07,
205
+ "grad_norm": 0.21815051138401031,
206
  "learning_rate": 6.766917293233083e-06,
207
+ "loss": 0.0329,
208
  "step": 130
209
  },
210
  {
211
+ "epoch": 12.07,
212
+ "eval_accuracy": 0.9285714285714286,
213
+ "eval_loss": 0.18007342517375946,
214
+ "eval_runtime": 3.1358,
215
+ "eval_samples_per_second": 22.323,
216
+ "eval_steps_per_second": 0.957,
217
  "step": 130
218
  },
219
  {
220
+ "epoch": 13.07,
221
+ "grad_norm": 0.26752281188964844,
222
  "learning_rate": 3.007518796992481e-06,
223
+ "loss": 0.0348,
224
  "step": 140
225
  },
226
  {
227
+ "epoch": 13.07,
228
+ "eval_accuracy": 0.9428571428571428,
229
+ "eval_loss": 0.18338440358638763,
230
+ "eval_runtime": 3.1018,
231
+ "eval_samples_per_second": 22.567,
232
+ "eval_steps_per_second": 0.967,
233
+ "step": 140
234
  },
235
  {
236
+ "epoch": 14.05,
237
+ "eval_accuracy": 0.9142857142857143,
238
+ "eval_loss": 0.21323394775390625,
239
+ "eval_runtime": 3.5887,
240
+ "eval_samples_per_second": 19.506,
241
+ "eval_steps_per_second": 0.836,
242
  "step": 148
243
  },
244
  {
245
+ "epoch": 14.05,
246
  "step": 148,
247
+ "total_flos": 5.55285995190485e+18,
248
+ "train_loss": 0.5970903383316221,
249
+ "train_runtime": 357.9623,
250
+ "train_samples_per_second": 13.23,
251
+ "train_steps_per_second": 0.413
252
+ },
253
+ {
254
+ "epoch": 14.05,
255
+ "eval_accuracy": 0.8903225806451613,
256
+ "eval_loss": 0.31274959444999695,
257
+ "eval_runtime": 6.8864,
258
+ "eval_samples_per_second": 22.508,
259
+ "eval_steps_per_second": 0.726,
260
  "step": 148
261
  },
262
  {
263
+ "epoch": 14.05,
264
+ "eval_accuracy": 0.8903225806451613,
265
+ "eval_loss": 0.314290851354599,
266
+ "eval_runtime": 7.0489,
267
+ "eval_samples_per_second": 21.989,
268
+ "eval_steps_per_second": 0.709,
269
  "step": 148
270
  }
271
  ],
272
  "logging_steps": 10,
273
  "max_steps": 148,
274
+ "num_input_tokens_seen": 0,
275
  "num_train_epochs": 9223372036854775807,
276
  "save_steps": 500,
277
+ "total_flos": 5.55285995190485e+18,
278
+ "train_batch_size": 32,
279
  "trial_name": null,
280
  "trial_params": null
281
  }