Nikeytas committed on
Commit
7874883
1 Parent(s): ab92069

End of training

Browse files
Files changed (4) hide show
  1. README.md +2 -2
  2. all_results.json +6 -6
  3. test_results.json +6 -6
  4. trainer_state.json +92 -73
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.4451
21
- - Accuracy: 0.8452
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.4454
21
+ - Accuracy: 0.8462
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.23,
3
- "eval_accuracy": 0.8580645161290322,
4
- "eval_loss": 0.5035644769668579,
5
- "eval_runtime": 299.9496,
6
- "eval_samples_per_second": 0.517,
7
- "eval_steps_per_second": 0.067
8
  }
 
1
  {
2
+ "epoch": 3.22972972972973,
3
+ "eval_accuracy": 0.8461538461538461,
4
+ "eval_loss": 0.44542694091796875,
5
+ "eval_runtime": 488.3429,
6
+ "eval_samples_per_second": 0.319,
7
+ "eval_steps_per_second": 0.041
8
  }
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.23,
3
- "eval_accuracy": 0.8580645161290322,
4
- "eval_loss": 0.5035644769668579,
5
- "eval_runtime": 299.9496,
6
- "eval_samples_per_second": 0.517,
7
- "eval_steps_per_second": 0.067
8
  }
 
1
  {
2
+ "epoch": 3.22972972972973,
3
+ "eval_accuracy": 0.8461538461538461,
4
+ "eval_loss": 0.44542694091796875,
5
+ "eval_runtime": 488.3429,
6
+ "eval_samples_per_second": 0.319,
7
+ "eval_steps_per_second": 0.041
8
  }
trainer_state.json CHANGED
@@ -1,163 +1,182 @@
1
  {
2
- "best_metric": 0.9,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-148",
4
  "epoch": 3.22972972972973,
 
5
  "global_step": 148,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.07,
 
12
  "learning_rate": 3.3333333333333335e-05,
13
- "loss": 2.3721,
14
  "step": 10
15
  },
16
  {
17
- "epoch": 0.14,
 
18
  "learning_rate": 4.81203007518797e-05,
19
- "loss": 2.2408,
20
  "step": 20
21
  },
22
  {
23
- "epoch": 0.2,
 
24
  "learning_rate": 4.43609022556391e-05,
25
- "loss": 2.0323,
26
  "step": 30
27
  },
28
  {
29
- "epoch": 0.26,
30
- "eval_accuracy": 0.5571428571428572,
31
- "eval_loss": 1.6401814222335815,
32
- "eval_runtime": 132.7593,
33
- "eval_samples_per_second": 0.527,
34
- "eval_steps_per_second": 0.068,
35
  "step": 38
36
  },
37
  {
38
- "epoch": 1.01,
 
39
  "learning_rate": 4.0601503759398494e-05,
40
- "loss": 1.873,
41
  "step": 40
42
  },
43
  {
44
- "epoch": 1.08,
 
45
  "learning_rate": 3.6842105263157895e-05,
46
- "loss": 1.4581,
47
  "step": 50
48
  },
49
  {
50
- "epoch": 1.15,
 
51
  "learning_rate": 3.3082706766917295e-05,
52
- "loss": 1.1944,
53
  "step": 60
54
  },
55
  {
56
- "epoch": 1.22,
 
57
  "learning_rate": 2.9323308270676693e-05,
58
- "loss": 0.8081,
59
  "step": 70
60
  },
61
  {
62
- "epoch": 1.26,
63
- "eval_accuracy": 0.6857142857142857,
64
- "eval_loss": 0.8534234762191772,
65
- "eval_runtime": 133.5733,
66
- "eval_samples_per_second": 0.524,
67
- "eval_steps_per_second": 0.067,
68
  "step": 76
69
  },
70
  {
71
- "epoch": 2.03,
 
72
  "learning_rate": 2.556390977443609e-05,
73
- "loss": 0.7699,
74
  "step": 80
75
  },
76
  {
77
- "epoch": 2.09,
 
78
  "learning_rate": 2.1804511278195487e-05,
79
- "loss": 0.5961,
80
  "step": 90
81
  },
82
  {
83
- "epoch": 2.16,
 
84
  "learning_rate": 1.8045112781954888e-05,
85
- "loss": 0.5411,
86
  "step": 100
87
  },
88
  {
89
- "epoch": 2.23,
 
90
  "learning_rate": 1.4285714285714285e-05,
91
- "loss": 0.4099,
92
  "step": 110
93
  },
94
  {
95
- "epoch": 2.26,
96
- "eval_accuracy": 0.8428571428571429,
97
- "eval_loss": 0.5761450529098511,
98
- "eval_runtime": 131.9517,
99
- "eval_samples_per_second": 0.53,
100
- "eval_steps_per_second": 0.068,
101
  "step": 114
102
  },
103
  {
104
- "epoch": 3.04,
 
105
  "learning_rate": 1.0526315789473684e-05,
106
- "loss": 0.3393,
107
  "step": 120
108
  },
109
  {
110
- "epoch": 3.11,
 
111
  "learning_rate": 6.766917293233083e-06,
112
- "loss": 0.2812,
113
  "step": 130
114
  },
115
  {
116
- "epoch": 3.18,
 
117
  "learning_rate": 3.007518796992481e-06,
118
- "loss": 0.255,
119
  "step": 140
120
  },
121
  {
122
- "epoch": 3.23,
123
- "eval_accuracy": 0.9,
124
- "eval_loss": 0.39665931463241577,
125
- "eval_runtime": 127.4255,
126
- "eval_samples_per_second": 0.549,
127
- "eval_steps_per_second": 0.071,
128
  "step": 148
129
  },
130
  {
131
- "epoch": 3.23,
132
  "step": 148,
133
  "total_flos": 1.460491890402263e+18,
134
- "train_loss": 1.0397279697495538,
135
- "train_runtime": 7461.1258,
136
- "train_samples_per_second": 0.159,
137
- "train_steps_per_second": 0.02
138
- },
139
- {
140
- "epoch": 3.23,
141
- "eval_accuracy": 0.8580645161290322,
142
- "eval_loss": 0.5035645365715027,
143
- "eval_runtime": 298.4366,
144
- "eval_samples_per_second": 0.519,
145
- "eval_steps_per_second": 0.067,
146
  "step": 148
147
  },
148
  {
149
- "epoch": 3.23,
150
- "eval_accuracy": 0.8580645161290322,
151
- "eval_loss": 0.5035644769668579,
152
- "eval_runtime": 299.9496,
153
- "eval_samples_per_second": 0.517,
154
- "eval_steps_per_second": 0.067,
155
  "step": 148
156
  }
157
  ],
 
158
  "max_steps": 148,
 
159
  "num_train_epochs": 9223372036854775807,
 
160
  "total_flos": 1.460491890402263e+18,
 
161
  "trial_name": null,
162
  "trial_params": null
163
  }
 
1
  {
2
+ "best_metric": 0.8428571428571429,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset\\checkpoint-148",
4
  "epoch": 3.22972972972973,
5
+ "eval_steps": 500,
6
  "global_step": 148,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.06756756756756757,
13
+ "grad_norm": 10.565461158752441,
14
  "learning_rate": 3.3333333333333335e-05,
15
+ "loss": 1.676,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.13513513513513514,
20
+ "grad_norm": 9.007370948791504,
21
  "learning_rate": 4.81203007518797e-05,
22
+ "loss": 1.3955,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 0.20270270270270271,
27
+ "grad_norm": 12.666777610778809,
28
  "learning_rate": 4.43609022556391e-05,
29
+ "loss": 1.0504,
30
  "step": 30
31
  },
32
  {
33
+ "epoch": 0.25675675675675674,
34
+ "eval_accuracy": 0.7285714285714285,
35
+ "eval_loss": 0.965540885925293,
36
+ "eval_runtime": 218.999,
37
+ "eval_samples_per_second": 0.32,
38
+ "eval_steps_per_second": 0.041,
39
  "step": 38
40
  },
41
  {
42
+ "epoch": 1.0135135135135136,
43
+ "grad_norm": 5.676259994506836,
44
  "learning_rate": 4.0601503759398494e-05,
45
+ "loss": 0.8752,
46
  "step": 40
47
  },
48
  {
49
+ "epoch": 1.0810810810810811,
50
+ "grad_norm": 13.729002952575684,
51
  "learning_rate": 3.6842105263157895e-05,
52
+ "loss": 0.5743,
53
  "step": 50
54
  },
55
  {
56
+ "epoch": 1.1486486486486487,
57
+ "grad_norm": 14.8609037399292,
58
  "learning_rate": 3.3082706766917295e-05,
59
+ "loss": 0.6753,
60
  "step": 60
61
  },
62
  {
63
+ "epoch": 1.2162162162162162,
64
+ "grad_norm": 13.474194526672363,
65
  "learning_rate": 2.9323308270676693e-05,
66
+ "loss": 0.5387,
67
  "step": 70
68
  },
69
  {
70
+ "epoch": 1.2567567567567568,
71
+ "eval_accuracy": 0.7571428571428571,
72
+ "eval_loss": 0.5636643767356873,
73
+ "eval_runtime": 215.3525,
74
+ "eval_samples_per_second": 0.325,
75
+ "eval_steps_per_second": 0.042,
76
  "step": 76
77
  },
78
  {
79
+ "epoch": 2.027027027027027,
80
+ "grad_norm": 8.333715438842773,
81
  "learning_rate": 2.556390977443609e-05,
82
+ "loss": 0.292,
83
  "step": 80
84
  },
85
  {
86
+ "epoch": 2.0945945945945947,
87
+ "grad_norm": 12.702014923095703,
88
  "learning_rate": 2.1804511278195487e-05,
89
+ "loss": 0.2774,
90
  "step": 90
91
  },
92
  {
93
+ "epoch": 2.1621621621621623,
94
+ "grad_norm": 22.819400787353516,
95
  "learning_rate": 1.8045112781954888e-05,
96
+ "loss": 0.2559,
97
  "step": 100
98
  },
99
  {
100
+ "epoch": 2.22972972972973,
101
+ "grad_norm": 11.329200744628906,
102
  "learning_rate": 1.4285714285714285e-05,
103
+ "loss": 0.2298,
104
  "step": 110
105
  },
106
  {
107
+ "epoch": 2.2567567567567566,
108
+ "eval_accuracy": 0.8285714285714286,
109
+ "eval_loss": 0.4615909159183502,
110
+ "eval_runtime": 220.3855,
111
+ "eval_samples_per_second": 0.318,
112
+ "eval_steps_per_second": 0.041,
113
  "step": 114
114
  },
115
  {
116
+ "epoch": 3.0405405405405403,
117
+ "grad_norm": 24.391935348510742,
118
  "learning_rate": 1.0526315789473684e-05,
119
+ "loss": 0.2461,
120
  "step": 120
121
  },
122
  {
123
+ "epoch": 3.108108108108108,
124
+ "grad_norm": 1.8534562587738037,
125
  "learning_rate": 6.766917293233083e-06,
126
+ "loss": 0.1163,
127
  "step": 130
128
  },
129
  {
130
+ "epoch": 3.175675675675676,
131
+ "grad_norm": 1.0798118114471436,
132
  "learning_rate": 3.007518796992481e-06,
133
+ "loss": 0.13,
134
  "step": 140
135
  },
136
  {
137
+ "epoch": 3.22972972972973,
138
+ "eval_accuracy": 0.8428571428571429,
139
+ "eval_loss": 0.4940463900566101,
140
+ "eval_runtime": 216.8735,
141
+ "eval_samples_per_second": 0.323,
142
+ "eval_steps_per_second": 0.041,
143
  "step": 148
144
  },
145
  {
146
+ "epoch": 3.22972972972973,
147
  "step": 148,
148
  "total_flos": 1.460491890402263e+18,
149
+ "train_loss": 0.5682408096822532,
150
+ "train_runtime": 21379.1283,
151
+ "train_samples_per_second": 0.055,
152
+ "train_steps_per_second": 0.007
153
+ },
154
+ {
155
+ "epoch": 3.22972972972973,
156
+ "eval_accuracy": 0.8451612903225807,
157
+ "eval_loss": 0.4450737237930298,
158
+ "eval_runtime": 471.2207,
159
+ "eval_samples_per_second": 0.329,
160
+ "eval_steps_per_second": 0.042,
161
  "step": 148
162
  },
163
  {
164
+ "epoch": 3.22972972972973,
165
+ "eval_accuracy": 0.8461538461538461,
166
+ "eval_loss": 0.44542694091796875,
167
+ "eval_runtime": 488.3429,
168
+ "eval_samples_per_second": 0.319,
169
+ "eval_steps_per_second": 0.041,
170
  "step": 148
171
  }
172
  ],
173
+ "logging_steps": 10,
174
  "max_steps": 148,
175
+ "num_input_tokens_seen": 0,
176
  "num_train_epochs": 9223372036854775807,
177
+ "save_steps": 500,
178
  "total_flos": 1.460491890402263e+18,
179
+ "train_batch_size": 8,
180
  "trial_name": null,
181
  "trial_params": null
182
  }