pavitemple committed on
Commit
d26b324
1 Parent(s): 8833e00

Model save

Browse files
Files changed (4) hide show
  1. README.md +2 -2
  2. all_results.json +5 -10
  3. train_results.json +5 -5
  4. trainer_state.json +150 -87
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 2.1163
21
- - Accuracy: 0.3594
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 1.7371
21
+ - Accuracy: 0.3704
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -1,12 +1,7 @@
1
  {
2
- "epoch": 8.09,
3
- "eval_accuracy": 0.25925925925925924,
4
- "eval_loss": 1.6813513040542603,
5
- "eval_runtime": 64.4906,
6
- "eval_samples_per_second": 0.419,
7
- "eval_steps_per_second": 0.109,
8
- "train_loss": 1.5179050036839077,
9
- "train_runtime": 4008.8343,
10
- "train_samples_per_second": 0.14,
11
- "train_steps_per_second": 0.009
12
  }
 
1
  {
2
+ "epoch": 17.03,
3
+ "train_loss": 1.4362963676452636,
4
+ "train_runtime": 8809.684,
5
+ "train_samples_per_second": 0.127,
6
+ "train_steps_per_second": 0.004
 
 
 
 
 
7
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 8.09,
3
- "train_loss": 1.5179050036839077,
4
- "train_runtime": 4008.8343,
5
- "train_samples_per_second": 0.14,
6
- "train_steps_per_second": 0.009
7
  }
 
1
  {
2
+ "epoch": 17.03,
3
+ "train_loss": 1.4362963676452636,
4
+ "train_runtime": 8809.684,
5
+ "train_samples_per_second": 0.127,
6
+ "train_steps_per_second": 0.004
7
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.34375,
3
- "best_model_checkpoint": "finetuned-Accident-MultipleLabels-Video-subset-v2-checkpointing/checkpoint-24",
4
- "epoch": 8.085714285714285,
5
  "eval_steps": 500,
6
  "global_step": 35,
7
  "is_hyper_param_search": false,
@@ -9,137 +9,200 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.11,
13
- "eval_accuracy": 0.265625,
14
- "eval_loss": 1.856452226638794,
15
- "eval_runtime": 208.3919,
16
- "eval_samples_per_second": 0.307,
17
- "eval_steps_per_second": 0.077,
 
 
 
 
 
 
 
 
 
18
  "step": 4
19
  },
20
  {
21
- "epoch": 1.11,
22
- "eval_accuracy": 0.265625,
23
- "eval_loss": 1.867037296295166,
24
- "eval_runtime": 204.858,
25
- "eval_samples_per_second": 0.312,
26
- "eval_steps_per_second": 0.078,
 
 
 
 
 
 
 
 
 
27
  "step": 8
28
  },
29
  {
30
- "epoch": 2.06,
31
  "learning_rate": 4.032258064516129e-05,
32
- "loss": 1.8022,
 
 
 
 
 
 
 
 
 
33
  "step": 10
34
  },
35
  {
36
- "epoch": 2.11,
37
- "eval_accuracy": 0.21875,
38
- "eval_loss": 1.9593775272369385,
39
- "eval_runtime": 158.8606,
40
- "eval_samples_per_second": 0.403,
41
- "eval_steps_per_second": 0.101,
42
  "step": 12
43
  },
44
  {
45
- "epoch": 3.11,
46
- "eval_accuracy": 0.296875,
47
- "eval_loss": 1.9278614521026611,
48
- "eval_runtime": 163.5324,
49
- "eval_samples_per_second": 0.391,
50
- "eval_steps_per_second": 0.098,
 
 
 
 
 
 
 
 
 
51
  "step": 16
52
  },
53
  {
54
- "epoch": 4.11,
 
 
 
 
 
 
 
 
 
55
  "learning_rate": 2.4193548387096777e-05,
56
- "loss": 1.4448,
57
  "step": 20
58
  },
59
  {
60
- "epoch": 4.11,
61
- "eval_accuracy": 0.296875,
62
- "eval_loss": 1.910567283630371,
63
- "eval_runtime": 161.4632,
64
- "eval_samples_per_second": 0.396,
65
- "eval_steps_per_second": 0.099,
66
  "step": 20
67
  },
68
  {
69
- "epoch": 5.11,
70
- "eval_accuracy": 0.34375,
71
- "eval_loss": 1.8732622861862183,
72
- "eval_runtime": 158.3884,
73
- "eval_samples_per_second": 0.404,
74
- "eval_steps_per_second": 0.101,
 
 
 
 
 
 
 
 
 
75
  "step": 24
76
  },
77
  {
78
- "epoch": 6.11,
79
- "eval_accuracy": 0.3125,
80
- "eval_loss": 1.8884299993515015,
81
- "eval_runtime": 159.9497,
82
- "eval_samples_per_second": 0.4,
83
- "eval_steps_per_second": 0.1,
 
 
 
 
 
 
 
 
 
84
  "step": 28
85
  },
86
  {
87
- "epoch": 7.06,
88
  "learning_rate": 8.064516129032258e-06,
89
- "loss": 1.3906,
90
  "step": 30
91
  },
92
  {
93
- "epoch": 7.11,
94
- "eval_accuracy": 0.28125,
95
- "eval_loss": 1.8995435237884521,
96
- "eval_runtime": 165.6513,
97
- "eval_samples_per_second": 0.386,
98
- "eval_steps_per_second": 0.097,
 
 
 
 
 
 
 
 
 
99
  "step": 32
100
  },
101
  {
102
- "epoch": 8.09,
103
- "eval_accuracy": 0.28125,
104
- "eval_loss": 1.9018282890319824,
105
- "eval_runtime": 160.8854,
106
- "eval_samples_per_second": 0.398,
107
- "eval_steps_per_second": 0.099,
108
- "step": 35
109
  },
110
  {
111
- "epoch": 8.09,
112
- "step": 35,
113
- "total_flos": 6.978272853255782e+17,
114
- "train_loss": 1.5179050036839077,
115
- "train_runtime": 4008.8343,
116
- "train_samples_per_second": 0.14,
117
- "train_steps_per_second": 0.009
118
- },
119
- {
120
- "epoch": 8.09,
121
- "eval_accuracy": 0.25925925925925924,
122
- "eval_loss": 1.6813514232635498,
123
- "eval_runtime": 64.3768,
124
- "eval_samples_per_second": 0.419,
125
- "eval_steps_per_second": 0.109,
126
  "step": 35
127
  },
128
  {
129
- "epoch": 8.09,
130
- "eval_accuracy": 0.25925925925925924,
131
- "eval_loss": 1.6813513040542603,
132
- "eval_runtime": 64.4906,
133
- "eval_samples_per_second": 0.419,
134
- "eval_steps_per_second": 0.109,
135
- "step": 35
136
  }
137
  ],
138
  "logging_steps": 10,
139
  "max_steps": 35,
140
  "num_train_epochs": 9223372036854775807,
141
  "save_steps": 500,
142
- "total_flos": 6.978272853255782e+17,
143
  "trial_name": null,
144
  "trial_params": null
145
  }
 
1
  {
2
+ "best_metric": 0.390625,
3
+ "best_model_checkpoint": "finetuned-Accident-MultipleLabels-Video-subset-v2-checkpointing/checkpoint-4",
4
+ "epoch": 17.02857142857143,
5
  "eval_steps": 500,
6
  "global_step": 35,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.06,
13
+ "eval_accuracy": 0.359375,
14
+ "eval_loss": 1.7265217304229736,
15
+ "eval_runtime": 228.6142,
16
+ "eval_samples_per_second": 0.28,
17
+ "eval_steps_per_second": 0.035,
18
+ "step": 2
19
+ },
20
+ {
21
+ "epoch": 1.06,
22
+ "eval_accuracy": 0.390625,
23
+ "eval_loss": 1.6976414918899536,
24
+ "eval_runtime": 225.5421,
25
+ "eval_samples_per_second": 0.284,
26
+ "eval_steps_per_second": 0.035,
27
  "step": 4
28
  },
29
  {
30
+ "epoch": 2.06,
31
+ "eval_accuracy": 0.359375,
32
+ "eval_loss": 1.7503018379211426,
33
+ "eval_runtime": 176.7414,
34
+ "eval_samples_per_second": 0.362,
35
+ "eval_steps_per_second": 0.045,
36
+ "step": 6
37
+ },
38
+ {
39
+ "epoch": 3.06,
40
+ "eval_accuracy": 0.3125,
41
+ "eval_loss": 1.8830795288085938,
42
+ "eval_runtime": 175.1171,
43
+ "eval_samples_per_second": 0.365,
44
+ "eval_steps_per_second": 0.046,
45
  "step": 8
46
  },
47
  {
48
+ "epoch": 4.06,
49
  "learning_rate": 4.032258064516129e-05,
50
+ "loss": 1.7254,
51
+ "step": 10
52
+ },
53
+ {
54
+ "epoch": 4.06,
55
+ "eval_accuracy": 0.171875,
56
+ "eval_loss": 2.0285067558288574,
57
+ "eval_runtime": 184.7182,
58
+ "eval_samples_per_second": 0.346,
59
+ "eval_steps_per_second": 0.043,
60
  "step": 10
61
  },
62
  {
63
+ "epoch": 5.06,
64
+ "eval_accuracy": 0.28125,
65
+ "eval_loss": 2.039059638977051,
66
+ "eval_runtime": 178.8587,
67
+ "eval_samples_per_second": 0.358,
68
+ "eval_steps_per_second": 0.045,
69
  "step": 12
70
  },
71
  {
72
+ "epoch": 6.06,
73
+ "eval_accuracy": 0.328125,
74
+ "eval_loss": 1.9736883640289307,
75
+ "eval_runtime": 179.8546,
76
+ "eval_samples_per_second": 0.356,
77
+ "eval_steps_per_second": 0.044,
78
+ "step": 14
79
+ },
80
+ {
81
+ "epoch": 7.06,
82
+ "eval_accuracy": 0.375,
83
+ "eval_loss": 1.8998150825500488,
84
+ "eval_runtime": 172.5948,
85
+ "eval_samples_per_second": 0.371,
86
+ "eval_steps_per_second": 0.046,
87
  "step": 16
88
  },
89
  {
90
+ "epoch": 8.06,
91
+ "eval_accuracy": 0.375,
92
+ "eval_loss": 1.8785591125488281,
93
+ "eval_runtime": 169.9356,
94
+ "eval_samples_per_second": 0.377,
95
+ "eval_steps_per_second": 0.047,
96
+ "step": 18
97
+ },
98
+ {
99
+ "epoch": 9.06,
100
  "learning_rate": 2.4193548387096777e-05,
101
+ "loss": 1.394,
102
  "step": 20
103
  },
104
  {
105
+ "epoch": 9.06,
106
+ "eval_accuracy": 0.34375,
107
+ "eval_loss": 1.9054185152053833,
108
+ "eval_runtime": 179.2066,
109
+ "eval_samples_per_second": 0.357,
110
+ "eval_steps_per_second": 0.045,
111
  "step": 20
112
  },
113
  {
114
+ "epoch": 10.06,
115
+ "eval_accuracy": 0.328125,
116
+ "eval_loss": 1.9473646879196167,
117
+ "eval_runtime": 173.6519,
118
+ "eval_samples_per_second": 0.369,
119
+ "eval_steps_per_second": 0.046,
120
+ "step": 22
121
+ },
122
+ {
123
+ "epoch": 11.06,
124
+ "eval_accuracy": 0.328125,
125
+ "eval_loss": 2.003166675567627,
126
+ "eval_runtime": 174.1677,
127
+ "eval_samples_per_second": 0.367,
128
+ "eval_steps_per_second": 0.046,
129
  "step": 24
130
  },
131
  {
132
+ "epoch": 12.06,
133
+ "eval_accuracy": 0.328125,
134
+ "eval_loss": 2.072862386703491,
135
+ "eval_runtime": 196.1804,
136
+ "eval_samples_per_second": 0.326,
137
+ "eval_steps_per_second": 0.041,
138
+ "step": 26
139
+ },
140
+ {
141
+ "epoch": 13.06,
142
+ "eval_accuracy": 0.34375,
143
+ "eval_loss": 2.108105421066284,
144
+ "eval_runtime": 180.4592,
145
+ "eval_samples_per_second": 0.355,
146
+ "eval_steps_per_second": 0.044,
147
  "step": 28
148
  },
149
  {
150
+ "epoch": 14.06,
151
  "learning_rate": 8.064516129032258e-06,
152
+ "loss": 1.285,
153
  "step": 30
154
  },
155
  {
156
+ "epoch": 14.06,
157
+ "eval_accuracy": 0.328125,
158
+ "eval_loss": 2.1189751625061035,
159
+ "eval_runtime": 180.6898,
160
+ "eval_samples_per_second": 0.354,
161
+ "eval_steps_per_second": 0.044,
162
+ "step": 30
163
+ },
164
+ {
165
+ "epoch": 15.06,
166
+ "eval_accuracy": 0.34375,
167
+ "eval_loss": 2.1188015937805176,
168
+ "eval_runtime": 172.3883,
169
+ "eval_samples_per_second": 0.371,
170
+ "eval_steps_per_second": 0.046,
171
  "step": 32
172
  },
173
  {
174
+ "epoch": 16.06,
175
+ "eval_accuracy": 0.359375,
176
+ "eval_loss": 2.1155242919921875,
177
+ "eval_runtime": 169.8241,
178
+ "eval_samples_per_second": 0.377,
179
+ "eval_steps_per_second": 0.047,
180
+ "step": 34
181
  },
182
  {
183
+ "epoch": 17.03,
184
+ "eval_accuracy": 0.359375,
185
+ "eval_loss": 2.116347312927246,
186
+ "eval_runtime": 177.6799,
187
+ "eval_samples_per_second": 0.36,
188
+ "eval_steps_per_second": 0.045,
 
 
 
 
 
 
 
 
 
189
  "step": 35
190
  },
191
  {
192
+ "epoch": 17.03,
193
+ "step": 35,
194
+ "total_flos": 1.3956545706511565e+18,
195
+ "train_loss": 1.4362963676452636,
196
+ "train_runtime": 8809.684,
197
+ "train_samples_per_second": 0.127,
198
+ "train_steps_per_second": 0.004
199
  }
200
  ],
201
  "logging_steps": 10,
202
  "max_steps": 35,
203
  "num_train_epochs": 9223372036854775807,
204
  "save_steps": 500,
205
+ "total_flos": 1.3956545706511565e+18,
206
  "trial_name": null,
207
  "trial_params": null
208
  }