Augusto777 committed on
Commit
36b9dc8
1 Parent(s): 2fc032c

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7450980392156863
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.6647
36
- - Accuracy: 0.7451
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7843137254901961
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6632
36
+ - Accuracy: 0.7843
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 11.61,
3
  "eval_accuracy": 0.7843137254901961,
4
- "eval_loss": 0.662259042263031,
5
- "eval_runtime": 1.0269,
6
- "eval_samples_per_second": 49.664,
7
- "eval_steps_per_second": 1.948,
8
- "train_loss": 0.5402387758096059,
9
- "train_runtime": 360.9103,
10
- "train_samples_per_second": 65.401,
11
- "train_steps_per_second": 0.499
12
  }
 
1
  {
2
+ "epoch": 11.43,
3
  "eval_accuracy": 0.7843137254901961,
4
+ "eval_loss": 0.6632380485534668,
5
+ "eval_runtime": 1.0573,
6
+ "eval_samples_per_second": 48.238,
7
+ "eval_steps_per_second": 1.892,
8
+ "train_loss": 0.5450452705224355,
9
+ "train_runtime": 382.131,
10
+ "train_samples_per_second": 63.12,
11
+ "train_steps_per_second": 0.471
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 11.61,
3
  "eval_accuracy": 0.7843137254901961,
4
- "eval_loss": 0.662259042263031,
5
- "eval_runtime": 1.0269,
6
- "eval_samples_per_second": 49.664,
7
- "eval_steps_per_second": 1.948
8
  }
 
1
  {
2
+ "epoch": 11.43,
3
  "eval_accuracy": 0.7843137254901961,
4
+ "eval_loss": 0.6632380485534668,
5
+ "eval_runtime": 1.0573,
6
+ "eval_samples_per_second": 48.238,
7
+ "eval_steps_per_second": 1.892
8
  }
runs/Jun11_16-10-07_DESKTOP-SKBE9FB/events.out.tfevents.1718144279.DESKTOP-SKBE9FB.7192.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21c2bfd68cc9fffeb13536d5887d39f757ddb29022b6edbc32c7d7653772989f
3
+ size 411
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 11.61,
3
- "train_loss": 0.5402387758096059,
4
- "train_runtime": 360.9103,
5
- "train_samples_per_second": 65.401,
6
- "train_steps_per_second": 0.499
7
  }
 
1
  {
2
+ "epoch": 11.43,
3
+ "train_loss": 0.5450452705224355,
4
+ "train_runtime": 382.131,
5
+ "train_samples_per_second": 63.12,
6
+ "train_steps_per_second": 0.471
7
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "best_metric": 0.7843137254901961,
3
- "best_model_checkpoint": "vit-base-patch16-224-ve-U10-12\\checkpoint-108",
4
- "epoch": 11.612903225806452,
5
  "eval_steps": 500,
6
  "global_step": 180,
7
  "is_hyper_param_search": false,
@@ -9,229 +9,229 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.65,
13
  "learning_rate": 5.467836257309941e-05,
14
- "loss": 1.3659,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 0.97,
19
  "eval_accuracy": 0.47058823529411764,
20
- "eval_loss": 1.2287312746047974,
21
- "eval_runtime": 0.9667,
22
- "eval_samples_per_second": 52.757,
23
- "eval_steps_per_second": 2.069,
24
  "step": 15
25
  },
26
  {
27
- "epoch": 1.29,
28
  "learning_rate": 5.1461988304093566e-05,
29
- "loss": 1.2407,
30
  "step": 20
31
  },
32
  {
33
- "epoch": 1.94,
34
  "learning_rate": 4.824561403508772e-05,
35
- "loss": 1.1063,
36
  "step": 30
37
  },
38
  {
39
- "epoch": 2.0,
40
- "eval_accuracy": 0.6862745098039216,
41
- "eval_loss": 1.0233995914459229,
42
- "eval_runtime": 0.8689,
43
- "eval_samples_per_second": 58.697,
44
- "eval_steps_per_second": 2.302,
45
  "step": 31
46
  },
47
  {
48
- "epoch": 2.58,
49
  "learning_rate": 4.502923976608187e-05,
50
- "loss": 0.9468,
51
  "step": 40
52
  },
53
  {
54
- "epoch": 2.97,
55
- "eval_accuracy": 0.6862745098039216,
56
- "eval_loss": 0.8665008544921875,
57
- "eval_runtime": 0.8118,
58
- "eval_samples_per_second": 62.826,
59
- "eval_steps_per_second": 2.464,
60
- "step": 46
61
  },
62
  {
63
- "epoch": 3.23,
64
  "learning_rate": 4.1812865497076025e-05,
65
- "loss": 0.8276,
66
  "step": 50
67
  },
68
  {
69
- "epoch": 3.87,
70
  "learning_rate": 3.859649122807018e-05,
71
- "loss": 0.6825,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
  "eval_accuracy": 0.7058823529411765,
77
- "eval_loss": 0.7481548190116882,
78
- "eval_runtime": 0.7724,
79
- "eval_samples_per_second": 66.031,
80
- "eval_steps_per_second": 2.589,
81
- "step": 62
82
  },
83
  {
84
- "epoch": 4.52,
85
  "learning_rate": 3.5380116959064324e-05,
86
- "loss": 0.5534,
87
  "step": 70
88
  },
89
  {
90
- "epoch": 4.97,
91
- "eval_accuracy": 0.7058823529411765,
92
- "eval_loss": 0.7608624696731567,
93
- "eval_runtime": 0.8338,
94
- "eval_samples_per_second": 61.167,
95
- "eval_steps_per_second": 2.399,
96
- "step": 77
97
  },
98
  {
99
- "epoch": 5.16,
100
  "learning_rate": 3.216374269005848e-05,
101
- "loss": 0.4733,
102
  "step": 80
103
  },
104
  {
105
- "epoch": 5.81,
106
  "learning_rate": 2.894736842105263e-05,
107
- "loss": 0.4019,
108
  "step": 90
109
  },
110
  {
111
- "epoch": 6.0,
112
  "eval_accuracy": 0.7254901960784313,
113
- "eval_loss": 0.7092276215553284,
114
- "eval_runtime": 0.7947,
115
- "eval_samples_per_second": 64.177,
116
- "eval_steps_per_second": 2.517,
117
- "step": 93
118
  },
119
  {
120
- "epoch": 6.45,
121
  "learning_rate": 2.5730994152046783e-05,
122
- "loss": 0.3323,
123
  "step": 100
124
  },
125
  {
126
- "epoch": 6.97,
127
- "eval_accuracy": 0.7843137254901961,
128
- "eval_loss": 0.662259042263031,
129
- "eval_runtime": 0.7839,
130
- "eval_samples_per_second": 65.057,
131
- "eval_steps_per_second": 2.551,
132
- "step": 108
133
  },
134
  {
135
- "epoch": 7.1,
136
- "learning_rate": 2.2514619883040936e-05,
137
- "loss": 0.2759,
 
 
 
138
  "step": 110
139
  },
140
  {
141
- "epoch": 7.74,
142
  "learning_rate": 1.929824561403509e-05,
143
- "loss": 0.2743,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
- "eval_accuracy": 0.7058823529411765,
149
- "eval_loss": 0.7407493591308594,
150
- "eval_runtime": 0.7753,
151
- "eval_samples_per_second": 65.783,
152
- "eval_steps_per_second": 2.58,
153
- "step": 124
154
  },
155
  {
156
- "epoch": 8.39,
157
  "learning_rate": 1.608187134502924e-05,
158
- "loss": 0.2411,
159
  "step": 130
160
  },
161
  {
162
- "epoch": 8.97,
163
- "eval_accuracy": 0.7647058823529411,
164
- "eval_loss": 0.6248741745948792,
165
- "eval_runtime": 0.8159,
166
- "eval_samples_per_second": 62.507,
167
- "eval_steps_per_second": 2.451,
168
- "step": 139
169
- },
170
- {
171
- "epoch": 9.03,
172
  "learning_rate": 1.2865497076023392e-05,
173
- "loss": 0.2379,
174
  "step": 140
175
  },
176
  {
177
- "epoch": 9.68,
 
 
 
 
 
 
 
 
 
178
  "learning_rate": 9.649122807017545e-06,
179
- "loss": 0.2021,
180
  "step": 150
181
  },
182
  {
183
- "epoch": 10.0,
184
  "eval_accuracy": 0.7450980392156863,
185
- "eval_loss": 0.7221617102622986,
186
- "eval_runtime": 0.7603,
187
- "eval_samples_per_second": 67.081,
188
- "eval_steps_per_second": 2.631,
189
- "step": 155
190
  },
191
  {
192
- "epoch": 10.32,
193
  "learning_rate": 6.432748538011696e-06,
194
- "loss": 0.195,
195
  "step": 160
196
  },
197
  {
198
- "epoch": 10.97,
199
  "learning_rate": 3.216374269005848e-06,
200
- "loss": 0.1925,
201
  "step": 170
202
  },
203
  {
204
- "epoch": 10.97,
205
- "eval_accuracy": 0.7058823529411765,
206
- "eval_loss": 0.7807687520980835,
207
- "eval_runtime": 0.7671,
208
- "eval_samples_per_second": 66.482,
209
- "eval_steps_per_second": 2.607,
210
- "step": 170
211
  },
212
  {
213
- "epoch": 11.61,
214
  "learning_rate": 0.0,
215
- "loss": 0.1748,
216
  "step": 180
217
  },
218
  {
219
- "epoch": 11.61,
220
- "eval_accuracy": 0.7254901960784313,
221
- "eval_loss": 0.7451220750808716,
222
- "eval_runtime": 0.7609,
223
- "eval_samples_per_second": 67.03,
224
- "eval_steps_per_second": 2.629,
225
  "step": 180
226
  },
227
  {
228
- "epoch": 11.61,
229
  "step": 180,
230
- "total_flos": 1.7709561831334625e+18,
231
- "train_loss": 0.5402387758096059,
232
- "train_runtime": 360.9103,
233
- "train_samples_per_second": 65.401,
234
- "train_steps_per_second": 0.499
235
  }
236
  ],
237
  "logging_steps": 10,
@@ -239,7 +239,7 @@
239
  "num_input_tokens_seen": 0,
240
  "num_train_epochs": 12,
241
  "save_steps": 500,
242
- "total_flos": 1.7709561831334625e+18,
243
  "train_batch_size": 32,
244
  "trial_name": null,
245
  "trial_params": null
 
1
  {
2
  "best_metric": 0.7843137254901961,
3
+ "best_model_checkpoint": "vit-base-patch16-224-ve-U10-12\\checkpoint-141",
4
+ "epoch": 11.428571428571429,
5
  "eval_steps": 500,
6
  "global_step": 180,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.63,
13
  "learning_rate": 5.467836257309941e-05,
14
+ "loss": 1.3629,
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 0.95,
19
  "eval_accuracy": 0.47058823529411764,
20
+ "eval_loss": 1.2289341688156128,
21
+ "eval_runtime": 0.8291,
22
+ "eval_samples_per_second": 61.515,
23
+ "eval_steps_per_second": 2.412,
24
  "step": 15
25
  },
26
  {
27
+ "epoch": 1.27,
28
  "learning_rate": 5.1461988304093566e-05,
29
+ "loss": 1.2419,
30
  "step": 20
31
  },
32
  {
33
+ "epoch": 1.9,
34
  "learning_rate": 4.824561403508772e-05,
35
+ "loss": 1.1038,
36
  "step": 30
37
  },
38
  {
39
+ "epoch": 1.97,
40
+ "eval_accuracy": 0.5882352941176471,
41
+ "eval_loss": 1.041306734085083,
42
+ "eval_runtime": 0.8646,
43
+ "eval_samples_per_second": 58.985,
44
+ "eval_steps_per_second": 2.313,
45
  "step": 31
46
  },
47
  {
48
+ "epoch": 2.54,
49
  "learning_rate": 4.502923976608187e-05,
50
+ "loss": 0.9375,
51
  "step": 40
52
  },
53
  {
54
+ "epoch": 2.98,
55
+ "eval_accuracy": 0.5882352941176471,
56
+ "eval_loss": 0.8989145755767822,
57
+ "eval_runtime": 0.8079,
58
+ "eval_samples_per_second": 63.128,
59
+ "eval_steps_per_second": 2.476,
60
+ "step": 47
61
  },
62
  {
63
+ "epoch": 3.17,
64
  "learning_rate": 4.1812865497076025e-05,
65
+ "loss": 0.7972,
66
  "step": 50
67
  },
68
  {
69
+ "epoch": 3.81,
70
  "learning_rate": 3.859649122807018e-05,
71
+ "loss": 0.6917,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
  "eval_accuracy": 0.7058823529411765,
77
+ "eval_loss": 0.8519924283027649,
78
+ "eval_runtime": 0.8135,
79
+ "eval_samples_per_second": 62.692,
80
+ "eval_steps_per_second": 2.459,
81
+ "step": 63
82
  },
83
  {
84
+ "epoch": 4.44,
85
  "learning_rate": 3.5380116959064324e-05,
86
+ "loss": 0.5862,
87
  "step": 70
88
  },
89
  {
90
+ "epoch": 4.95,
91
+ "eval_accuracy": 0.7254901960784313,
92
+ "eval_loss": 0.6827210783958435,
93
+ "eval_runtime": 0.8863,
94
+ "eval_samples_per_second": 57.54,
95
+ "eval_steps_per_second": 2.256,
96
+ "step": 78
97
  },
98
  {
99
+ "epoch": 5.08,
100
  "learning_rate": 3.216374269005848e-05,
101
+ "loss": 0.5063,
102
  "step": 80
103
  },
104
  {
105
+ "epoch": 5.71,
106
  "learning_rate": 2.894736842105263e-05,
107
+ "loss": 0.4042,
108
  "step": 90
109
  },
110
  {
111
+ "epoch": 5.97,
112
  "eval_accuracy": 0.7254901960784313,
113
+ "eval_loss": 0.728096067905426,
114
+ "eval_runtime": 0.8825,
115
+ "eval_samples_per_second": 57.792,
116
+ "eval_steps_per_second": 2.266,
117
+ "step": 94
118
  },
119
  {
120
+ "epoch": 6.35,
121
  "learning_rate": 2.5730994152046783e-05,
122
+ "loss": 0.3605,
123
  "step": 100
124
  },
125
  {
126
+ "epoch": 6.98,
127
+ "learning_rate": 2.2514619883040936e-05,
128
+ "loss": 0.2987,
129
+ "step": 110
 
 
 
130
  },
131
  {
132
+ "epoch": 6.98,
133
+ "eval_accuracy": 0.7647058823529411,
134
+ "eval_loss": 0.7262123823165894,
135
+ "eval_runtime": 0.849,
136
+ "eval_samples_per_second": 60.074,
137
+ "eval_steps_per_second": 2.356,
138
  "step": 110
139
  },
140
  {
141
+ "epoch": 7.62,
142
  "learning_rate": 1.929824561403509e-05,
143
+ "loss": 0.2571,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
+ "eval_accuracy": 0.7254901960784313,
149
+ "eval_loss": 0.7603896856307983,
150
+ "eval_runtime": 0.8862,
151
+ "eval_samples_per_second": 57.552,
152
+ "eval_steps_per_second": 2.257,
153
+ "step": 126
154
  },
155
  {
156
+ "epoch": 8.25,
157
  "learning_rate": 1.608187134502924e-05,
158
+ "loss": 0.249,
159
  "step": 130
160
  },
161
  {
162
+ "epoch": 8.89,
 
 
 
 
 
 
 
 
 
163
  "learning_rate": 1.2865497076023392e-05,
164
+ "loss": 0.2326,
165
  "step": 140
166
  },
167
  {
168
+ "epoch": 8.95,
169
+ "eval_accuracy": 0.7843137254901961,
170
+ "eval_loss": 0.6632380485534668,
171
+ "eval_runtime": 0.7605,
172
+ "eval_samples_per_second": 67.061,
173
+ "eval_steps_per_second": 2.63,
174
+ "step": 141
175
+ },
176
+ {
177
+ "epoch": 9.52,
178
  "learning_rate": 9.649122807017545e-06,
179
+ "loss": 0.1994,
180
  "step": 150
181
  },
182
  {
183
+ "epoch": 9.97,
184
  "eval_accuracy": 0.7450980392156863,
185
+ "eval_loss": 0.6744426488876343,
186
+ "eval_runtime": 0.8645,
187
+ "eval_samples_per_second": 58.993,
188
+ "eval_steps_per_second": 2.313,
189
+ "step": 157
190
  },
191
  {
192
+ "epoch": 10.16,
193
  "learning_rate": 6.432748538011696e-06,
194
+ "loss": 0.2004,
195
  "step": 160
196
  },
197
  {
198
+ "epoch": 10.79,
199
  "learning_rate": 3.216374269005848e-06,
200
+ "loss": 0.1968,
201
  "step": 170
202
  },
203
  {
204
+ "epoch": 10.98,
205
+ "eval_accuracy": 0.7450980392156863,
206
+ "eval_loss": 0.6864146590232849,
207
+ "eval_runtime": 0.7962,
208
+ "eval_samples_per_second": 64.055,
209
+ "eval_steps_per_second": 2.512,
210
+ "step": 173
211
  },
212
  {
213
+ "epoch": 11.43,
214
  "learning_rate": 0.0,
215
+ "loss": 0.1847,
216
  "step": 180
217
  },
218
  {
219
+ "epoch": 11.43,
220
+ "eval_accuracy": 0.7450980392156863,
221
+ "eval_loss": 0.6646667122840881,
222
+ "eval_runtime": 0.7818,
223
+ "eval_samples_per_second": 65.235,
224
+ "eval_steps_per_second": 2.558,
225
  "step": 180
226
  },
227
  {
228
+ "epoch": 11.43,
229
  "step": 180,
230
+ "total_flos": 1.7803328819545866e+18,
231
+ "train_loss": 0.5450452705224355,
232
+ "train_runtime": 382.131,
233
+ "train_samples_per_second": 63.12,
234
+ "train_steps_per_second": 0.471
235
  }
236
  ],
237
  "logging_steps": 10,
 
239
  "num_input_tokens_seen": 0,
240
  "num_train_epochs": 12,
241
  "save_steps": 500,
242
+ "total_flos": 1.7803328819545866e+18,
243
  "train_batch_size": 32,
244
  "trial_name": null,
245
  "trial_params": null