Augusto777 committed on
Commit
1695856
1 Parent(s): 34fe695

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.8913043478260869
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.4598
36
- - Accuracy: 0.8913
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.9130434782608695
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.4436
36
+ - Accuracy: 0.9130
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.15,
3
+ "eval_accuracy": 0.9130434782608695,
4
+ "eval_loss": 0.4435981810092926,
5
+ "eval_runtime": 1.0777,
6
+ "eval_samples_per_second": 42.684,
7
+ "eval_steps_per_second": 1.856,
8
+ "train_loss": 0.689174536201689,
9
+ "train_runtime": 307.4489,
10
+ "train_samples_per_second": 63.933,
11
+ "train_steps_per_second": 0.468
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.15,
3
+ "eval_accuracy": 0.9130434782608695,
4
+ "eval_loss": 0.4435981810092926,
5
+ "eval_runtime": 1.0777,
6
+ "eval_samples_per_second": 42.684,
7
+ "eval_steps_per_second": 1.856
8
+ }
runs/Jun11_19-14-06_DESKTOP-SKBE9FB/events.out.tfevents.1718155257.DESKTOP-SKBE9FB.15056.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72ac191069a0b41061a5c354b6b04f651bd7baffb5460c520896d45f00edd700
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.15,
3
+ "train_loss": 0.689174536201689,
4
+ "train_runtime": 307.4489,
5
+ "train_samples_per_second": 63.933,
6
+ "train_steps_per_second": 0.468
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,321 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9130434782608695,
3
+ "best_model_checkpoint": "vit-base-patch16-224-ve-U11-b-24\\checkpoint-117",
4
+ "epoch": 22.153846153846153,
5
+ "eval_steps": 500,
6
+ "global_step": 144,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.92,
13
+ "eval_accuracy": 0.5434782608695652,
14
+ "eval_loss": 1.3798073530197144,
15
+ "eval_runtime": 0.9211,
16
+ "eval_samples_per_second": 49.941,
17
+ "eval_steps_per_second": 2.171,
18
+ "step": 6
19
+ },
20
+ {
21
+ "epoch": 1.54,
22
+ "learning_rate": 5.419117647058824e-05,
23
+ "loss": 1.3792,
24
+ "step": 10
25
+ },
26
+ {
27
+ "epoch": 2.0,
28
+ "eval_accuracy": 0.6521739130434783,
29
+ "eval_loss": 1.3090617656707764,
30
+ "eval_runtime": 0.8387,
31
+ "eval_samples_per_second": 54.85,
32
+ "eval_steps_per_second": 2.385,
33
+ "step": 13
34
+ },
35
+ {
36
+ "epoch": 2.92,
37
+ "eval_accuracy": 0.5869565217391305,
38
+ "eval_loss": 1.2226966619491577,
39
+ "eval_runtime": 0.7418,
40
+ "eval_samples_per_second": 62.012,
41
+ "eval_steps_per_second": 2.696,
42
+ "step": 19
43
+ },
44
+ {
45
+ "epoch": 3.08,
46
+ "learning_rate": 5.0147058823529414e-05,
47
+ "loss": 1.2783,
48
+ "step": 20
49
+ },
50
+ {
51
+ "epoch": 4.0,
52
+ "eval_accuracy": 0.6086956521739131,
53
+ "eval_loss": 1.1262723207473755,
54
+ "eval_runtime": 0.7431,
55
+ "eval_samples_per_second": 61.9,
56
+ "eval_steps_per_second": 2.691,
57
+ "step": 26
58
+ },
59
+ {
60
+ "epoch": 4.62,
61
+ "learning_rate": 4.610294117647059e-05,
62
+ "loss": 1.1226,
63
+ "step": 30
64
+ },
65
+ {
66
+ "epoch": 4.92,
67
+ "eval_accuracy": 0.6521739130434783,
68
+ "eval_loss": 1.0465526580810547,
69
+ "eval_runtime": 0.7448,
70
+ "eval_samples_per_second": 61.765,
71
+ "eval_steps_per_second": 2.685,
72
+ "step": 32
73
+ },
74
+ {
75
+ "epoch": 6.0,
76
+ "eval_accuracy": 0.5869565217391305,
77
+ "eval_loss": 0.9854069352149963,
78
+ "eval_runtime": 0.7677,
79
+ "eval_samples_per_second": 59.917,
80
+ "eval_steps_per_second": 2.605,
81
+ "step": 39
82
+ },
83
+ {
84
+ "epoch": 6.15,
85
+ "learning_rate": 4.205882352941176e-05,
86
+ "loss": 0.9881,
87
+ "step": 40
88
+ },
89
+ {
90
+ "epoch": 6.92,
91
+ "eval_accuracy": 0.6956521739130435,
92
+ "eval_loss": 0.9302965402603149,
93
+ "eval_runtime": 0.7343,
94
+ "eval_samples_per_second": 62.642,
95
+ "eval_steps_per_second": 2.724,
96
+ "step": 45
97
+ },
98
+ {
99
+ "epoch": 7.69,
100
+ "learning_rate": 3.801470588235294e-05,
101
+ "loss": 0.8707,
102
+ "step": 50
103
+ },
104
+ {
105
+ "epoch": 8.0,
106
+ "eval_accuracy": 0.782608695652174,
107
+ "eval_loss": 0.8805552124977112,
108
+ "eval_runtime": 0.7752,
109
+ "eval_samples_per_second": 59.337,
110
+ "eval_steps_per_second": 2.58,
111
+ "step": 52
112
+ },
113
+ {
114
+ "epoch": 8.92,
115
+ "eval_accuracy": 0.782608695652174,
116
+ "eval_loss": 0.8234447240829468,
117
+ "eval_runtime": 0.726,
118
+ "eval_samples_per_second": 63.36,
119
+ "eval_steps_per_second": 2.755,
120
+ "step": 58
121
+ },
122
+ {
123
+ "epoch": 9.23,
124
+ "learning_rate": 3.397058823529412e-05,
125
+ "loss": 0.7604,
126
+ "step": 60
127
+ },
128
+ {
129
+ "epoch": 10.0,
130
+ "eval_accuracy": 0.8260869565217391,
131
+ "eval_loss": 0.7159415483474731,
132
+ "eval_runtime": 0.7512,
133
+ "eval_samples_per_second": 61.236,
134
+ "eval_steps_per_second": 2.662,
135
+ "step": 65
136
+ },
137
+ {
138
+ "epoch": 10.77,
139
+ "learning_rate": 2.992647058823529e-05,
140
+ "loss": 0.6452,
141
+ "step": 70
142
+ },
143
+ {
144
+ "epoch": 10.92,
145
+ "eval_accuracy": 0.8478260869565217,
146
+ "eval_loss": 0.6929341554641724,
147
+ "eval_runtime": 0.7972,
148
+ "eval_samples_per_second": 57.705,
149
+ "eval_steps_per_second": 2.509,
150
+ "step": 71
151
+ },
152
+ {
153
+ "epoch": 12.0,
154
+ "eval_accuracy": 0.8695652173913043,
155
+ "eval_loss": 0.6490562558174133,
156
+ "eval_runtime": 0.7845,
157
+ "eval_samples_per_second": 58.637,
158
+ "eval_steps_per_second": 2.549,
159
+ "step": 78
160
+ },
161
+ {
162
+ "epoch": 12.31,
163
+ "learning_rate": 2.5882352941176472e-05,
164
+ "loss": 0.5576,
165
+ "step": 80
166
+ },
167
+ {
168
+ "epoch": 12.92,
169
+ "eval_accuracy": 0.8478260869565217,
170
+ "eval_loss": 0.5923656225204468,
171
+ "eval_runtime": 0.7527,
172
+ "eval_samples_per_second": 61.115,
173
+ "eval_steps_per_second": 2.657,
174
+ "step": 84
175
+ },
176
+ {
177
+ "epoch": 13.85,
178
+ "learning_rate": 2.1838235294117645e-05,
179
+ "loss": 0.4708,
180
+ "step": 90
181
+ },
182
+ {
183
+ "epoch": 14.0,
184
+ "eval_accuracy": 0.8478260869565217,
185
+ "eval_loss": 0.5550963878631592,
186
+ "eval_runtime": 0.8057,
187
+ "eval_samples_per_second": 57.091,
188
+ "eval_steps_per_second": 2.482,
189
+ "step": 91
190
+ },
191
+ {
192
+ "epoch": 14.92,
193
+ "eval_accuracy": 0.8043478260869565,
194
+ "eval_loss": 0.6354050636291504,
195
+ "eval_runtime": 0.8771,
196
+ "eval_samples_per_second": 52.446,
197
+ "eval_steps_per_second": 2.28,
198
+ "step": 97
199
+ },
200
+ {
201
+ "epoch": 15.38,
202
+ "learning_rate": 1.7794117647058825e-05,
203
+ "loss": 0.422,
204
+ "step": 100
205
+ },
206
+ {
207
+ "epoch": 16.0,
208
+ "eval_accuracy": 0.8695652173913043,
209
+ "eval_loss": 0.5129868388175964,
210
+ "eval_runtime": 0.7568,
211
+ "eval_samples_per_second": 60.785,
212
+ "eval_steps_per_second": 2.643,
213
+ "step": 104
214
+ },
215
+ {
216
+ "epoch": 16.92,
217
+ "learning_rate": 1.375e-05,
218
+ "loss": 0.3546,
219
+ "step": 110
220
+ },
221
+ {
222
+ "epoch": 16.92,
223
+ "eval_accuracy": 0.8695652173913043,
224
+ "eval_loss": 0.5302236676216125,
225
+ "eval_runtime": 0.7453,
226
+ "eval_samples_per_second": 61.721,
227
+ "eval_steps_per_second": 2.684,
228
+ "step": 110
229
+ },
230
+ {
231
+ "epoch": 18.0,
232
+ "eval_accuracy": 0.9130434782608695,
233
+ "eval_loss": 0.4435981810092926,
234
+ "eval_runtime": 0.7717,
235
+ "eval_samples_per_second": 59.607,
236
+ "eval_steps_per_second": 2.592,
237
+ "step": 117
238
+ },
239
+ {
240
+ "epoch": 18.46,
241
+ "learning_rate": 9.705882352941177e-06,
242
+ "loss": 0.3353,
243
+ "step": 120
244
+ },
245
+ {
246
+ "epoch": 18.92,
247
+ "eval_accuracy": 0.8260869565217391,
248
+ "eval_loss": 0.5620782375335693,
249
+ "eval_runtime": 0.7372,
250
+ "eval_samples_per_second": 62.402,
251
+ "eval_steps_per_second": 2.713,
252
+ "step": 123
253
+ },
254
+ {
255
+ "epoch": 20.0,
256
+ "learning_rate": 5.661764705882353e-06,
257
+ "loss": 0.3106,
258
+ "step": 130
259
+ },
260
+ {
261
+ "epoch": 20.0,
262
+ "eval_accuracy": 0.8695652173913043,
263
+ "eval_loss": 0.4911867082118988,
264
+ "eval_runtime": 0.7695,
265
+ "eval_samples_per_second": 59.776,
266
+ "eval_steps_per_second": 2.599,
267
+ "step": 130
268
+ },
269
+ {
270
+ "epoch": 20.92,
271
+ "eval_accuracy": 0.8913043478260869,
272
+ "eval_loss": 0.4746726453304291,
273
+ "eval_runtime": 0.8093,
274
+ "eval_samples_per_second": 56.842,
275
+ "eval_steps_per_second": 2.471,
276
+ "step": 136
277
+ },
278
+ {
279
+ "epoch": 21.54,
280
+ "learning_rate": 1.6176470588235295e-06,
281
+ "loss": 0.312,
282
+ "step": 140
283
+ },
284
+ {
285
+ "epoch": 22.0,
286
+ "eval_accuracy": 0.8913043478260869,
287
+ "eval_loss": 0.46030691266059875,
288
+ "eval_runtime": 0.7427,
289
+ "eval_samples_per_second": 61.935,
290
+ "eval_steps_per_second": 2.693,
291
+ "step": 143
292
+ },
293
+ {
294
+ "epoch": 22.15,
295
+ "eval_accuracy": 0.8913043478260869,
296
+ "eval_loss": 0.4597944915294647,
297
+ "eval_runtime": 0.7386,
298
+ "eval_samples_per_second": 62.279,
299
+ "eval_steps_per_second": 2.708,
300
+ "step": 144
301
+ },
302
+ {
303
+ "epoch": 22.15,
304
+ "step": 144,
305
+ "total_flos": 1.4061948496538665e+18,
306
+ "train_loss": 0.689174536201689,
307
+ "train_runtime": 307.4489,
308
+ "train_samples_per_second": 63.933,
309
+ "train_steps_per_second": 0.468
310
+ }
311
+ ],
312
+ "logging_steps": 10,
313
+ "max_steps": 144,
314
+ "num_input_tokens_seen": 0,
315
+ "num_train_epochs": 24,
316
+ "save_steps": 500,
317
+ "total_flos": 1.4061948496538665e+18,
318
+ "train_batch_size": 32,
319
+ "trial_name": null,
320
+ "trial_params": null
321
+ }