Augusto777 commited on
Commit
2ba9260
1 Parent(s): 6975bce

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7254901960784313
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.7451
36
- - Accuracy: 0.7255
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7843137254901961
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6623
36
+ - Accuracy: 0.7843
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 11.43,
3
- "eval_accuracy": 0.8627450980392157,
4
- "eval_loss": 0.5809429883956909,
5
- "eval_runtime": 1.0773,
6
- "eval_samples_per_second": 47.339,
7
- "eval_steps_per_second": 1.856,
8
- "train_loss": 0.5459669225745731,
9
- "train_runtime": 356.8634,
10
- "train_samples_per_second": 67.589,
11
- "train_steps_per_second": 0.504
12
  }
 
1
  {
2
+ "epoch": 11.61,
3
+ "eval_accuracy": 0.7843137254901961,
4
+ "eval_loss": 0.662259042263031,
5
+ "eval_runtime": 1.0269,
6
+ "eval_samples_per_second": 49.664,
7
+ "eval_steps_per_second": 1.948,
8
+ "train_loss": 0.5402387758096059,
9
+ "train_runtime": 360.9103,
10
+ "train_samples_per_second": 65.401,
11
+ "train_steps_per_second": 0.499
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 11.43,
3
- "eval_accuracy": 0.8627450980392157,
4
- "eval_loss": 0.5809429883956909,
5
- "eval_runtime": 1.0773,
6
- "eval_samples_per_second": 47.339,
7
- "eval_steps_per_second": 1.856
8
  }
 
1
  {
2
+ "epoch": 11.61,
3
+ "eval_accuracy": 0.7843137254901961,
4
+ "eval_loss": 0.662259042263031,
5
+ "eval_runtime": 1.0269,
6
+ "eval_samples_per_second": 49.664,
7
+ "eval_steps_per_second": 1.948
8
  }
runs/Jun11_15-23-19_DESKTOP-SKBE9FB/events.out.tfevents.1718141549.DESKTOP-SKBE9FB.6016.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b129bc72976bd7c1e3b2da6c686331fcb9716031d010fbe8ceb12baa104120
3
+ size 411
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 11.43,
3
- "train_loss": 0.5459669225745731,
4
- "train_runtime": 356.8634,
5
- "train_samples_per_second": 67.589,
6
- "train_steps_per_second": 0.504
7
  }
 
1
  {
2
+ "epoch": 11.61,
3
+ "train_loss": 0.5402387758096059,
4
+ "train_runtime": 360.9103,
5
+ "train_samples_per_second": 65.401,
6
+ "train_steps_per_second": 0.499
7
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.8627450980392157,
3
- "best_model_checkpoint": "vit-base-patch16-224-ve-U10-12\\checkpoint-94",
4
- "epoch": 11.428571428571429,
5
  "eval_steps": 500,
6
  "global_step": 180,
7
  "is_hyper_param_search": false,
@@ -9,229 +9,229 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.63,
13
  "learning_rate": 5.467836257309941e-05,
14
- "loss": 1.3634,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 0.95,
19
- "eval_accuracy": 0.49019607843137253,
20
- "eval_loss": 1.228261113166809,
21
- "eval_runtime": 0.912,
22
- "eval_samples_per_second": 55.923,
23
- "eval_steps_per_second": 2.193,
24
  "step": 15
25
  },
26
  {
27
- "epoch": 1.27,
28
  "learning_rate": 5.1461988304093566e-05,
29
- "loss": 1.2422,
30
  "step": 20
31
  },
32
  {
33
- "epoch": 1.9,
34
  "learning_rate": 4.824561403508772e-05,
35
- "loss": 1.099,
36
  "step": 30
37
  },
38
  {
39
- "epoch": 1.97,
40
- "eval_accuracy": 0.6274509803921569,
41
- "eval_loss": 1.009804606437683,
42
- "eval_runtime": 0.7828,
43
- "eval_samples_per_second": 65.149,
44
- "eval_steps_per_second": 2.555,
45
  "step": 31
46
  },
47
  {
48
- "epoch": 2.54,
49
  "learning_rate": 4.502923976608187e-05,
50
- "loss": 0.9373,
51
  "step": 40
52
  },
53
  {
54
- "epoch": 2.98,
55
- "eval_accuracy": 0.6666666666666666,
56
- "eval_loss": 0.8729690909385681,
57
- "eval_runtime": 0.7821,
58
- "eval_samples_per_second": 65.206,
59
- "eval_steps_per_second": 2.557,
60
- "step": 47
61
  },
62
  {
63
- "epoch": 3.17,
64
  "learning_rate": 4.1812865497076025e-05,
65
- "loss": 0.8023,
66
  "step": 50
67
  },
68
  {
69
- "epoch": 3.81,
70
  "learning_rate": 3.859649122807018e-05,
71
- "loss": 0.7066,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
- "eval_accuracy": 0.803921568627451,
77
- "eval_loss": 0.6674012541770935,
78
- "eval_runtime": 0.7999,
79
- "eval_samples_per_second": 63.759,
80
- "eval_steps_per_second": 2.5,
81
- "step": 63
82
  },
83
  {
84
- "epoch": 4.44,
85
  "learning_rate": 3.5380116959064324e-05,
86
- "loss": 0.6035,
87
  "step": 70
88
  },
89
  {
90
- "epoch": 4.95,
91
- "eval_accuracy": 0.7647058823529411,
92
- "eval_loss": 0.6062445044517517,
93
- "eval_runtime": 0.7697,
94
- "eval_samples_per_second": 66.263,
95
- "eval_steps_per_second": 2.599,
96
- "step": 78
97
  },
98
  {
99
- "epoch": 5.08,
100
  "learning_rate": 3.216374269005848e-05,
101
- "loss": 0.5052,
102
  "step": 80
103
  },
104
  {
105
- "epoch": 5.71,
106
  "learning_rate": 2.894736842105263e-05,
107
- "loss": 0.4011,
108
  "step": 90
109
  },
110
  {
111
- "epoch": 5.97,
112
- "eval_accuracy": 0.8627450980392157,
113
- "eval_loss": 0.5809429883956909,
114
- "eval_runtime": 0.7759,
115
- "eval_samples_per_second": 65.729,
116
- "eval_steps_per_second": 2.578,
117
- "step": 94
118
  },
119
  {
120
- "epoch": 6.35,
121
  "learning_rate": 2.5730994152046783e-05,
122
- "loss": 0.3438,
123
  "step": 100
124
  },
125
  {
126
- "epoch": 6.98,
127
- "learning_rate": 2.2514619883040936e-05,
128
- "loss": 0.2799,
129
- "step": 110
 
 
 
130
  },
131
  {
132
- "epoch": 6.98,
133
- "eval_accuracy": 0.803921568627451,
134
- "eval_loss": 0.623532235622406,
135
- "eval_runtime": 0.8145,
136
- "eval_samples_per_second": 62.613,
137
- "eval_steps_per_second": 2.455,
138
  "step": 110
139
  },
140
  {
141
- "epoch": 7.62,
142
  "learning_rate": 1.929824561403509e-05,
143
- "loss": 0.2572,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
- "eval_accuracy": 0.7647058823529411,
149
- "eval_loss": 0.669582724571228,
150
- "eval_runtime": 0.778,
151
- "eval_samples_per_second": 65.555,
152
- "eval_steps_per_second": 2.571,
153
- "step": 126
154
  },
155
  {
156
- "epoch": 8.25,
157
  "learning_rate": 1.608187134502924e-05,
158
- "loss": 0.2402,
159
  "step": 130
160
  },
161
  {
162
- "epoch": 8.89,
163
- "learning_rate": 1.2865497076023392e-05,
164
- "loss": 0.2384,
165
- "step": 140
 
 
 
166
  },
167
  {
168
- "epoch": 8.95,
169
- "eval_accuracy": 0.7647058823529411,
170
- "eval_loss": 0.6868889927864075,
171
- "eval_runtime": 0.7916,
172
- "eval_samples_per_second": 64.426,
173
- "eval_steps_per_second": 2.526,
174
- "step": 141
175
  },
176
  {
177
- "epoch": 9.52,
178
  "learning_rate": 9.649122807017545e-06,
179
- "loss": 0.2104,
180
  "step": 150
181
  },
182
  {
183
- "epoch": 9.97,
184
- "eval_accuracy": 0.7254901960784313,
185
- "eval_loss": 0.7198700308799744,
186
- "eval_runtime": 0.7795,
187
- "eval_samples_per_second": 65.43,
188
- "eval_steps_per_second": 2.566,
189
- "step": 157
190
  },
191
  {
192
- "epoch": 10.16,
193
  "learning_rate": 6.432748538011696e-06,
194
- "loss": 0.2159,
195
  "step": 160
196
  },
197
  {
198
- "epoch": 10.79,
199
  "learning_rate": 3.216374269005848e-06,
200
- "loss": 0.1894,
201
  "step": 170
202
  },
203
  {
204
- "epoch": 10.98,
205
- "eval_accuracy": 0.8431372549019608,
206
- "eval_loss": 0.5567971467971802,
207
- "eval_runtime": 0.7722,
208
- "eval_samples_per_second": 66.043,
209
- "eval_steps_per_second": 2.59,
210
- "step": 173
211
  },
212
  {
213
- "epoch": 11.43,
214
  "learning_rate": 0.0,
215
- "loss": 0.1917,
216
  "step": 180
217
  },
218
  {
219
- "epoch": 11.43,
220
- "eval_accuracy": 0.8431372549019608,
221
- "eval_loss": 0.5610877275466919,
222
- "eval_runtime": 0.7721,
223
- "eval_samples_per_second": 66.054,
224
- "eval_steps_per_second": 2.59,
225
  "step": 180
226
  },
227
  {
228
- "epoch": 11.43,
229
  "step": 180,
230
- "total_flos": 1.7803328819545866e+18,
231
- "train_loss": 0.5459669225745731,
232
- "train_runtime": 356.8634,
233
- "train_samples_per_second": 67.589,
234
- "train_steps_per_second": 0.504
235
  }
236
  ],
237
  "logging_steps": 10,
@@ -239,7 +239,7 @@
239
  "num_input_tokens_seen": 0,
240
  "num_train_epochs": 12,
241
  "save_steps": 500,
242
- "total_flos": 1.7803328819545866e+18,
243
  "train_batch_size": 32,
244
  "trial_name": null,
245
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.7843137254901961,
3
+ "best_model_checkpoint": "vit-base-patch16-224-ve-U10-12\\checkpoint-108",
4
+ "epoch": 11.612903225806452,
5
  "eval_steps": 500,
6
  "global_step": 180,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.65,
13
  "learning_rate": 5.467836257309941e-05,
14
+ "loss": 1.3659,
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 0.97,
19
+ "eval_accuracy": 0.47058823529411764,
20
+ "eval_loss": 1.2287312746047974,
21
+ "eval_runtime": 0.9667,
22
+ "eval_samples_per_second": 52.757,
23
+ "eval_steps_per_second": 2.069,
24
  "step": 15
25
  },
26
  {
27
+ "epoch": 1.29,
28
  "learning_rate": 5.1461988304093566e-05,
29
+ "loss": 1.2407,
30
  "step": 20
31
  },
32
  {
33
+ "epoch": 1.94,
34
  "learning_rate": 4.824561403508772e-05,
35
+ "loss": 1.1063,
36
  "step": 30
37
  },
38
  {
39
+ "epoch": 2.0,
40
+ "eval_accuracy": 0.6862745098039216,
41
+ "eval_loss": 1.0233995914459229,
42
+ "eval_runtime": 0.8689,
43
+ "eval_samples_per_second": 58.697,
44
+ "eval_steps_per_second": 2.302,
45
  "step": 31
46
  },
47
  {
48
+ "epoch": 2.58,
49
  "learning_rate": 4.502923976608187e-05,
50
+ "loss": 0.9468,
51
  "step": 40
52
  },
53
  {
54
+ "epoch": 2.97,
55
+ "eval_accuracy": 0.6862745098039216,
56
+ "eval_loss": 0.8665008544921875,
57
+ "eval_runtime": 0.8118,
58
+ "eval_samples_per_second": 62.826,
59
+ "eval_steps_per_second": 2.464,
60
+ "step": 46
61
  },
62
  {
63
+ "epoch": 3.23,
64
  "learning_rate": 4.1812865497076025e-05,
65
+ "loss": 0.8276,
66
  "step": 50
67
  },
68
  {
69
+ "epoch": 3.87,
70
  "learning_rate": 3.859649122807018e-05,
71
+ "loss": 0.6825,
72
  "step": 60
73
  },
74
  {
75
  "epoch": 4.0,
76
+ "eval_accuracy": 0.7058823529411765,
77
+ "eval_loss": 0.7481548190116882,
78
+ "eval_runtime": 0.7724,
79
+ "eval_samples_per_second": 66.031,
80
+ "eval_steps_per_second": 2.589,
81
+ "step": 62
82
  },
83
  {
84
+ "epoch": 4.52,
85
  "learning_rate": 3.5380116959064324e-05,
86
+ "loss": 0.5534,
87
  "step": 70
88
  },
89
  {
90
+ "epoch": 4.97,
91
+ "eval_accuracy": 0.7058823529411765,
92
+ "eval_loss": 0.7608624696731567,
93
+ "eval_runtime": 0.8338,
94
+ "eval_samples_per_second": 61.167,
95
+ "eval_steps_per_second": 2.399,
96
+ "step": 77
97
  },
98
  {
99
+ "epoch": 5.16,
100
  "learning_rate": 3.216374269005848e-05,
101
+ "loss": 0.4733,
102
  "step": 80
103
  },
104
  {
105
+ "epoch": 5.81,
106
  "learning_rate": 2.894736842105263e-05,
107
+ "loss": 0.4019,
108
  "step": 90
109
  },
110
  {
111
+ "epoch": 6.0,
112
+ "eval_accuracy": 0.7254901960784313,
113
+ "eval_loss": 0.7092276215553284,
114
+ "eval_runtime": 0.7947,
115
+ "eval_samples_per_second": 64.177,
116
+ "eval_steps_per_second": 2.517,
117
+ "step": 93
118
  },
119
  {
120
+ "epoch": 6.45,
121
  "learning_rate": 2.5730994152046783e-05,
122
+ "loss": 0.3323,
123
  "step": 100
124
  },
125
  {
126
+ "epoch": 6.97,
127
+ "eval_accuracy": 0.7843137254901961,
128
+ "eval_loss": 0.662259042263031,
129
+ "eval_runtime": 0.7839,
130
+ "eval_samples_per_second": 65.057,
131
+ "eval_steps_per_second": 2.551,
132
+ "step": 108
133
  },
134
  {
135
+ "epoch": 7.1,
136
+ "learning_rate": 2.2514619883040936e-05,
137
+ "loss": 0.2759,
 
 
 
138
  "step": 110
139
  },
140
  {
141
+ "epoch": 7.74,
142
  "learning_rate": 1.929824561403509e-05,
143
+ "loss": 0.2743,
144
  "step": 120
145
  },
146
  {
147
  "epoch": 8.0,
148
+ "eval_accuracy": 0.7058823529411765,
149
+ "eval_loss": 0.7407493591308594,
150
+ "eval_runtime": 0.7753,
151
+ "eval_samples_per_second": 65.783,
152
+ "eval_steps_per_second": 2.58,
153
+ "step": 124
154
  },
155
  {
156
+ "epoch": 8.39,
157
  "learning_rate": 1.608187134502924e-05,
158
+ "loss": 0.2411,
159
  "step": 130
160
  },
161
  {
162
+ "epoch": 8.97,
163
+ "eval_accuracy": 0.7647058823529411,
164
+ "eval_loss": 0.6248741745948792,
165
+ "eval_runtime": 0.8159,
166
+ "eval_samples_per_second": 62.507,
167
+ "eval_steps_per_second": 2.451,
168
+ "step": 139
169
  },
170
  {
171
+ "epoch": 9.03,
172
+ "learning_rate": 1.2865497076023392e-05,
173
+ "loss": 0.2379,
174
+ "step": 140
 
 
 
175
  },
176
  {
177
+ "epoch": 9.68,
178
  "learning_rate": 9.649122807017545e-06,
179
+ "loss": 0.2021,
180
  "step": 150
181
  },
182
  {
183
+ "epoch": 10.0,
184
+ "eval_accuracy": 0.7450980392156863,
185
+ "eval_loss": 0.7221617102622986,
186
+ "eval_runtime": 0.7603,
187
+ "eval_samples_per_second": 67.081,
188
+ "eval_steps_per_second": 2.631,
189
+ "step": 155
190
  },
191
  {
192
+ "epoch": 10.32,
193
  "learning_rate": 6.432748538011696e-06,
194
+ "loss": 0.195,
195
  "step": 160
196
  },
197
  {
198
+ "epoch": 10.97,
199
  "learning_rate": 3.216374269005848e-06,
200
+ "loss": 0.1925,
201
  "step": 170
202
  },
203
  {
204
+ "epoch": 10.97,
205
+ "eval_accuracy": 0.7058823529411765,
206
+ "eval_loss": 0.7807687520980835,
207
+ "eval_runtime": 0.7671,
208
+ "eval_samples_per_second": 66.482,
209
+ "eval_steps_per_second": 2.607,
210
+ "step": 170
211
  },
212
  {
213
+ "epoch": 11.61,
214
  "learning_rate": 0.0,
215
+ "loss": 0.1748,
216
  "step": 180
217
  },
218
  {
219
+ "epoch": 11.61,
220
+ "eval_accuracy": 0.7254901960784313,
221
+ "eval_loss": 0.7451220750808716,
222
+ "eval_runtime": 0.7609,
223
+ "eval_samples_per_second": 67.03,
224
+ "eval_steps_per_second": 2.629,
225
  "step": 180
226
  },
227
  {
228
+ "epoch": 11.61,
229
  "step": 180,
230
+ "total_flos": 1.7709561831334625e+18,
231
+ "train_loss": 0.5402387758096059,
232
+ "train_runtime": 360.9103,
233
+ "train_samples_per_second": 65.401,
234
+ "train_steps_per_second": 0.499
235
  }
236
  ],
237
  "logging_steps": 10,
 
239
  "num_input_tokens_seen": 0,
240
  "num_train_epochs": 12,
241
  "save_steps": 500,
242
+ "total_flos": 1.7709561831334625e+18,
243
  "train_batch_size": 32,
244
  "trial_name": null,
245
  "trial_params": null