vuongnhathien commited on
Commit
9ec962f
1 Parent(s): cae8610

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.8878727634194831
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.3921
36
- - Accuracy: 0.8879
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.9021825396825397
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.3568
36
+ - Accuracy: 0.9022
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "total_flos": 1.3627285673563054e+19,
4
+ "train_loss": 0.8061258281360973,
5
+ "train_runtime": 7150.5683,
6
+ "train_samples_per_second": 24.587,
7
+ "train_steps_per_second": 0.385
8
+ }
runs/May27_06-51-20_c5e46e9fa53c/events.out.tfevents.1716800038.c5e46e9fa53c.24.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9caa326269a7bab82ca52cc5322987c1b3e330d23334737a6188b13e22551bc5
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "total_flos": 1.3627285673563054e+19,
4
+ "train_loss": 0.8061258281360973,
5
+ "train_runtime": 7150.5683,
6
+ "train_samples_per_second": 24.587,
7
+ "train_steps_per_second": 0.385
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,309 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.3921276926994324,
3
+ "best_model_checkpoint": "./vit-base-3e-5-randaug/checkpoint-2750",
4
+ "epoch": 10.0,
5
+ "eval_steps": 500,
6
+ "global_step": 2750,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.36,
13
+ "grad_norm": 4.155110836029053,
14
+ "learning_rate": 2.9902226030228252e-05,
15
+ "loss": 2.7863,
16
+ "step": 100
17
+ },
18
+ {
19
+ "epoch": 0.73,
20
+ "grad_norm": 4.886130332946777,
21
+ "learning_rate": 2.9610178754135005e-05,
22
+ "loss": 1.6815,
23
+ "step": 200
24
+ },
25
+ {
26
+ "epoch": 1.0,
27
+ "eval_accuracy": 0.7737574552683897,
28
+ "eval_loss": 0.9074916839599609,
29
+ "eval_runtime": 54.9169,
30
+ "eval_samples_per_second": 45.796,
31
+ "eval_steps_per_second": 0.728,
32
+ "step": 275
33
+ },
34
+ {
35
+ "epoch": 1.09,
36
+ "grad_norm": 4.915349960327148,
37
+ "learning_rate": 2.9127665454592872e-05,
38
+ "loss": 1.2844,
39
+ "step": 300
40
+ },
41
+ {
42
+ "epoch": 1.45,
43
+ "grad_norm": 4.22341775894165,
44
+ "learning_rate": 2.8460976430370375e-05,
45
+ "loss": 1.06,
46
+ "step": 400
47
+ },
48
+ {
49
+ "epoch": 1.82,
50
+ "grad_norm": 4.15113639831543,
51
+ "learning_rate": 2.7618802992467718e-05,
52
+ "loss": 0.9759,
53
+ "step": 500
54
+ },
55
+ {
56
+ "epoch": 2.0,
57
+ "eval_accuracy": 0.8500994035785289,
58
+ "eval_loss": 0.5867449641227722,
59
+ "eval_runtime": 54.5476,
60
+ "eval_samples_per_second": 46.106,
61
+ "eval_steps_per_second": 0.733,
62
+ "step": 550
63
+ },
64
+ {
65
+ "epoch": 2.18,
66
+ "grad_norm": 4.799998760223389,
67
+ "learning_rate": 2.661212415958624e-05,
68
+ "loss": 0.9053,
69
+ "step": 600
70
+ },
71
+ {
72
+ "epoch": 2.55,
73
+ "grad_norm": 4.3418684005737305,
74
+ "learning_rate": 2.5454063529829405e-05,
75
+ "loss": 0.8298,
76
+ "step": 700
77
+ },
78
+ {
79
+ "epoch": 2.91,
80
+ "grad_norm": 4.906313896179199,
81
+ "learning_rate": 2.4159718194531573e-05,
82
+ "loss": 0.7955,
83
+ "step": 800
84
+ },
85
+ {
86
+ "epoch": 3.0,
87
+ "eval_accuracy": 0.8548707753479126,
88
+ "eval_loss": 0.5190673470497131,
89
+ "eval_runtime": 55.308,
90
+ "eval_samples_per_second": 45.473,
91
+ "eval_steps_per_second": 0.723,
92
+ "step": 825
93
+ },
94
+ {
95
+ "epoch": 3.27,
96
+ "grad_norm": 5.728692531585693,
97
+ "learning_rate": 2.274596192458443e-05,
98
+ "loss": 0.7404,
99
+ "step": 900
100
+ },
101
+ {
102
+ "epoch": 3.64,
103
+ "grad_norm": 4.377862453460693,
104
+ "learning_rate": 2.12312251950283e-05,
105
+ "loss": 0.7126,
106
+ "step": 1000
107
+ },
108
+ {
109
+ "epoch": 4.0,
110
+ "grad_norm": 4.678811550140381,
111
+ "learning_rate": 1.963525491562421e-05,
112
+ "loss": 0.7056,
113
+ "step": 1100
114
+ },
115
+ {
116
+ "epoch": 4.0,
117
+ "eval_accuracy": 0.8755467196819086,
118
+ "eval_loss": 0.45482131838798523,
119
+ "eval_runtime": 55.04,
120
+ "eval_samples_per_second": 45.694,
121
+ "eval_steps_per_second": 0.727,
122
+ "step": 1100
123
+ },
124
+ {
125
+ "epoch": 4.36,
126
+ "grad_norm": 4.7580246925354,
127
+ "learning_rate": 1.7978856999686182e-05,
128
+ "loss": 0.6839,
129
+ "step": 1200
130
+ },
131
+ {
132
+ "epoch": 4.73,
133
+ "grad_norm": 4.103386878967285,
134
+ "learning_rate": 1.6283625127182596e-05,
135
+ "loss": 0.6455,
136
+ "step": 1300
137
+ },
138
+ {
139
+ "epoch": 5.0,
140
+ "eval_accuracy": 0.8854870775347913,
141
+ "eval_loss": 0.42557355761528015,
142
+ "eval_runtime": 55.0116,
143
+ "eval_samples_per_second": 45.718,
144
+ "eval_steps_per_second": 0.727,
145
+ "step": 1375
146
+ },
147
+ {
148
+ "epoch": 5.09,
149
+ "grad_norm": 4.85685396194458,
150
+ "learning_rate": 1.4571659238094557e-05,
151
+ "loss": 0.6445,
152
+ "step": 1400
153
+ },
154
+ {
155
+ "epoch": 5.45,
156
+ "grad_norm": 4.542230606079102,
157
+ "learning_rate": 1.2865277425900725e-05,
158
+ "loss": 0.5996,
159
+ "step": 1500
160
+ },
161
+ {
162
+ "epoch": 5.82,
163
+ "grad_norm": 3.4589812755584717,
164
+ "learning_rate": 1.11867249870977e-05,
165
+ "loss": 0.6249,
166
+ "step": 1600
167
+ },
168
+ {
169
+ "epoch": 6.0,
170
+ "eval_accuracy": 0.8846918489065606,
171
+ "eval_loss": 0.411356657743454,
172
+ "eval_runtime": 54.1236,
173
+ "eval_samples_per_second": 46.468,
174
+ "eval_steps_per_second": 0.739,
175
+ "step": 1650
176
+ },
177
+ {
178
+ "epoch": 6.18,
179
+ "grad_norm": 3.62654972076416,
180
+ "learning_rate": 9.557884419740387e-06,
181
+ "loss": 0.6076,
182
+ "step": 1700
183
+ },
184
+ {
185
+ "epoch": 6.55,
186
+ "grad_norm": 4.838754177093506,
187
+ "learning_rate": 7.999990151614895e-06,
188
+ "loss": 0.5802,
189
+ "step": 1800
190
+ },
191
+ {
192
+ "epoch": 6.91,
193
+ "grad_norm": 4.127110004425049,
194
+ "learning_rate": 6.533351716998466e-06,
195
+ "loss": 0.5742,
196
+ "step": 1900
197
+ },
198
+ {
199
+ "epoch": 7.0,
200
+ "eval_accuracy": 0.8874751491053678,
201
+ "eval_loss": 0.4025728404521942,
202
+ "eval_runtime": 54.4896,
203
+ "eval_samples_per_second": 46.156,
204
+ "eval_steps_per_second": 0.734,
205
+ "step": 1925
206
+ },
207
+ {
208
+ "epoch": 7.27,
209
+ "grad_norm": 3.6499452590942383,
210
+ "learning_rate": 5.177088990820725e-06,
211
+ "loss": 0.5646,
212
+ "step": 2000
213
+ },
214
+ {
215
+ "epoch": 7.64,
216
+ "grad_norm": 3.194026231765747,
217
+ "learning_rate": 3.948882931853924e-06,
218
+ "loss": 0.5627,
219
+ "step": 2100
220
+ },
221
+ {
222
+ "epoch": 8.0,
223
+ "grad_norm": 4.581117630004883,
224
+ "learning_rate": 2.86474508437579e-06,
225
+ "loss": 0.5782,
226
+ "step": 2200
227
+ },
228
+ {
229
+ "epoch": 8.0,
230
+ "eval_accuracy": 0.890258449304175,
231
+ "eval_loss": 0.3943153917789459,
232
+ "eval_runtime": 54.2999,
233
+ "eval_samples_per_second": 46.317,
234
+ "eval_steps_per_second": 0.737,
235
+ "step": 2200
236
+ },
237
+ {
238
+ "epoch": 8.36,
239
+ "grad_norm": 4.3230791091918945,
240
+ "learning_rate": 1.9388088432033446e-06,
241
+ "loss": 0.5551,
242
+ "step": 2300
243
+ },
244
+ {
245
+ "epoch": 8.73,
246
+ "grad_norm": 4.666913032531738,
247
+ "learning_rate": 1.1831452032772499e-06,
248
+ "loss": 0.5383,
249
+ "step": 2400
250
+ },
251
+ {
252
+ "epoch": 9.0,
253
+ "eval_accuracy": 0.8882703777335984,
254
+ "eval_loss": 0.3928951919078827,
255
+ "eval_runtime": 54.0056,
256
+ "eval_samples_per_second": 46.569,
257
+ "eval_steps_per_second": 0.741,
258
+ "step": 2475
259
+ },
260
+ {
261
+ "epoch": 9.09,
262
+ "grad_norm": 5.079577922821045,
263
+ "learning_rate": 6.076053957825411e-07,
264
+ "loss": 0.5563,
265
+ "step": 2500
266
+ },
267
+ {
268
+ "epoch": 9.45,
269
+ "grad_norm": 4.677091598510742,
270
+ "learning_rate": 2.1969246228460526e-07,
271
+ "loss": 0.5505,
272
+ "step": 2600
273
+ },
274
+ {
275
+ "epoch": 9.82,
276
+ "grad_norm": 2.785017967224121,
277
+ "learning_rate": 2.4463441107965278e-08,
278
+ "loss": 0.5495,
279
+ "step": 2700
280
+ },
281
+ {
282
+ "epoch": 10.0,
283
+ "eval_accuracy": 0.8878727634194831,
284
+ "eval_loss": 0.3921276926994324,
285
+ "eval_runtime": 55.0192,
286
+ "eval_samples_per_second": 45.711,
287
+ "eval_steps_per_second": 0.727,
288
+ "step": 2750
289
+ },
290
+ {
291
+ "epoch": 10.0,
292
+ "step": 2750,
293
+ "total_flos": 1.3627285673563054e+19,
294
+ "train_loss": 0.8061258281360973,
295
+ "train_runtime": 7150.5683,
296
+ "train_samples_per_second": 24.587,
297
+ "train_steps_per_second": 0.385
298
+ }
299
+ ],
300
+ "logging_steps": 100,
301
+ "max_steps": 2750,
302
+ "num_input_tokens_seen": 0,
303
+ "num_train_epochs": 10,
304
+ "save_steps": 500,
305
+ "total_flos": 1.3627285673563054e+19,
306
+ "train_batch_size": 64,
307
+ "trial_name": null,
308
+ "trial_params": null
309
+ }