vuongnhathien commited on
Commit
334e0a8
1 Parent(s): 6be9957

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.9204771371769384
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [facebook/convnextv2-nano-22k-384](https://huggingface.co/facebook/convnextv2-nano-22k-384) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.2866
36
- - Accuracy: 0.9205
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.9275793650793651
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [facebook/convnextv2-nano-22k-384](https://huggingface.co/facebook/convnextv2-nano-22k-384) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.2728
36
+ - Accuracy: 0.9276
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "total_flos": 7.000491898906214e+18,
4
+ "train_loss": 0.3542752295407382,
5
+ "train_runtime": 6594.6916,
6
+ "train_samples_per_second": 26.659,
7
+ "train_steps_per_second": 0.417
8
+ }
runs/May23_16-45-33_a8d550d17b97/events.out.tfevents.1716489537.a8d550d17b97.23.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e70f09d596da8464b893ae11127c50c02712d8c5a08ed066de1a6614d8c6487
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "total_flos": 7.000491898906214e+18,
4
+ "train_loss": 0.3542752295407382,
5
+ "train_runtime": 6594.6916,
6
+ "train_samples_per_second": 26.659,
7
+ "train_steps_per_second": 0.417
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,309 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.2866075932979584,
3
+ "best_model_checkpoint": "./convnext-nano-1e-4-augment/checkpoint-2750",
4
+ "epoch": 10.0,
5
+ "eval_steps": 500,
6
+ "global_step": 2750,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.36,
13
+ "grad_norm": 11.396906852722168,
14
+ "learning_rate": 9.967408676742751e-05,
15
+ "loss": 1.7369,
16
+ "step": 100
17
+ },
18
+ {
19
+ "epoch": 0.73,
20
+ "grad_norm": 14.72342300415039,
21
+ "learning_rate": 9.870059584711668e-05,
22
+ "loss": 0.8282,
23
+ "step": 200
24
+ },
25
+ {
26
+ "epoch": 1.0,
27
+ "eval_accuracy": 0.8536779324055666,
28
+ "eval_loss": 0.5148155689239502,
29
+ "eval_runtime": 61.4101,
30
+ "eval_samples_per_second": 40.954,
31
+ "eval_steps_per_second": 0.651,
32
+ "step": 275
33
+ },
34
+ {
35
+ "epoch": 1.09,
36
+ "grad_norm": 16.179250717163086,
37
+ "learning_rate": 9.709221818197624e-05,
38
+ "loss": 0.6581,
39
+ "step": 300
40
+ },
41
+ {
42
+ "epoch": 1.45,
43
+ "grad_norm": 10.215620994567871,
44
+ "learning_rate": 9.486992143456792e-05,
45
+ "loss": 0.5141,
46
+ "step": 400
47
+ },
48
+ {
49
+ "epoch": 1.82,
50
+ "grad_norm": 8.687200546264648,
51
+ "learning_rate": 9.206267664155907e-05,
52
+ "loss": 0.5209,
53
+ "step": 500
54
+ },
55
+ {
56
+ "epoch": 2.0,
57
+ "eval_accuracy": 0.88389662027833,
58
+ "eval_loss": 0.4150846004486084,
59
+ "eval_runtime": 61.5346,
60
+ "eval_samples_per_second": 40.871,
61
+ "eval_steps_per_second": 0.65,
62
+ "step": 550
63
+ },
64
+ {
65
+ "epoch": 2.18,
66
+ "grad_norm": 10.711565971374512,
67
+ "learning_rate": 8.870708053195413e-05,
68
+ "loss": 0.4456,
69
+ "step": 600
70
+ },
71
+ {
72
+ "epoch": 2.55,
73
+ "grad_norm": 9.642666816711426,
74
+ "learning_rate": 8.484687843276469e-05,
75
+ "loss": 0.4067,
76
+ "step": 700
77
+ },
78
+ {
79
+ "epoch": 2.91,
80
+ "grad_norm": 11.507894515991211,
81
+ "learning_rate": 8.053239398177191e-05,
82
+ "loss": 0.3867,
83
+ "step": 800
84
+ },
85
+ {
86
+ "epoch": 3.0,
87
+ "eval_accuracy": 0.9009940357852882,
88
+ "eval_loss": 0.3642739951610565,
89
+ "eval_runtime": 61.3025,
90
+ "eval_samples_per_second": 41.026,
91
+ "eval_steps_per_second": 0.653,
92
+ "step": 825
93
+ },
94
+ {
95
+ "epoch": 3.27,
96
+ "grad_norm": 13.279052734375,
97
+ "learning_rate": 7.58198730819481e-05,
98
+ "loss": 0.3452,
99
+ "step": 900
100
+ },
101
+ {
102
+ "epoch": 3.64,
103
+ "grad_norm": 9.233952522277832,
104
+ "learning_rate": 7.077075065009433e-05,
105
+ "loss": 0.3216,
106
+ "step": 1000
107
+ },
108
+ {
109
+ "epoch": 4.0,
110
+ "grad_norm": 9.883641242980957,
111
+ "learning_rate": 6.545084971874738e-05,
112
+ "loss": 0.3183,
113
+ "step": 1100
114
+ },
115
+ {
116
+ "epoch": 4.0,
117
+ "eval_accuracy": 0.9049701789264414,
118
+ "eval_loss": 0.3240828812122345,
119
+ "eval_runtime": 61.2041,
120
+ "eval_samples_per_second": 41.092,
121
+ "eval_steps_per_second": 0.654,
122
+ "step": 1100
123
+ },
124
+ {
125
+ "epoch": 4.36,
126
+ "grad_norm": 10.317498207092285,
127
+ "learning_rate": 5.992952333228728e-05,
128
+ "loss": 0.2789,
129
+ "step": 1200
130
+ },
131
+ {
132
+ "epoch": 4.73,
133
+ "grad_norm": 6.958377838134766,
134
+ "learning_rate": 5.427875042394199e-05,
135
+ "loss": 0.2679,
136
+ "step": 1300
137
+ },
138
+ {
139
+ "epoch": 5.0,
140
+ "eval_accuracy": 0.904572564612326,
141
+ "eval_loss": 0.32900604605674744,
142
+ "eval_runtime": 61.4874,
143
+ "eval_samples_per_second": 40.903,
144
+ "eval_steps_per_second": 0.651,
145
+ "step": 1375
146
+ },
147
+ {
148
+ "epoch": 5.09,
149
+ "grad_norm": 7.9765119552612305,
150
+ "learning_rate": 4.85721974603152e-05,
151
+ "loss": 0.261,
152
+ "step": 1400
153
+ },
154
+ {
155
+ "epoch": 5.45,
156
+ "grad_norm": 6.655781269073486,
157
+ "learning_rate": 4.288425808633575e-05,
158
+ "loss": 0.2243,
159
+ "step": 1500
160
+ },
161
+ {
162
+ "epoch": 5.82,
163
+ "grad_norm": 9.778780937194824,
164
+ "learning_rate": 3.728908329032567e-05,
165
+ "loss": 0.2364,
166
+ "step": 1600
167
+ },
168
+ {
169
+ "epoch": 6.0,
170
+ "eval_accuracy": 0.9137176938369781,
171
+ "eval_loss": 0.30884459614753723,
172
+ "eval_runtime": 61.4411,
173
+ "eval_samples_per_second": 40.934,
174
+ "eval_steps_per_second": 0.651,
175
+ "step": 1650
176
+ },
177
+ {
178
+ "epoch": 6.18,
179
+ "grad_norm": 6.904848098754883,
180
+ "learning_rate": 3.1859614732467954e-05,
181
+ "loss": 0.2176,
182
+ "step": 1700
183
+ },
184
+ {
185
+ "epoch": 6.55,
186
+ "grad_norm": 6.360904216766357,
187
+ "learning_rate": 2.6666633838716314e-05,
188
+ "loss": 0.1943,
189
+ "step": 1800
190
+ },
191
+ {
192
+ "epoch": 6.91,
193
+ "grad_norm": 9.572250366210938,
194
+ "learning_rate": 2.1777839056661554e-05,
195
+ "loss": 0.1981,
196
+ "step": 1900
197
+ },
198
+ {
199
+ "epoch": 7.0,
200
+ "eval_accuracy": 0.9137176938369781,
201
+ "eval_loss": 0.29816073179244995,
202
+ "eval_runtime": 62.0018,
203
+ "eval_samples_per_second": 40.563,
204
+ "eval_steps_per_second": 0.645,
205
+ "step": 1925
206
+ },
207
+ {
208
+ "epoch": 7.27,
209
+ "grad_norm": 4.384122371673584,
210
+ "learning_rate": 1.725696330273575e-05,
211
+ "loss": 0.1778,
212
+ "step": 2000
213
+ },
214
+ {
215
+ "epoch": 7.64,
216
+ "grad_norm": 7.344178199768066,
217
+ "learning_rate": 1.3162943106179749e-05,
218
+ "loss": 0.1692,
219
+ "step": 2100
220
+ },
221
+ {
222
+ "epoch": 8.0,
223
+ "grad_norm": 5.066224575042725,
224
+ "learning_rate": 9.549150281252633e-06,
225
+ "loss": 0.1704,
226
+ "step": 2200
227
+ },
228
+ {
229
+ "epoch": 8.0,
230
+ "eval_accuracy": 0.9168986083499006,
231
+ "eval_loss": 0.2899409532546997,
232
+ "eval_runtime": 61.3116,
233
+ "eval_samples_per_second": 41.02,
234
+ "eval_steps_per_second": 0.652,
235
+ "step": 2200
236
+ },
237
+ {
238
+ "epoch": 8.36,
239
+ "grad_norm": 7.729918003082275,
240
+ "learning_rate": 6.462696144011149e-06,
241
+ "loss": 0.1627,
242
+ "step": 2300
243
+ },
244
+ {
245
+ "epoch": 8.73,
246
+ "grad_norm": 9.76986312866211,
247
+ "learning_rate": 3.9438173442575e-06,
248
+ "loss": 0.1572,
249
+ "step": 2400
250
+ },
251
+ {
252
+ "epoch": 9.0,
253
+ "eval_accuracy": 0.920079522862823,
254
+ "eval_loss": 0.2868165671825409,
255
+ "eval_runtime": 61.3101,
256
+ "eval_samples_per_second": 41.021,
257
+ "eval_steps_per_second": 0.652,
258
+ "step": 2475
259
+ },
260
+ {
261
+ "epoch": 9.09,
262
+ "grad_norm": 7.546455383300781,
263
+ "learning_rate": 2.0253513192751373e-06,
264
+ "loss": 0.1548,
265
+ "step": 2500
266
+ },
267
+ {
268
+ "epoch": 9.45,
269
+ "grad_norm": 8.111244201660156,
270
+ "learning_rate": 7.323082076153509e-07,
271
+ "loss": 0.1519,
272
+ "step": 2600
273
+ },
274
+ {
275
+ "epoch": 9.82,
276
+ "grad_norm": 8.917200088500977,
277
+ "learning_rate": 8.15448036932176e-08,
278
+ "loss": 0.168,
279
+ "step": 2700
280
+ },
281
+ {
282
+ "epoch": 10.0,
283
+ "eval_accuracy": 0.9204771371769384,
284
+ "eval_loss": 0.2866075932979584,
285
+ "eval_runtime": 61.2534,
286
+ "eval_samples_per_second": 41.059,
287
+ "eval_steps_per_second": 0.653,
288
+ "step": 2750
289
+ },
290
+ {
291
+ "epoch": 10.0,
292
+ "step": 2750,
293
+ "total_flos": 7.000491898906214e+18,
294
+ "train_loss": 0.3542752295407382,
295
+ "train_runtime": 6594.6916,
296
+ "train_samples_per_second": 26.659,
297
+ "train_steps_per_second": 0.417
298
+ }
299
+ ],
300
+ "logging_steps": 100,
301
+ "max_steps": 2750,
302
+ "num_input_tokens_seen": 0,
303
+ "num_train_epochs": 10,
304
+ "save_steps": 500,
305
+ "total_flos": 7.000491898906214e+18,
306
+ "train_batch_size": 64,
307
+ "trial_name": null,
308
+ "trial_params": null
309
+ }