Isaskar committed on
Commit
27487c3
1 Parent(s): 1b58577

End of training

Browse files
README.md CHANGED
@@ -23,10 +23,10 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.7563587684069611
27
  - name: F1
28
  type: f1
29
- value: 0.6330645161290323
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -36,9 +36,9 @@ should probably proofread and complete it, then remove this comment. -->
36
 
37
  This model is a fine-tuned version of [facebook/dinov2-base](https://huggingface.co/facebook/dinov2-base) on the imagefolder dataset.
38
  It achieves the following results on the evaluation set:
39
- - Loss: 0.6111
40
- - Accuracy: 0.7564
41
- - F1: 0.6331
42
 
43
  ## Model description
44
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.7188755020080321
27
  - name: F1
28
  type: f1
29
+ value: 0.6332945285215367
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
36
 
37
  This model is a fine-tuned version of [facebook/dinov2-base](https://huggingface.co/facebook/dinov2-base) on the imagefolder dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.5700
40
+ - Accuracy: 0.7189
41
+ - F1: 0.6333
42
 
43
  ## Model description
44
 
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.914691943127962,
3
+ "eval_accuracy": 0.7188755020080321,
4
+ "eval_f1": 0.6332945285215367,
5
+ "eval_loss": 0.5700241923332214,
6
+ "eval_runtime": 52.2777,
7
+ "eval_samples_per_second": 42.867,
8
+ "eval_steps_per_second": 1.358,
9
+ "total_flos": 3.110854122492383e+18,
10
+ "train_loss": 0.474308407268463,
11
+ "train_runtime": 2029.1858,
12
+ "train_samples_per_second": 19.873,
13
+ "train_steps_per_second": 0.154
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.914691943127962,
3
+ "eval_accuracy": 0.7188755020080321,
4
+ "eval_f1": 0.6332945285215367,
5
+ "eval_loss": 0.5700241923332214,
6
+ "eval_runtime": 52.2777,
7
+ "eval_samples_per_second": 42.867,
8
+ "eval_steps_per_second": 1.358
9
+ }
runs/May13_11-57-01_70f368d74d1d/events.out.tfevents.1715603537.70f368d74d1d.204.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25bbaead31902bedc5ee67d8ec832cb76ceda58e19745ffc3ff5aee2322de2ea
3
+ size 457
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.914691943127962,
3
+ "total_flos": 3.110854122492383e+18,
4
+ "train_loss": 0.474308407268463,
5
+ "train_runtime": 2029.1858,
6
+ "train_samples_per_second": 19.873,
7
+ "train_steps_per_second": 0.154
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,307 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.6332945285215367,
3
+ "best_model_checkpoint": "dinov2-base-ODIR-5K/checkpoint-263",
4
+ "epoch": 5.914691943127962,
5
+ "eval_steps": 500,
6
+ "global_step": 312,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.1895734597156398,
13
+ "grad_norm": 151.11000061035156,
14
+ "learning_rate": 1.5625e-05,
15
+ "loss": 0.7609,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.3791469194312796,
20
+ "grad_norm": 34.450782775878906,
21
+ "learning_rate": 3.125e-05,
22
+ "loss": 0.6601,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.5687203791469194,
27
+ "grad_norm": 58.26628112792969,
28
+ "learning_rate": 4.6875e-05,
29
+ "loss": 0.6456,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.7582938388625592,
34
+ "grad_norm": 36.494163513183594,
35
+ "learning_rate": 4.8571428571428576e-05,
36
+ "loss": 0.7091,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 0.9478672985781991,
41
+ "grad_norm": 71.59378051757812,
42
+ "learning_rate": 4.678571428571429e-05,
43
+ "loss": 0.6374,
44
+ "step": 50
45
+ },
46
+ {
47
+ "epoch": 0.985781990521327,
48
+ "eval_accuracy": 0.6778224007139669,
49
+ "eval_f1": 0.20309050772626933,
50
+ "eval_loss": 0.6185599565505981,
51
+ "eval_runtime": 48.0839,
52
+ "eval_samples_per_second": 46.606,
53
+ "eval_steps_per_second": 1.477,
54
+ "step": 52
55
+ },
56
+ {
57
+ "epoch": 1.1374407582938388,
58
+ "grad_norm": 30.247587203979492,
59
+ "learning_rate": 4.5e-05,
60
+ "loss": 0.5721,
61
+ "step": 60
62
+ },
63
+ {
64
+ "epoch": 1.3270142180094786,
65
+ "grad_norm": 39.30122756958008,
66
+ "learning_rate": 4.3214285714285716e-05,
67
+ "loss": 0.6093,
68
+ "step": 70
69
+ },
70
+ {
71
+ "epoch": 1.5165876777251186,
72
+ "grad_norm": 32.839881896972656,
73
+ "learning_rate": 4.1428571428571437e-05,
74
+ "loss": 0.5805,
75
+ "step": 80
76
+ },
77
+ {
78
+ "epoch": 1.7061611374407581,
79
+ "grad_norm": 15.105513572692871,
80
+ "learning_rate": 3.964285714285714e-05,
81
+ "loss": 0.5933,
82
+ "step": 90
83
+ },
84
+ {
85
+ "epoch": 1.8957345971563981,
86
+ "grad_norm": 12.636411666870117,
87
+ "learning_rate": 3.785714285714286e-05,
88
+ "loss": 0.5789,
89
+ "step": 100
90
+ },
91
+ {
92
+ "epoch": 1.9905213270142181,
93
+ "eval_accuracy": 0.715305667112896,
94
+ "eval_f1": 0.3793774319066148,
95
+ "eval_loss": 0.5660730600357056,
96
+ "eval_runtime": 48.0436,
97
+ "eval_samples_per_second": 46.645,
98
+ "eval_steps_per_second": 1.478,
99
+ "step": 105
100
+ },
101
+ {
102
+ "epoch": 2.085308056872038,
103
+ "grad_norm": 10.535428047180176,
104
+ "learning_rate": 3.607142857142857e-05,
105
+ "loss": 0.5118,
106
+ "step": 110
107
+ },
108
+ {
109
+ "epoch": 2.2748815165876777,
110
+ "grad_norm": 20.61358642578125,
111
+ "learning_rate": 3.428571428571429e-05,
112
+ "loss": 0.5222,
113
+ "step": 120
114
+ },
115
+ {
116
+ "epoch": 2.4644549763033177,
117
+ "grad_norm": 16.988859176635742,
118
+ "learning_rate": 3.2500000000000004e-05,
119
+ "loss": 0.552,
120
+ "step": 130
121
+ },
122
+ {
123
+ "epoch": 2.654028436018957,
124
+ "grad_norm": 27.578903198242188,
125
+ "learning_rate": 3.071428571428572e-05,
126
+ "loss": 0.5025,
127
+ "step": 140
128
+ },
129
+ {
130
+ "epoch": 2.843601895734597,
131
+ "grad_norm": 7.29171895980835,
132
+ "learning_rate": 2.8928571428571434e-05,
133
+ "loss": 0.5368,
134
+ "step": 150
135
+ },
136
+ {
137
+ "epoch": 2.995260663507109,
138
+ "eval_accuracy": 0.7407407407407407,
139
+ "eval_f1": 0.5756026296566837,
140
+ "eval_loss": 0.5333759188652039,
141
+ "eval_runtime": 48.0715,
142
+ "eval_samples_per_second": 46.618,
143
+ "eval_steps_per_second": 1.477,
144
+ "step": 158
145
+ },
146
+ {
147
+ "epoch": 3.0331753554502368,
148
+ "grad_norm": 10.034445762634277,
149
+ "learning_rate": 2.714285714285714e-05,
150
+ "loss": 0.4669,
151
+ "step": 160
152
+ },
153
+ {
154
+ "epoch": 3.2227488151658767,
155
+ "grad_norm": 10.450629234313965,
156
+ "learning_rate": 2.5357142857142858e-05,
157
+ "loss": 0.4631,
158
+ "step": 170
159
+ },
160
+ {
161
+ "epoch": 3.4123222748815167,
162
+ "grad_norm": 17.410293579101562,
163
+ "learning_rate": 2.357142857142857e-05,
164
+ "loss": 0.4565,
165
+ "step": 180
166
+ },
167
+ {
168
+ "epoch": 3.6018957345971563,
169
+ "grad_norm": 11.578069686889648,
170
+ "learning_rate": 2.1785714285714288e-05,
171
+ "loss": 0.4292,
172
+ "step": 190
173
+ },
174
+ {
175
+ "epoch": 3.7914691943127963,
176
+ "grad_norm": 12.56495189666748,
177
+ "learning_rate": 2e-05,
178
+ "loss": 0.4289,
179
+ "step": 200
180
+ },
181
+ {
182
+ "epoch": 3.9810426540284363,
183
+ "grad_norm": 11.08157730102539,
184
+ "learning_rate": 1.8214285714285715e-05,
185
+ "loss": 0.4162,
186
+ "step": 210
187
+ },
188
+ {
189
+ "epoch": 4.0,
190
+ "eval_accuracy": 0.6983489513609995,
191
+ "eval_f1": 0.6197975253093364,
192
+ "eval_loss": 0.574705183506012,
193
+ "eval_runtime": 48.2487,
194
+ "eval_samples_per_second": 46.447,
195
+ "eval_steps_per_second": 1.472,
196
+ "step": 211
197
+ },
198
+ {
199
+ "epoch": 4.170616113744076,
200
+ "grad_norm": 16.88544273376465,
201
+ "learning_rate": 1.642857142857143e-05,
202
+ "loss": 0.3839,
203
+ "step": 220
204
+ },
205
+ {
206
+ "epoch": 4.360189573459715,
207
+ "grad_norm": 10.79478931427002,
208
+ "learning_rate": 1.4642857142857144e-05,
209
+ "loss": 0.3881,
210
+ "step": 230
211
+ },
212
+ {
213
+ "epoch": 4.549763033175355,
214
+ "grad_norm": 19.362905502319336,
215
+ "learning_rate": 1.2857142857142857e-05,
216
+ "loss": 0.3377,
217
+ "step": 240
218
+ },
219
+ {
220
+ "epoch": 4.739336492890995,
221
+ "grad_norm": 14.351540565490723,
222
+ "learning_rate": 1.107142857142857e-05,
223
+ "loss": 0.348,
224
+ "step": 250
225
+ },
226
+ {
227
+ "epoch": 4.928909952606635,
228
+ "grad_norm": 12.308573722839355,
229
+ "learning_rate": 9.285714285714286e-06,
230
+ "loss": 0.3679,
231
+ "step": 260
232
+ },
233
+ {
234
+ "epoch": 4.9857819905213265,
235
+ "eval_accuracy": 0.7188755020080321,
236
+ "eval_f1": 0.6332945285215367,
237
+ "eval_loss": 0.5700241923332214,
238
+ "eval_runtime": 48.6206,
239
+ "eval_samples_per_second": 46.092,
240
+ "eval_steps_per_second": 1.46,
241
+ "step": 263
242
+ },
243
+ {
244
+ "epoch": 5.118483412322275,
245
+ "grad_norm": 6.65657377243042,
246
+ "learning_rate": 7.5e-06,
247
+ "loss": 0.3325,
248
+ "step": 270
249
+ },
250
+ {
251
+ "epoch": 5.308056872037914,
252
+ "grad_norm": 14.3682222366333,
253
+ "learning_rate": 5.7142857142857145e-06,
254
+ "loss": 0.2559,
255
+ "step": 280
256
+ },
257
+ {
258
+ "epoch": 5.497630331753554,
259
+ "grad_norm": 14.902679443359375,
260
+ "learning_rate": 3.928571428571429e-06,
261
+ "loss": 0.238,
262
+ "step": 290
263
+ },
264
+ {
265
+ "epoch": 5.687203791469194,
266
+ "grad_norm": 12.136739730834961,
267
+ "learning_rate": 2.142857142857143e-06,
268
+ "loss": 0.2202,
269
+ "step": 300
270
+ },
271
+ {
272
+ "epoch": 5.876777251184834,
273
+ "grad_norm": 14.554306030273438,
274
+ "learning_rate": 3.5714285714285716e-07,
275
+ "loss": 0.2431,
276
+ "step": 310
277
+ },
278
+ {
279
+ "epoch": 5.914691943127962,
280
+ "eval_accuracy": 0.7563587684069611,
281
+ "eval_f1": 0.6330645161290323,
282
+ "eval_loss": 0.6110782027244568,
283
+ "eval_runtime": 48.257,
284
+ "eval_samples_per_second": 46.439,
285
+ "eval_steps_per_second": 1.471,
286
+ "step": 312
287
+ },
288
+ {
289
+ "epoch": 5.914691943127962,
290
+ "step": 312,
291
+ "total_flos": 3.110854122492383e+18,
292
+ "train_loss": 0.474308407268463,
293
+ "train_runtime": 2029.1858,
294
+ "train_samples_per_second": 19.873,
295
+ "train_steps_per_second": 0.154
296
+ }
297
+ ],
298
+ "logging_steps": 10,
299
+ "max_steps": 312,
300
+ "num_input_tokens_seen": 0,
301
+ "num_train_epochs": 6,
302
+ "save_steps": 500,
303
+ "total_flos": 3.110854122492383e+18,
304
+ "train_batch_size": 32,
305
+ "trial_name": null,
306
+ "trial_params": null
307
+ }