JorgeGIT committed on
Commit
7029aa1
1 Parent(s): e52a769

Model save

Browse files
README.md CHANGED
@@ -32,7 +32,7 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.0870
36
  - Accuracy: 0.9774
37
 
38
  ## Model description
@@ -58,16 +58,19 @@ The following hyperparameters were used during training:
58
  - seed: 42
59
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
  - lr_scheduler_type: linear
61
- - num_epochs: 10
62
  - mixed_precision_training: Native AMP
63
 
64
  ### Training results
65
 
66
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
67
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
68
- | 0.1606 | 2.94 | 100 | 0.1829 | 0.9511 |
69
- | 0.1895 | 5.88 | 200 | 0.1441 | 0.9662 |
70
- | 0.0423 | 8.82 | 300 | 0.0870 | 0.9774 |
 
 
 
71
 
72
 
73
  ### Framework versions
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.1073
36
  - Accuracy: 0.9774
37
 
38
  ## Model description
 
58
  - seed: 42
59
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
  - lr_scheduler_type: linear
61
+ - num_epochs: 20
62
  - mixed_precision_training: Native AMP
63
 
64
  ### Training results
65
 
66
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
67
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
68
+ | 0.0673 | 2.94 | 100 | 0.1144 | 0.9699 |
69
+ | 0.0639 | 5.88 | 200 | 0.1431 | 0.9549 |
70
+ | 0.0491 | 8.82 | 300 | 0.2439 | 0.9436 |
71
+ | 0.0532 | 11.76 | 400 | 0.1389 | 0.9624 |
72
+ | 0.0636 | 14.71 | 500 | 0.1537 | 0.9624 |
73
+ | 0.0493 | 17.65 | 600 | 0.1073 | 0.9774 |
74
 
75
 
76
  ### Framework versions
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 4.0,
3
- "eval_accuracy": 0.9548872180451128,
4
- "eval_loss": 0.18233025074005127,
5
- "eval_runtime": 2.6375,
6
- "eval_samples_per_second": 100.853,
7
- "eval_steps_per_second": 12.891,
8
- "total_flos": 3.292007238315049e+17,
9
- "train_loss": 0.5091555158593761,
10
- "train_runtime": 958.3438,
11
- "train_samples_per_second": 4.433,
12
- "train_steps_per_second": 0.28
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.9774436090225563,
4
+ "eval_loss": 0.08701933920383453,
5
+ "eval_runtime": 6.074,
6
+ "eval_samples_per_second": 43.794,
7
+ "eval_steps_per_second": 5.598,
8
+ "total_flos": 8.230018095787622e+17,
9
+ "train_loss": 0.1465345554492053,
10
+ "train_runtime": 221.0307,
11
+ "train_samples_per_second": 48.048,
12
+ "train_steps_per_second": 1.538
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.0,
3
- "eval_accuracy": 0.9548872180451128,
4
- "eval_loss": 0.18233025074005127,
5
- "eval_runtime": 2.6375,
6
- "eval_samples_per_second": 100.853,
7
- "eval_steps_per_second": 12.891
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.9774436090225563,
4
+ "eval_loss": 0.08701933920383453,
5
+ "eval_runtime": 6.074,
6
+ "eval_samples_per_second": 43.794,
7
+ "eval_steps_per_second": 5.598
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86d8fbbe5587bcb92891682aa722012947d3377ee2016b310819dd2600bc17ef
3
  size 343239356
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411fb8baf76f74b477a876b3be53846a6c2c51f9277cb00a81542425c237112f
3
  size 343239356
runs/Nov30_23-24-53_6c26dad0aabb/events.out.tfevents.1701388197.6c26dad0aabb.7066.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06a65913484bc16a9200120c328bc649062568aeac6e2385df8965cf3585a7ee
3
+ size 411
runs/Nov30_23-50-18_6c26dad0aabb/events.out.tfevents.1701388227.6c26dad0aabb.7066.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76b8a5911036db92b1652c997605f1151504fc201444bcd1bdd0c2322b086fd9
3
+ size 17453
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 4.0,
3
- "total_flos": 3.292007238315049e+17,
4
- "train_loss": 0.5091555158593761,
5
- "train_runtime": 958.3438,
6
- "train_samples_per_second": 4.433,
7
- "train_steps_per_second": 0.28
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 8.230018095787622e+17,
4
+ "train_loss": 0.1465345554492053,
5
+ "train_runtime": 221.0307,
6
+ "train_samples_per_second": 48.048,
7
+ "train_steps_per_second": 1.538
8
  }
trainer_state.json CHANGED
@@ -1,202 +1,259 @@
1
  {
2
- "best_metric": 0.18233025074005127,
3
- "best_model_checkpoint": "finetuned-Leukemia-cell/checkpoint-200",
4
- "epoch": 4.0,
5
  "eval_steps": 100,
6
- "global_step": 268,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.15,
13
- "learning_rate": 0.00019253731343283584,
14
- "loss": 1.7951,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 0.3,
19
- "learning_rate": 0.00018507462686567165,
20
- "loss": 1.3572,
21
  "step": 20
22
  },
23
  {
24
- "epoch": 0.45,
25
- "learning_rate": 0.00017761194029850748,
26
- "loss": 0.98,
27
  "step": 30
28
  },
29
  {
30
- "epoch": 0.6,
31
- "learning_rate": 0.00017014925373134328,
32
- "loss": 0.9394,
33
  "step": 40
34
  },
35
  {
36
- "epoch": 0.75,
37
- "learning_rate": 0.00016268656716417911,
38
- "loss": 0.7973,
39
  "step": 50
40
  },
41
  {
42
- "epoch": 0.9,
43
- "learning_rate": 0.00015522388059701495,
44
- "loss": 0.8591,
45
  "step": 60
46
  },
47
  {
48
- "epoch": 1.04,
49
- "learning_rate": 0.00014776119402985075,
50
- "loss": 0.6357,
51
  "step": 70
52
  },
53
  {
54
- "epoch": 1.19,
55
- "learning_rate": 0.00014029850746268658,
56
- "loss": 0.6522,
57
  "step": 80
58
  },
59
  {
60
- "epoch": 1.34,
61
- "learning_rate": 0.0001328358208955224,
62
- "loss": 0.495,
63
  "step": 90
64
  },
65
  {
66
- "epoch": 1.49,
67
- "learning_rate": 0.00012537313432835822,
68
- "loss": 0.4862,
69
  "step": 100
70
  },
71
  {
72
- "epoch": 1.49,
73
- "eval_accuracy": 0.9172932330827067,
74
- "eval_loss": 0.4092223644256592,
75
- "eval_runtime": 173.193,
76
- "eval_samples_per_second": 1.536,
77
- "eval_steps_per_second": 0.196,
78
  "step": 100
79
  },
80
  {
81
- "epoch": 1.64,
82
- "learning_rate": 0.00011791044776119405,
83
- "loss": 0.5047,
84
  "step": 110
85
  },
86
  {
87
- "epoch": 1.79,
88
- "learning_rate": 0.00011044776119402987,
89
- "loss": 0.3878,
90
  "step": 120
91
  },
92
  {
93
- "epoch": 1.94,
94
- "learning_rate": 0.00010298507462686569,
95
- "loss": 0.43,
96
  "step": 130
97
  },
98
  {
99
- "epoch": 2.09,
100
- "learning_rate": 9.552238805970149e-05,
101
- "loss": 0.3441,
102
  "step": 140
103
  },
104
  {
105
- "epoch": 2.24,
106
- "learning_rate": 8.805970149253732e-05,
107
- "loss": 0.3271,
108
  "step": 150
109
  },
110
  {
111
- "epoch": 2.39,
112
- "learning_rate": 8.059701492537314e-05,
113
- "loss": 0.3415,
114
  "step": 160
115
  },
116
  {
117
- "epoch": 2.54,
118
- "learning_rate": 7.313432835820896e-05,
119
- "loss": 0.293,
120
  "step": 170
121
  },
122
  {
123
- "epoch": 2.69,
124
- "learning_rate": 6.567164179104478e-05,
125
- "loss": 0.2864,
126
  "step": 180
127
  },
128
  {
129
- "epoch": 2.84,
130
- "learning_rate": 5.82089552238806e-05,
131
- "loss": 0.2873,
132
  "step": 190
133
  },
134
  {
135
- "epoch": 2.99,
136
- "learning_rate": 5.074626865671642e-05,
137
- "loss": 0.2095,
138
  "step": 200
139
  },
140
  {
141
- "epoch": 2.99,
142
- "eval_accuracy": 0.9548872180451128,
143
- "eval_loss": 0.18233025074005127,
144
- "eval_runtime": 2.578,
145
- "eval_samples_per_second": 103.183,
146
- "eval_steps_per_second": 13.189,
147
  "step": 200
148
  },
149
  {
150
- "epoch": 3.13,
151
- "learning_rate": 4.328358208955224e-05,
152
- "loss": 0.1822,
153
  "step": 210
154
  },
155
  {
156
- "epoch": 3.28,
157
- "learning_rate": 3.582089552238806e-05,
158
- "loss": 0.228,
159
  "step": 220
160
  },
161
  {
162
- "epoch": 3.43,
163
- "learning_rate": 2.835820895522388e-05,
164
- "loss": 0.1377,
165
  "step": 230
166
  },
167
  {
168
- "epoch": 3.58,
169
- "learning_rate": 2.0895522388059702e-05,
170
- "loss": 0.2099,
171
  "step": 240
172
  },
173
  {
174
- "epoch": 3.73,
175
- "learning_rate": 1.3432835820895523e-05,
176
- "loss": 0.1576,
177
  "step": 250
178
  },
179
  {
180
- "epoch": 3.88,
181
- "learning_rate": 5.970149253731343e-06,
182
- "loss": 0.1394,
183
  "step": 260
184
  },
185
  {
186
- "epoch": 4.0,
187
- "step": 268,
188
- "total_flos": 3.292007238315049e+17,
189
- "train_loss": 0.5091555158593761,
190
- "train_runtime": 958.3438,
191
- "train_samples_per_second": 4.433,
192
- "train_steps_per_second": 0.28
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
193
  }
194
  ],
195
  "logging_steps": 10,
196
- "max_steps": 268,
197
- "num_train_epochs": 4,
198
  "save_steps": 100,
199
- "total_flos": 3.292007238315049e+17,
200
  "trial_name": null,
201
  "trial_params": null
202
  }
 
1
  {
2
+ "best_metric": 0.08701933920383453,
3
+ "best_model_checkpoint": "finetuned-Leukemia-cell/checkpoint-300",
4
+ "epoch": 10.0,
5
  "eval_steps": 100,
6
+ "global_step": 340,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.29,
13
+ "learning_rate": 0.00019411764705882354,
14
+ "loss": 0.5837,
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 0.59,
19
+ "learning_rate": 0.00018823529411764707,
20
+ "loss": 0.2956,
21
  "step": 20
22
  },
23
  {
24
+ "epoch": 0.88,
25
+ "learning_rate": 0.0001823529411764706,
26
+ "loss": 0.279,
27
  "step": 30
28
  },
29
  {
30
+ "epoch": 1.18,
31
+ "learning_rate": 0.00017647058823529413,
32
+ "loss": 0.1566,
33
  "step": 40
34
  },
35
  {
36
+ "epoch": 1.47,
37
+ "learning_rate": 0.00017058823529411766,
38
+ "loss": 0.1042,
39
  "step": 50
40
  },
41
  {
42
+ "epoch": 1.76,
43
+ "learning_rate": 0.0001647058823529412,
44
+ "loss": 0.176,
45
  "step": 60
46
  },
47
  {
48
+ "epoch": 2.06,
49
+ "learning_rate": 0.0001588235294117647,
50
+ "loss": 0.1231,
51
  "step": 70
52
  },
53
  {
54
+ "epoch": 2.35,
55
+ "learning_rate": 0.00015294117647058822,
56
+ "loss": 0.0952,
57
  "step": 80
58
  },
59
  {
60
+ "epoch": 2.65,
61
+ "learning_rate": 0.00014705882352941178,
62
+ "loss": 0.1003,
63
  "step": 90
64
  },
65
  {
66
+ "epoch": 2.94,
67
+ "learning_rate": 0.0001411764705882353,
68
+ "loss": 0.1606,
69
  "step": 100
70
  },
71
  {
72
+ "epoch": 2.94,
73
+ "eval_accuracy": 0.9511278195488722,
74
+ "eval_loss": 0.18294382095336914,
75
+ "eval_runtime": 2.8739,
76
+ "eval_samples_per_second": 92.556,
77
+ "eval_steps_per_second": 11.83,
78
  "step": 100
79
  },
80
  {
81
+ "epoch": 3.24,
82
+ "learning_rate": 0.00013529411764705884,
83
+ "loss": 0.2204,
84
  "step": 110
85
  },
86
  {
87
+ "epoch": 3.53,
88
+ "learning_rate": 0.00012941176470588237,
89
+ "loss": 0.2845,
90
  "step": 120
91
  },
92
  {
93
+ "epoch": 3.82,
94
+ "learning_rate": 0.0001235294117647059,
95
+ "loss": 0.2104,
96
  "step": 130
97
  },
98
  {
99
+ "epoch": 4.12,
100
+ "learning_rate": 0.00011764705882352942,
101
+ "loss": 0.2029,
102
  "step": 140
103
  },
104
  {
105
+ "epoch": 4.41,
106
+ "learning_rate": 0.00011176470588235294,
107
+ "loss": 0.1105,
108
  "step": 150
109
  },
110
  {
111
+ "epoch": 4.71,
112
+ "learning_rate": 0.00010588235294117647,
113
+ "loss": 0.177,
114
  "step": 160
115
  },
116
  {
117
+ "epoch": 5.0,
118
+ "learning_rate": 0.0001,
119
+ "loss": 0.1881,
120
  "step": 170
121
  },
122
  {
123
+ "epoch": 5.29,
124
+ "learning_rate": 9.411764705882353e-05,
125
+ "loss": 0.1445,
126
  "step": 180
127
  },
128
  {
129
+ "epoch": 5.59,
130
+ "learning_rate": 8.823529411764706e-05,
131
+ "loss": 0.0891,
132
  "step": 190
133
  },
134
  {
135
+ "epoch": 5.88,
136
+ "learning_rate": 8.23529411764706e-05,
137
+ "loss": 0.1895,
138
  "step": 200
139
  },
140
  {
141
+ "epoch": 5.88,
142
+ "eval_accuracy": 0.9661654135338346,
143
+ "eval_loss": 0.14408943057060242,
144
+ "eval_runtime": 2.3757,
145
+ "eval_samples_per_second": 111.968,
146
+ "eval_steps_per_second": 14.312,
147
  "step": 200
148
  },
149
  {
150
+ "epoch": 6.18,
151
+ "learning_rate": 7.647058823529411e-05,
152
+ "loss": 0.1095,
153
  "step": 210
154
  },
155
  {
156
+ "epoch": 6.47,
157
+ "learning_rate": 7.058823529411765e-05,
158
+ "loss": 0.1908,
159
  "step": 220
160
  },
161
  {
162
+ "epoch": 6.76,
163
+ "learning_rate": 6.470588235294118e-05,
164
+ "loss": 0.1118,
165
  "step": 230
166
  },
167
  {
168
+ "epoch": 7.06,
169
+ "learning_rate": 5.882352941176471e-05,
170
+ "loss": 0.0461,
171
  "step": 240
172
  },
173
  {
174
+ "epoch": 7.35,
175
+ "learning_rate": 5.294117647058824e-05,
176
+ "loss": 0.1002,
177
  "step": 250
178
  },
179
  {
180
+ "epoch": 7.65,
181
+ "learning_rate": 4.705882352941177e-05,
182
+ "loss": 0.082,
183
  "step": 260
184
  },
185
  {
186
+ "epoch": 7.94,
187
+ "learning_rate": 4.11764705882353e-05,
188
+ "loss": 0.0712,
189
+ "step": 270
190
+ },
191
+ {
192
+ "epoch": 8.24,
193
+ "learning_rate": 3.529411764705883e-05,
194
+ "loss": 0.0565,
195
+ "step": 280
196
+ },
197
+ {
198
+ "epoch": 8.53,
199
+ "learning_rate": 2.9411764705882354e-05,
200
+ "loss": 0.0702,
201
+ "step": 290
202
+ },
203
+ {
204
+ "epoch": 8.82,
205
+ "learning_rate": 2.3529411764705884e-05,
206
+ "loss": 0.0423,
207
+ "step": 300
208
+ },
209
+ {
210
+ "epoch": 8.82,
211
+ "eval_accuracy": 0.9774436090225563,
212
+ "eval_loss": 0.08701933920383453,
213
+ "eval_runtime": 2.414,
214
+ "eval_samples_per_second": 110.19,
215
+ "eval_steps_per_second": 14.084,
216
+ "step": 300
217
+ },
218
+ {
219
+ "epoch": 9.12,
220
+ "learning_rate": 1.7647058823529414e-05,
221
+ "loss": 0.0652,
222
+ "step": 310
223
+ },
224
+ {
225
+ "epoch": 9.41,
226
+ "learning_rate": 1.1764705882352942e-05,
227
+ "loss": 0.027,
228
+ "step": 320
229
+ },
230
+ {
231
+ "epoch": 9.71,
232
+ "learning_rate": 5.882352941176471e-06,
233
+ "loss": 0.0633,
234
+ "step": 330
235
+ },
236
+ {
237
+ "epoch": 10.0,
238
+ "learning_rate": 0.0,
239
+ "loss": 0.055,
240
+ "step": 340
241
+ },
242
+ {
243
+ "epoch": 10.0,
244
+ "step": 340,
245
+ "total_flos": 8.230018095787622e+17,
246
+ "train_loss": 0.1465345554492053,
247
+ "train_runtime": 221.0307,
248
+ "train_samples_per_second": 48.048,
249
+ "train_steps_per_second": 1.538
250
  }
251
  ],
252
  "logging_steps": 10,
253
+ "max_steps": 340,
254
+ "num_train_epochs": 10,
255
  "save_steps": 100,
256
+ "total_flos": 8.230018095787622e+17,
257
  "trial_name": null,
258
  "trial_params": null
259
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:945f141fbeb29ad39b8605b232d98a21f0507a88e5e0eb935c00a2a7f5a4a921
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c51a9692dffa79666ee4c2a799f0ef6e3fddf95c8240e6d000dc48049d3457
3
  size 4600