sharren committed on
Commit
e060267
1 Parent(s): 4e0ffec

🍻 cheers

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224
4
  tags:
 
5
  - generated_from_trainer
6
  metrics:
7
  - accuracy
@@ -18,13 +19,13 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  # vit-lr-0.0001
20
 
21
- This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 1.0203
24
- - Accuracy: 0.8457
25
- - Precision: 0.8488
26
- - Recall: 0.8457
27
- - F1: 0.8416
28
 
29
  ## Model description
30
 
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224
4
  tags:
5
+ - image-classification
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
 
19
 
20
  # vit-lr-0.0001
21
 
22
+ This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the skin-cancer dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.4778
25
+ - Accuracy: 0.8311
26
+ - Precision: 0.8433
27
+ - Recall: 0.8311
28
+ - F1: 0.8269
29
 
30
  ## Model description
31
 
all_results.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "epoch": 12.0,
3
- "eval_accuracy": 0.8283633841886269,
4
- "eval_f1": 0.8213379813460607,
5
- "eval_loss": 0.4716978371143341,
6
- "eval_precision": 0.8230999577196753,
7
- "eval_recall": 0.8283633841886269,
8
- "eval_runtime": 38.426,
9
- "eval_samples_per_second": 75.053,
10
- "eval_steps_per_second": 9.395,
11
  "total_flos": 4.768760767819088e+18,
12
- "train_loss": 0.16453982563157443,
13
- "train_runtime": 1738.7619,
14
- "train_samples_per_second": 294.922,
15
- "train_steps_per_second": 18.461
16
  }
 
1
  {
2
  "epoch": 12.0,
3
+ "eval_accuracy": 0.8311373092926491,
4
+ "eval_f1": 0.8268544179848872,
5
+ "eval_loss": 0.4778192639350891,
6
+ "eval_precision": 0.8433264041291242,
7
+ "eval_recall": 0.8311373092926491,
8
+ "eval_runtime": 38.5646,
9
+ "eval_samples_per_second": 74.784,
10
+ "eval_steps_per_second": 9.361,
11
  "total_flos": 4.768760767819088e+18,
12
+ "train_loss": 0.15186076372211968,
13
+ "train_runtime": 1747.1919,
14
+ "train_samples_per_second": 293.5,
15
+ "train_steps_per_second": 18.372
16
  }
eval_results.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "epoch": 12.0,
3
- "eval_accuracy": 0.8283633841886269,
4
- "eval_f1": 0.8213379813460607,
5
- "eval_loss": 0.4716978371143341,
6
- "eval_precision": 0.8230999577196753,
7
- "eval_recall": 0.8283633841886269,
8
- "eval_runtime": 38.426,
9
- "eval_samples_per_second": 75.053,
10
- "eval_steps_per_second": 9.395
11
  }
 
1
  {
2
  "epoch": 12.0,
3
+ "eval_accuracy": 0.8311373092926491,
4
+ "eval_f1": 0.8268544179848872,
5
+ "eval_loss": 0.4778192639350891,
6
+ "eval_precision": 0.8433264041291242,
7
+ "eval_recall": 0.8311373092926491,
8
+ "eval_runtime": 38.5646,
9
+ "eval_samples_per_second": 74.784,
10
+ "eval_steps_per_second": 9.361
11
  }
runs/Mar19_13-16-22_befed1cbff90/events.out.tfevents.1710855985.befed1cbff90.172.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a48d22f2a847c500cf946bfe1a8808b24bb9afcf39f36517c9ea66f7a5fda93
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 12.0,
3
  "total_flos": 4.768760767819088e+18,
4
- "train_loss": 0.16453982563157443,
5
- "train_runtime": 1738.7619,
6
- "train_samples_per_second": 294.922,
7
- "train_steps_per_second": 18.461
8
  }
 
1
  {
2
  "epoch": 12.0,
3
  "total_flos": 4.768760767819088e+18,
4
+ "train_loss": 0.15186076372211968,
5
+ "train_runtime": 1747.1919,
6
+ "train_samples_per_second": 293.5,
7
+ "train_steps_per_second": 18.372
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.4716978371143341,
3
  "best_model_checkpoint": "./vit-lr-0.0001/checkpoint-642",
4
  "epoch": 12.0,
5
  "eval_steps": 500,
@@ -10,240 +10,240 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 5.450945854187012,
14
- "learning_rate": 9.549150281252611e-06,
15
- "loss": 0.682,
16
  "step": 321
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.8099861303744799,
21
- "eval_f1": 0.798120450266025,
22
- "eval_loss": 0.5192127823829651,
23
- "eval_precision": 0.8034262669589041,
24
- "eval_recall": 0.8099861303744799,
25
- "eval_runtime": 37.3933,
26
- "eval_samples_per_second": 77.126,
27
- "eval_steps_per_second": 9.654,
28
  "step": 321
29
  },
30
  {
31
  "epoch": 2.0,
32
- "grad_norm": 5.513205051422119,
33
- "learning_rate": 6.394955530196143e-05,
34
- "loss": 0.4386,
35
  "step": 642
36
  },
37
  {
38
  "epoch": 2.0,
39
- "eval_accuracy": 0.8283633841886269,
40
- "eval_f1": 0.8213379813460607,
41
- "eval_loss": 0.4716978371143341,
42
- "eval_precision": 0.8230999577196753,
43
- "eval_recall": 0.8283633841886269,
44
- "eval_runtime": 37.886,
45
- "eval_samples_per_second": 76.123,
46
- "eval_steps_per_second": 9.529,
47
  "step": 642
48
  },
49
  {
50
  "epoch": 3.0,
51
- "grad_norm": 0.9458593726158142,
52
- "learning_rate": 6.840622763423387e-05,
53
- "loss": 0.2621,
54
  "step": 963
55
  },
56
  {
57
  "epoch": 3.0,
58
- "eval_accuracy": 0.8349514563106796,
59
- "eval_f1": 0.8201100816778963,
60
- "eval_loss": 0.5676096081733704,
61
- "eval_precision": 0.8262616496556073,
62
- "eval_recall": 0.8349514563106796,
63
- "eval_runtime": 37.2214,
64
- "eval_samples_per_second": 77.482,
65
- "eval_steps_per_second": 9.699,
66
  "step": 963
67
  },
68
  {
69
  "epoch": 4.0,
70
- "grad_norm": 7.709182262420654,
71
- "learning_rate": 6.9628986498044885e-06,
72
- "loss": 0.1891,
73
  "step": 1284
74
  },
75
  {
76
  "epoch": 4.0,
77
  "eval_accuracy": 0.8495145631067961,
78
- "eval_f1": 0.8436304900485414,
79
- "eval_loss": 0.5022268891334534,
80
- "eval_precision": 0.8555501567834226,
81
  "eval_recall": 0.8495145631067961,
82
- "eval_runtime": 37.4592,
83
- "eval_samples_per_second": 76.99,
84
- "eval_steps_per_second": 9.637,
85
  "step": 1284
86
  },
87
  {
88
  "epoch": 5.0,
89
- "grad_norm": 0.030552733689546585,
90
- "learning_rate": 9.960573506570156e-05,
91
- "loss": 0.1052,
92
  "step": 1605
93
  },
94
  {
95
  "epoch": 5.0,
96
- "eval_accuracy": 0.8398058252427184,
97
- "eval_f1": 0.8357173097291434,
98
- "eval_loss": 0.6660671830177307,
99
- "eval_precision": 0.8482768361910064,
100
- "eval_recall": 0.8398058252427184,
101
- "eval_runtime": 39.2791,
102
- "eval_samples_per_second": 73.423,
103
- "eval_steps_per_second": 9.191,
104
  "step": 1605
105
  },
106
  {
107
  "epoch": 6.0,
108
- "grad_norm": 1.1932728290557861,
109
- "learning_rate": 1.4644660940675861e-05,
110
- "loss": 0.0785,
111
  "step": 1926
112
  },
113
  {
114
  "epoch": 6.0,
115
- "eval_accuracy": 0.8592233009708737,
116
- "eval_f1": 0.8574256259898136,
117
- "eval_loss": 0.5570405125617981,
118
- "eval_precision": 0.8573736727029027,
119
- "eval_recall": 0.8592233009708737,
120
- "eval_runtime": 37.1007,
121
- "eval_samples_per_second": 77.734,
122
- "eval_steps_per_second": 9.73,
123
  "step": 1926
124
  },
125
  {
126
  "epoch": 7.0,
127
- "grad_norm": 17.325477600097656,
128
- "learning_rate": 5.626666167820289e-05,
129
- "loss": 0.0481,
130
  "step": 2247
131
  },
132
  {
133
  "epoch": 7.0,
134
- "eval_accuracy": 0.8547156726768377,
135
- "eval_f1": 0.8523115263952025,
136
- "eval_loss": 0.6496189832687378,
137
- "eval_precision": 0.8547876753873573,
138
- "eval_recall": 0.8547156726768377,
139
- "eval_runtime": 36.7758,
140
- "eval_samples_per_second": 78.421,
141
- "eval_steps_per_second": 9.816,
142
  "step": 2247
143
  },
144
  {
145
  "epoch": 8.0,
146
- "grad_norm": 0.6180940270423889,
147
- "learning_rate": 7.545207078756922e-05,
148
- "loss": 0.0281,
149
  "step": 2568
150
  },
151
  {
152
  "epoch": 8.0,
153
- "eval_accuracy": 0.8571428571428571,
154
- "eval_f1": 0.8544924977438809,
155
- "eval_loss": 0.7423234581947327,
156
- "eval_precision": 0.8569592454687236,
157
- "eval_recall": 0.8571428571428571,
158
- "eval_runtime": 37.383,
159
- "eval_samples_per_second": 77.147,
160
- "eval_steps_per_second": 9.657,
161
  "step": 2568
162
  },
163
  {
164
  "epoch": 9.0,
165
- "grad_norm": 0.014829314313828945,
166
- "learning_rate": 3.5111757055883184e-06,
167
- "loss": 0.0439,
168
  "step": 2889
169
  },
170
  {
171
  "epoch": 9.0,
172
- "eval_accuracy": 0.8540221914008321,
173
- "eval_f1": 0.8518021160859013,
174
- "eval_loss": 0.7677786946296692,
175
- "eval_precision": 0.851139101545856,
176
- "eval_recall": 0.8540221914008321,
177
- "eval_runtime": 37.2162,
178
- "eval_samples_per_second": 77.493,
179
- "eval_steps_per_second": 9.7,
180
  "step": 2889
181
  },
182
  {
183
  "epoch": 10.0,
184
- "grad_norm": 0.003476586891338229,
185
- "learning_rate": 9.801468428386933e-05,
186
- "loss": 0.0297,
187
  "step": 3210
188
  },
189
  {
190
  "epoch": 10.0,
191
- "eval_accuracy": 0.8467406380027739,
192
- "eval_f1": 0.8464070946689463,
193
- "eval_loss": 0.8647756576538086,
194
- "eval_precision": 0.8478472152581428,
195
- "eval_recall": 0.8467406380027739,
196
- "eval_runtime": 37.1575,
197
- "eval_samples_per_second": 77.616,
198
- "eval_steps_per_second": 9.715,
199
  "step": 3210
200
  },
201
  {
202
  "epoch": 11.0,
203
- "grad_norm": 0.09397422522306442,
204
- "learning_rate": 2.0610737385380886e-05,
205
- "loss": 0.037,
206
  "step": 3531
207
  },
208
  {
209
  "epoch": 11.0,
210
- "eval_accuracy": 0.8561026352288488,
211
- "eval_f1": 0.8548878398804619,
212
- "eval_loss": 0.7682856321334839,
213
- "eval_precision": 0.8552181984518148,
214
- "eval_recall": 0.8561026352288488,
215
- "eval_runtime": 37.5045,
216
- "eval_samples_per_second": 76.898,
217
- "eval_steps_per_second": 9.626,
218
  "step": 3531
219
  },
220
  {
221
  "epoch": 12.0,
222
- "grad_norm": 0.002134101465344429,
223
- "learning_rate": 4.999999999998897e-05,
224
- "loss": 0.0322,
225
  "step": 3852
226
  },
227
  {
228
  "epoch": 12.0,
229
- "eval_accuracy": 0.8512482662968099,
230
- "eval_f1": 0.8396847788052201,
231
- "eval_loss": 1.0125652551651,
232
- "eval_precision": 0.8561110421693547,
233
- "eval_recall": 0.8512482662968099,
234
- "eval_runtime": 37.3877,
235
- "eval_samples_per_second": 77.138,
236
- "eval_steps_per_second": 9.656,
237
  "step": 3852
238
  },
239
  {
240
  "epoch": 12.0,
241
  "step": 3852,
242
  "total_flos": 4.768760767819088e+18,
243
- "train_loss": 0.16453982563157443,
244
- "train_runtime": 1738.7619,
245
- "train_samples_per_second": 294.922,
246
- "train_steps_per_second": 18.461
247
  }
248
  ],
249
  "logging_steps": 500,
 
1
  {
2
+ "best_metric": 0.4778192639350891,
3
  "best_model_checkpoint": "./vit-lr-0.0001/checkpoint-642",
4
  "epoch": 12.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 5.167571067810059,
14
+ "learning_rate": 9.997548148581541e-05,
15
+ "loss": 0.6718,
16
  "step": 321
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.8242024965325936,
21
+ "eval_f1": 0.8162630829948523,
22
+ "eval_loss": 0.4934074282646179,
23
+ "eval_precision": 0.8254417232097437,
24
+ "eval_recall": 0.8242024965325936,
25
+ "eval_runtime": 37.6292,
26
+ "eval_samples_per_second": 76.643,
27
+ "eval_steps_per_second": 9.594,
28
  "step": 321
29
  },
30
  {
31
  "epoch": 2.0,
32
+ "grad_norm": 6.953319072723389,
33
+ "learning_rate": 9.990164344447551e-05,
34
+ "loss": 0.4045,
35
  "step": 642
36
  },
37
  {
38
  "epoch": 2.0,
39
+ "eval_accuracy": 0.8311373092926491,
40
+ "eval_f1": 0.8268544179848872,
41
+ "eval_loss": 0.4778192639350891,
42
+ "eval_precision": 0.8433264041291242,
43
+ "eval_recall": 0.8311373092926491,
44
+ "eval_runtime": 37.5244,
45
+ "eval_samples_per_second": 76.857,
46
+ "eval_steps_per_second": 9.62,
47
  "step": 642
48
  },
49
  {
50
  "epoch": 3.0,
51
+ "grad_norm": 7.354413986206055,
52
+ "learning_rate": 9.977855850575433e-05,
53
+ "loss": 0.2419,
54
  "step": 963
55
  },
56
  {
57
  "epoch": 3.0,
58
+ "eval_accuracy": 0.840499306518724,
59
+ "eval_f1": 0.8409562025706393,
60
+ "eval_loss": 0.5132780075073242,
61
+ "eval_precision": 0.8524873378932092,
62
+ "eval_recall": 0.840499306518724,
63
+ "eval_runtime": 36.8758,
64
+ "eval_samples_per_second": 78.209,
65
+ "eval_steps_per_second": 9.79,
66
  "step": 963
67
  },
68
  {
69
  "epoch": 4.0,
70
+ "grad_norm": 0.17630255222320557,
71
+ "learning_rate": 9.960634813962617e-05,
72
+ "loss": 0.1267,
73
  "step": 1284
74
  },
75
  {
76
  "epoch": 4.0,
77
  "eval_accuracy": 0.8495145631067961,
78
+ "eval_f1": 0.8447806876150558,
79
+ "eval_loss": 0.6153807044029236,
80
+ "eval_precision": 0.8490665425851771,
81
  "eval_recall": 0.8495145631067961,
82
+ "eval_runtime": 37.1161,
83
+ "eval_samples_per_second": 77.702,
84
+ "eval_steps_per_second": 9.726,
85
  "step": 1284
86
  },
87
  {
88
  "epoch": 5.0,
89
+ "grad_norm": 0.5389394760131836,
90
+ "learning_rate": 9.938518229693118e-05,
91
+ "loss": 0.0733,
92
  "step": 1605
93
  },
94
  {
95
  "epoch": 5.0,
96
+ "eval_accuracy": 0.8422330097087378,
97
+ "eval_f1": 0.8361023278787632,
98
+ "eval_loss": 0.7844527959823608,
99
+ "eval_precision": 0.8420613182520028,
100
+ "eval_recall": 0.8422330097087378,
101
+ "eval_runtime": 37.3092,
102
+ "eval_samples_per_second": 77.3,
103
+ "eval_steps_per_second": 9.676,
104
  "step": 1605
105
  },
106
  {
107
  "epoch": 6.0,
108
+ "grad_norm": 24.989282608032227,
109
+ "learning_rate": 9.911527924165445e-05,
110
+ "loss": 0.0446,
111
  "step": 1926
112
  },
113
  {
114
  "epoch": 6.0,
115
+ "eval_accuracy": 0.8470873786407767,
116
+ "eval_f1": 0.840751584936853,
117
+ "eval_loss": 0.8766722679138184,
118
+ "eval_precision": 0.8407202080357687,
119
+ "eval_recall": 0.8470873786407767,
120
+ "eval_runtime": 37.9466,
121
+ "eval_samples_per_second": 76.002,
122
+ "eval_steps_per_second": 9.513,
123
  "step": 1926
124
  },
125
  {
126
  "epoch": 7.0,
127
+ "grad_norm": 0.16091497242450714,
128
+ "learning_rate": 9.879690533552573e-05,
129
+ "loss": 0.0523,
130
  "step": 2247
131
  },
132
  {
133
  "epoch": 7.0,
134
+ "eval_accuracy": 0.84500693481276,
135
+ "eval_f1": 0.8406651419661996,
136
+ "eval_loss": 0.8674203753471375,
137
+ "eval_precision": 0.8491745633887275,
138
+ "eval_recall": 0.84500693481276,
139
+ "eval_runtime": 37.6505,
140
+ "eval_samples_per_second": 76.599,
141
+ "eval_steps_per_second": 9.588,
142
  "step": 2247
143
  },
144
  {
145
  "epoch": 8.0,
146
+ "grad_norm": 0.0028496491722762585,
147
+ "learning_rate": 9.843159102999166e-05,
148
+ "loss": 0.0388,
149
  "step": 2568
150
  },
151
  {
152
  "epoch": 8.0,
153
+ "eval_accuracy": 0.8398058252427184,
154
+ "eval_f1": 0.8387317635385871,
155
+ "eval_loss": 0.9753792881965637,
156
+ "eval_precision": 0.8565844319804308,
157
+ "eval_recall": 0.8398058252427184,
158
+ "eval_runtime": 37.8044,
159
+ "eval_samples_per_second": 76.287,
160
+ "eval_steps_per_second": 9.549,
161
  "step": 2568
162
  },
163
  {
164
  "epoch": 9.0,
165
+ "grad_norm": 0.0019187598954886198,
166
+ "learning_rate": 9.801741382013225e-05,
167
+ "loss": 0.0402,
168
  "step": 2889
169
  },
170
  {
171
  "epoch": 9.0,
172
+ "eval_accuracy": 0.8491678224687933,
173
+ "eval_f1": 0.8461066193854649,
174
+ "eval_loss": 0.9369620084762573,
175
+ "eval_precision": 0.8547133286785668,
176
+ "eval_recall": 0.8491678224687933,
177
+ "eval_runtime": 37.5745,
178
+ "eval_samples_per_second": 76.754,
179
+ "eval_steps_per_second": 9.608,
180
  "step": 2889
181
  },
182
  {
183
  "epoch": 10.0,
184
+ "grad_norm": 0.00408038217574358,
185
+ "learning_rate": 9.755584922004499e-05,
186
+ "loss": 0.0283,
187
  "step": 3210
188
  },
189
  {
190
  "epoch": 10.0,
191
+ "eval_accuracy": 0.8509015256588072,
192
+ "eval_f1": 0.8482666902922076,
193
+ "eval_loss": 0.9217829704284668,
194
+ "eval_precision": 0.8495520865912046,
195
+ "eval_recall": 0.8509015256588072,
196
+ "eval_runtime": 37.6867,
197
+ "eval_samples_per_second": 76.526,
198
+ "eval_steps_per_second": 9.579,
199
  "step": 3210
200
  },
201
  {
202
  "epoch": 11.0,
203
+ "grad_norm": 2.3583085536956787,
204
+ "learning_rate": 9.70473527382648e-05,
205
+ "loss": 0.0451,
206
  "step": 3531
207
  },
208
  {
209
  "epoch": 11.0,
210
+ "eval_accuracy": 0.8474341192787794,
211
+ "eval_f1": 0.8401062715209746,
212
+ "eval_loss": 0.987198531627655,
213
+ "eval_precision": 0.8400167652295873,
214
+ "eval_recall": 0.8474341192787794,
215
+ "eval_runtime": 37.5611,
216
+ "eval_samples_per_second": 76.782,
217
+ "eval_steps_per_second": 9.611,
218
  "step": 3531
219
  },
220
  {
221
  "epoch": 12.0,
222
+ "grad_norm": 11.217573165893555,
223
+ "learning_rate": 9.649242619942769e-05,
224
+ "loss": 0.0549,
225
  "step": 3852
226
  },
227
  {
228
  "epoch": 12.0,
229
+ "eval_accuracy": 0.8457004160887656,
230
+ "eval_f1": 0.8415779150905001,
231
+ "eval_loss": 1.0202850103378296,
232
+ "eval_precision": 0.8487681253829549,
233
+ "eval_recall": 0.8457004160887656,
234
+ "eval_runtime": 37.4542,
235
+ "eval_samples_per_second": 77.001,
236
+ "eval_steps_per_second": 9.638,
237
  "step": 3852
238
  },
239
  {
240
  "epoch": 12.0,
241
  "step": 3852,
242
  "total_flos": 4.768760767819088e+18,
243
+ "train_loss": 0.15186076372211968,
244
+ "train_runtime": 1747.1919,
245
+ "train_samples_per_second": 293.5,
246
+ "train_steps_per_second": 18.372
247
  }
248
  ],
249
  "logging_steps": 500,