sharren committed on
Commit
da72220
1 Parent(s): a9398f3

🍻 cheers

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224
4
  tags:
 
5
  - generated_from_trainer
6
  metrics:
7
  - accuracy
@@ -18,13 +19,13 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  # vit-lr-0.0001
20
 
21
- This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.6800
24
- - Accuracy: 0.8322
25
- - Precision: 0.8330
26
- - Recall: 0.8322
27
- - F1: 0.8229
28
 
29
  ## Model description
30
 
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224
4
  tags:
5
+ - image-classification
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
 
19
 
20
  # vit-lr-0.0001
21
 
22
+ This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the skin-cancer dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.4886
25
+ - Accuracy: 0.8273
26
+ - Precision: 0.8287
27
+ - Recall: 0.8273
28
+ - F1: 0.8227
29
 
30
  ## Model description
31
 
all_results.json CHANGED
@@ -1,13 +1,16 @@
1
  {
2
- "epoch": 2.18,
3
- "eval_accuracy": 0.8169209431345353,
4
- "eval_loss": 0.49744343757629395,
5
- "eval_runtime": 40.9787,
6
- "eval_samples_per_second": 70.378,
7
- "eval_steps_per_second": 8.809,
8
- "total_flos": 8.667092503134536e+17,
9
- "train_loss": 0.4869789886474609,
10
- "train_runtime": 547.2513,
11
- "train_samples_per_second": 937.047,
12
- "train_steps_per_second": 58.657
 
 
 
13
  }
 
1
  {
2
+ "epoch": 3.43,
3
+ "eval_accuracy": 0.8273231622746186,
4
+ "eval_f1": 0.822737257017553,
5
+ "eval_loss": 0.4886268079280853,
6
+ "eval_precision": 0.8287258592840144,
7
+ "eval_recall": 0.8273231622746186,
8
+ "eval_runtime": 40.0459,
9
+ "eval_samples_per_second": 72.017,
10
+ "eval_steps_per_second": 9.015,
11
+ "total_flos": 1.362060245306622e+18,
12
+ "train_loss": 0.40586378964510833,
13
+ "train_runtime": 828.4507,
14
+ "train_samples_per_second": 618.987,
15
+ "train_steps_per_second": 38.747
16
  }
eval_results.json CHANGED
@@ -1,8 +1,11 @@
1
  {
2
- "epoch": 2.18,
3
- "eval_accuracy": 0.8169209431345353,
4
- "eval_loss": 0.49744343757629395,
5
- "eval_runtime": 40.9787,
6
- "eval_samples_per_second": 70.378,
7
- "eval_steps_per_second": 8.809
 
 
 
8
  }
 
1
  {
2
+ "epoch": 3.43,
3
+ "eval_accuracy": 0.8273231622746186,
4
+ "eval_f1": 0.822737257017553,
5
+ "eval_loss": 0.4886268079280853,
6
+ "eval_precision": 0.8287258592840144,
7
+ "eval_recall": 0.8273231622746186,
8
+ "eval_runtime": 40.0459,
9
+ "eval_samples_per_second": 72.017,
10
+ "eval_steps_per_second": 9.015
11
  }
runs/Mar17_21-09-49_add18dc15495/events.out.tfevents.1710710837.add18dc15495.3839.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23901c00884c0ff9b4378a9daf6a29df8980be154cb078878ffe9f6c35e7cc21
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.18,
3
- "total_flos": 8.667092503134536e+17,
4
- "train_loss": 0.4869789886474609,
5
- "train_runtime": 547.2513,
6
- "train_samples_per_second": 937.047,
7
- "train_steps_per_second": 58.657
8
  }
 
1
  {
2
+ "epoch": 3.43,
3
+ "total_flos": 1.362060245306622e+18,
4
+ "train_loss": 0.40586378964510833,
5
+ "train_runtime": 828.4507,
6
+ "train_samples_per_second": 618.987,
7
+ "train_steps_per_second": 38.747
8
  }
trainer_state.json CHANGED
@@ -1,133 +1,230 @@
1
  {
2
- "best_metric": 0.49744343757629395,
3
- "best_model_checkpoint": "./vit-lr-0.0001/checkpoint-400",
4
- "epoch": 2.1806853582554515,
5
  "eval_steps": 100,
6
- "global_step": 700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.31,
13
- "grad_norm": 4.504175186157227,
14
- "learning_rate": 9.999760543724762e-05,
15
- "loss": 0.7774,
16
  "step": 100
17
  },
18
  {
19
  "epoch": 0.31,
20
- "eval_accuracy": 0.7846740638002774,
21
- "eval_loss": 0.5988100171089172,
22
- "eval_runtime": 39.924,
23
- "eval_samples_per_second": 72.237,
24
- "eval_steps_per_second": 9.042,
 
 
 
25
  "step": 100
26
  },
27
  {
28
  "epoch": 0.62,
29
- "grad_norm": 6.5739970207214355,
30
- "learning_rate": 9.999042197834769e-05,
31
- "loss": 0.59,
32
  "step": 200
33
  },
34
  {
35
  "epoch": 0.62,
36
- "eval_accuracy": 0.7732316227461858,
37
- "eval_loss": 0.6567931175231934,
38
- "eval_runtime": 39.9411,
39
- "eval_samples_per_second": 72.206,
40
- "eval_steps_per_second": 9.038,
 
 
 
41
  "step": 200
42
  },
43
  {
44
  "epoch": 0.93,
45
- "grad_norm": 6.0171613693237305,
46
  "learning_rate": 9.997859372626506e-05,
47
- "loss": 0.584,
48
  "step": 300
49
  },
50
  {
51
  "epoch": 0.93,
52
- "eval_accuracy": 0.7562413314840499,
53
- "eval_loss": 0.6686193346977234,
54
- "eval_runtime": 40.0793,
55
- "eval_samples_per_second": 71.957,
56
- "eval_steps_per_second": 9.007,
 
 
 
57
  "step": 300
58
  },
59
  {
60
  "epoch": 1.25,
61
- "grad_norm": 3.5295469760894775,
62
  "learning_rate": 9.996188286127832e-05,
63
- "loss": 0.4275,
64
  "step": 400
65
  },
66
  {
67
  "epoch": 1.25,
68
- "eval_accuracy": 0.8169209431345353,
69
- "eval_loss": 0.49744343757629395,
70
- "eval_runtime": 39.8506,
71
- "eval_samples_per_second": 72.37,
72
- "eval_steps_per_second": 9.059,
 
 
 
73
  "step": 400
74
  },
75
  {
76
  "epoch": 1.56,
77
- "grad_norm": 2.440728187561035,
78
  "learning_rate": 9.994038652174203e-05,
79
- "loss": 0.3963,
80
  "step": 500
81
  },
82
  {
83
  "epoch": 1.56,
84
- "eval_accuracy": 0.8287101248266296,
85
- "eval_loss": 0.507750391960144,
86
- "eval_runtime": 39.6231,
87
- "eval_samples_per_second": 72.786,
88
- "eval_steps_per_second": 9.111,
 
 
 
89
  "step": 500
90
  },
91
  {
92
  "epoch": 1.87,
93
- "grad_norm": 4.625945568084717,
94
  "learning_rate": 9.991410676662952e-05,
95
- "loss": 0.3708,
96
  "step": 600
97
  },
98
  {
99
  "epoch": 1.87,
100
- "eval_accuracy": 0.794382801664355,
101
- "eval_loss": 0.5709377527236938,
102
- "eval_runtime": 39.6196,
103
- "eval_samples_per_second": 72.792,
104
- "eval_steps_per_second": 9.112,
 
 
 
105
  "step": 600
106
  },
107
  {
108
  "epoch": 2.18,
109
- "grad_norm": 2.9291675090789795,
110
  "learning_rate": 9.988304611308174e-05,
111
- "loss": 0.2628,
112
  "step": 700
113
  },
114
  {
115
  "epoch": 2.18,
116
- "eval_accuracy": 0.812760055478502,
117
- "eval_loss": 0.6022083163261414,
118
- "eval_runtime": 39.3146,
119
- "eval_samples_per_second": 73.357,
120
- "eval_steps_per_second": 9.182,
 
 
 
121
  "step": 700
122
  },
123
  {
124
- "epoch": 2.18,
125
- "step": 700,
126
- "total_flos": 8.667092503134536e+17,
127
- "train_loss": 0.4869789886474609,
128
- "train_runtime": 547.2513,
129
- "train_samples_per_second": 937.047,
130
- "train_steps_per_second": 58.657
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
131
  }
132
  ],
133
  "logging_steps": 100,
@@ -135,7 +232,7 @@
135
  "num_input_tokens_seen": 0,
136
  "num_train_epochs": 100,
137
  "save_steps": 100,
138
- "total_flos": 8.667092503134536e+17,
139
  "train_batch_size": 16,
140
  "trial_name": null,
141
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.4886268079280853,
3
+ "best_model_checkpoint": "./vit-lr-0.0001/checkpoint-800",
4
+ "epoch": 3.426791277258567,
5
  "eval_steps": 100,
6
+ "global_step": 1100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.31,
13
+ "grad_norm": 4.336536407470703,
14
+ "learning_rate": 9.999765308867361e-05,
15
+ "loss": 0.8247,
16
  "step": 100
17
  },
18
  {
19
  "epoch": 0.31,
20
+ "eval_accuracy": 0.7808599167822469,
21
+ "eval_f1": 0.7543146399483164,
22
+ "eval_loss": 0.6282410025596619,
23
+ "eval_precision": 0.761734030016078,
24
+ "eval_recall": 0.7808599167822469,
25
+ "eval_runtime": 37.9446,
26
+ "eval_samples_per_second": 76.006,
27
+ "eval_steps_per_second": 9.514,
28
  "step": 100
29
  },
30
  {
31
  "epoch": 0.62,
32
+ "grad_norm": 6.528007507324219,
33
+ "learning_rate": 9.999051751609367e-05,
34
+ "loss": 0.6235,
35
  "step": 200
36
  },
37
  {
38
  "epoch": 0.62,
39
+ "eval_accuracy": 0.7510402219140083,
40
+ "eval_f1": 0.6980793391075255,
41
+ "eval_loss": 0.7094237208366394,
42
+ "eval_precision": 0.7832859172651316,
43
+ "eval_recall": 0.7510402219140083,
44
+ "eval_runtime": 38.1666,
45
+ "eval_samples_per_second": 75.564,
46
+ "eval_steps_per_second": 9.459,
47
  "step": 200
48
  },
49
  {
50
  "epoch": 0.93,
51
+ "grad_norm": 7.167332649230957,
52
  "learning_rate": 9.997859372626506e-05,
53
+ "loss": 0.5888,
54
  "step": 300
55
  },
56
  {
57
  "epoch": 0.93,
58
+ "eval_accuracy": 0.7402912621359223,
59
+ "eval_f1": 0.7507721767549878,
60
+ "eval_loss": 0.687461793422699,
61
+ "eval_precision": 0.7995575456891281,
62
+ "eval_recall": 0.7402912621359223,
63
+ "eval_runtime": 38.3771,
64
+ "eval_samples_per_second": 75.149,
65
+ "eval_steps_per_second": 9.407,
66
  "step": 300
67
  },
68
  {
69
  "epoch": 1.25,
70
+ "grad_norm": 2.4604434967041016,
71
  "learning_rate": 9.996188286127832e-05,
72
+ "loss": 0.454,
73
  "step": 400
74
  },
75
  {
76
  "epoch": 1.25,
77
+ "eval_accuracy": 0.7739251040221914,
78
+ "eval_f1": 0.7841730444076129,
79
+ "eval_loss": 0.6142727136611938,
80
+ "eval_precision": 0.8039138713400071,
81
+ "eval_recall": 0.7739251040221914,
82
+ "eval_runtime": 38.6976,
83
+ "eval_samples_per_second": 74.527,
84
+ "eval_steps_per_second": 9.329,
85
  "step": 400
86
  },
87
  {
88
  "epoch": 1.56,
89
+ "grad_norm": 2.9993300437927246,
90
  "learning_rate": 9.994038652174203e-05,
91
+ "loss": 0.4104,
92
  "step": 500
93
  },
94
  {
95
  "epoch": 1.56,
96
+ "eval_accuracy": 0.808252427184466,
97
+ "eval_f1": 0.7911353922443626,
98
+ "eval_loss": 0.5673110485076904,
99
+ "eval_precision": 0.8033716514082728,
100
+ "eval_recall": 0.808252427184466,
101
+ "eval_runtime": 38.598,
102
+ "eval_samples_per_second": 74.719,
103
+ "eval_steps_per_second": 9.353,
104
  "step": 500
105
  },
106
  {
107
  "epoch": 1.87,
108
+ "grad_norm": 3.316398859024048,
109
  "learning_rate": 9.991410676662952e-05,
110
+ "loss": 0.4039,
111
  "step": 600
112
  },
113
  {
114
  "epoch": 1.87,
115
+ "eval_accuracy": 0.8280166435506241,
116
+ "eval_f1": 0.8272377870020207,
117
+ "eval_loss": 0.5172362923622131,
118
+ "eval_precision": 0.838315056266821,
119
+ "eval_recall": 0.8280166435506241,
120
+ "eval_runtime": 38.241,
121
+ "eval_samples_per_second": 75.416,
122
+ "eval_steps_per_second": 9.44,
123
  "step": 600
124
  },
125
  {
126
  "epoch": 2.18,
127
+ "grad_norm": 3.1912124156951904,
128
  "learning_rate": 9.988304611308174e-05,
129
+ "loss": 0.2785,
130
  "step": 700
131
  },
132
  {
133
  "epoch": 2.18,
134
+ "eval_accuracy": 0.826629680998613,
135
+ "eval_f1": 0.8306324023780052,
136
+ "eval_loss": 0.563904345035553,
137
+ "eval_precision": 0.8424957959799085,
138
+ "eval_recall": 0.826629680998613,
139
+ "eval_runtime": 38.3845,
140
+ "eval_samples_per_second": 75.134,
141
+ "eval_steps_per_second": 9.405,
142
  "step": 700
143
  },
144
  {
145
+ "epoch": 2.49,
146
+ "grad_norm": 2.378309965133667,
147
+ "learning_rate": 9.984720753616604e-05,
148
+ "loss": 0.2744,
149
+ "step": 800
150
+ },
151
+ {
152
+ "epoch": 2.49,
153
+ "eval_accuracy": 0.8273231622746186,
154
+ "eval_f1": 0.822737257017553,
155
+ "eval_loss": 0.4886268079280853,
156
+ "eval_precision": 0.8287258592840144,
157
+ "eval_recall": 0.8273231622746186,
158
+ "eval_runtime": 38.1003,
159
+ "eval_samples_per_second": 75.695,
160
+ "eval_steps_per_second": 9.475,
161
+ "step": 800
162
+ },
163
+ {
164
+ "epoch": 2.8,
165
+ "grad_norm": 5.579433441162109,
166
+ "learning_rate": 9.980659446859127e-05,
167
+ "loss": 0.2545,
168
+ "step": 900
169
+ },
170
+ {
171
+ "epoch": 2.8,
172
+ "eval_accuracy": 0.8495145631067961,
173
+ "eval_f1": 0.8472903587104604,
174
+ "eval_loss": 0.4898224472999573,
175
+ "eval_precision": 0.8510030222503284,
176
+ "eval_recall": 0.8495145631067961,
177
+ "eval_runtime": 38.8455,
178
+ "eval_samples_per_second": 74.243,
179
+ "eval_steps_per_second": 9.293,
180
+ "step": 900
181
+ },
182
+ {
183
+ "epoch": 3.12,
184
+ "grad_norm": 3.6288774013519287,
185
+ "learning_rate": 9.976121080037899e-05,
186
+ "loss": 0.2197,
187
+ "step": 1000
188
+ },
189
+ {
190
+ "epoch": 3.12,
191
+ "eval_accuracy": 0.8574895977808599,
192
+ "eval_f1": 0.8550066256842739,
193
+ "eval_loss": 0.5342256426811218,
194
+ "eval_precision": 0.8561255195381418,
195
+ "eval_recall": 0.8574895977808599,
196
+ "eval_runtime": 39.0507,
197
+ "eval_samples_per_second": 73.853,
198
+ "eval_steps_per_second": 9.244,
199
+ "step": 1000
200
+ },
201
+ {
202
+ "epoch": 3.43,
203
+ "grad_norm": 9.022770881652832,
204
+ "learning_rate": 9.971106087849084e-05,
205
+ "loss": 0.1321,
206
+ "step": 1100
207
+ },
208
+ {
209
+ "epoch": 3.43,
210
+ "eval_accuracy": 0.8321775312066574,
211
+ "eval_f1": 0.822903478849272,
212
+ "eval_loss": 0.6799635291099548,
213
+ "eval_precision": 0.8329985305708512,
214
+ "eval_recall": 0.8321775312066574,
215
+ "eval_runtime": 38.5736,
216
+ "eval_samples_per_second": 74.766,
217
+ "eval_steps_per_second": 9.359,
218
+ "step": 1100
219
+ },
220
+ {
221
+ "epoch": 3.43,
222
+ "step": 1100,
223
+ "total_flos": 1.362060245306622e+18,
224
+ "train_loss": 0.40586378964510833,
225
+ "train_runtime": 828.4507,
226
+ "train_samples_per_second": 618.987,
227
+ "train_steps_per_second": 38.747
228
  }
229
  ],
230
  "logging_steps": 100,
 
232
  "num_input_tokens_seen": 0,
233
  "num_train_epochs": 100,
234
  "save_steps": 100,
235
+ "total_flos": 1.362060245306622e+18,
236
  "train_batch_size": 16,
237
  "trial_name": null,
238
  "trial_params": null