amjadfqs commited on
Commit
6586016
1 Parent(s): c99754d

Model save

Browse files
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.87,
3
+ "total_flos": 5.909979961466413e+18,
4
+ "train_loss": 0.1843041891330167,
5
+ "train_runtime": 18944.3436,
6
+ "train_samples_per_second": 4.031,
7
+ "train_steps_per_second": 0.01
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2586a9936c56271a65b005abc1e0334277c90f78fe6725d8b9c8bb026908dda
3
  size 347601681
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:802f41e0e5e8ba008457280ba3be6af3aa7fd045963b2b3f6bac8150895faad5
3
  size 347601681
runs/May26_07-29-52_project/events.out.tfevents.1685086204.project.117489.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40c8165ccdb693d9bf07b64740234a80a155fa4bb1a0712fc878586541d12636
3
- size 11809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:424a84e20e937e6fab4cb24cab8223e99fdfaf4d59a5594e377480bc6a78180e
3
+ size 12163
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.87,
3
+ "total_flos": 5.909979961466413e+18,
4
+ "train_loss": 0.1843041891330167,
5
+ "train_runtime": 18944.3436,
6
+ "train_samples_per_second": 4.031,
7
+ "train_steps_per_second": 0.01
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,249 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9650432050274941,
3
+ "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-finetuned-brain-tumor-final_08/checkpoint-154",
4
+ "epoch": 9.87012987012987,
5
+ "global_step": 190,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.52,
12
+ "learning_rate": 2.6315789473684212e-05,
13
+ "loss": 1.2882,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.99,
18
+ "eval_accuracy": 0.7961508248232522,
19
+ "eval_f1_score": 0.7862764915452001,
20
+ "eval_loss": 0.5468631982803345,
21
+ "eval_precision": 0.807682539972508,
22
+ "eval_runtime": 146.6896,
23
+ "eval_samples_per_second": 17.356,
24
+ "eval_steps_per_second": 0.177,
25
+ "step": 19
26
+ },
27
+ {
28
+ "epoch": 1.04,
29
+ "learning_rate": 4.970760233918128e-05,
30
+ "loss": 0.7346,
31
+ "step": 20
32
+ },
33
+ {
34
+ "epoch": 1.56,
35
+ "learning_rate": 4.678362573099415e-05,
36
+ "loss": 0.3491,
37
+ "step": 30
38
+ },
39
+ {
40
+ "epoch": 1.97,
41
+ "eval_accuracy": 0.8860958366064414,
42
+ "eval_f1_score": 0.8877831452046004,
43
+ "eval_loss": 0.3029632568359375,
44
+ "eval_precision": 0.8981099107198931,
45
+ "eval_runtime": 142.8458,
46
+ "eval_samples_per_second": 17.823,
47
+ "eval_steps_per_second": 0.182,
48
+ "step": 38
49
+ },
50
+ {
51
+ "epoch": 2.08,
52
+ "learning_rate": 4.3859649122807014e-05,
53
+ "loss": 0.2344,
54
+ "step": 40
55
+ },
56
+ {
57
+ "epoch": 2.6,
58
+ "learning_rate": 4.093567251461988e-05,
59
+ "loss": 0.1791,
60
+ "step": 50
61
+ },
62
+ {
63
+ "epoch": 2.96,
64
+ "eval_accuracy": 0.9210526315789473,
65
+ "eval_f1_score": 0.9229181063056022,
66
+ "eval_loss": 0.2076900452375412,
67
+ "eval_precision": 0.9307481907300132,
68
+ "eval_runtime": 146.5105,
69
+ "eval_samples_per_second": 17.378,
70
+ "eval_steps_per_second": 0.177,
71
+ "step": 57
72
+ },
73
+ {
74
+ "epoch": 3.12,
75
+ "learning_rate": 3.8011695906432746e-05,
76
+ "loss": 0.1365,
77
+ "step": 60
78
+ },
79
+ {
80
+ "epoch": 3.64,
81
+ "learning_rate": 3.508771929824561e-05,
82
+ "loss": 0.122,
83
+ "step": 70
84
+ },
85
+ {
86
+ "epoch": 4.0,
87
+ "eval_accuracy": 0.9253731343283582,
88
+ "eval_f1_score": 0.9271544463725769,
89
+ "eval_loss": 0.20073173940181732,
90
+ "eval_precision": 0.936852899850916,
91
+ "eval_runtime": 143.3187,
92
+ "eval_samples_per_second": 17.765,
93
+ "eval_steps_per_second": 0.181,
94
+ "step": 77
95
+ },
96
+ {
97
+ "epoch": 4.16,
98
+ "learning_rate": 3.216374269005848e-05,
99
+ "loss": 0.084,
100
+ "step": 80
101
+ },
102
+ {
103
+ "epoch": 4.68,
104
+ "learning_rate": 2.9239766081871346e-05,
105
+ "loss": 0.0671,
106
+ "step": 90
107
+ },
108
+ {
109
+ "epoch": 4.99,
110
+ "eval_accuracy": 0.9269442262372348,
111
+ "eval_f1_score": 0.9294001146483667,
112
+ "eval_loss": 0.20734713971614838,
113
+ "eval_precision": 0.9400926555225891,
114
+ "eval_runtime": 150.1774,
115
+ "eval_samples_per_second": 16.953,
116
+ "eval_steps_per_second": 0.173,
117
+ "step": 96
118
+ },
119
+ {
120
+ "epoch": 5.19,
121
+ "learning_rate": 2.6315789473684212e-05,
122
+ "loss": 0.0545,
123
+ "step": 100
124
+ },
125
+ {
126
+ "epoch": 5.71,
127
+ "learning_rate": 2.3391812865497074e-05,
128
+ "loss": 0.0474,
129
+ "step": 110
130
+ },
131
+ {
132
+ "epoch": 5.97,
133
+ "eval_accuracy": 0.9481539670070699,
134
+ "eval_f1_score": 0.9493645555588069,
135
+ "eval_loss": 0.13840945065021515,
136
+ "eval_precision": 0.9547416860173351,
137
+ "eval_runtime": 148.6502,
138
+ "eval_samples_per_second": 17.127,
139
+ "eval_steps_per_second": 0.175,
140
+ "step": 115
141
+ },
142
+ {
143
+ "epoch": 6.23,
144
+ "learning_rate": 2.046783625730994e-05,
145
+ "loss": 0.0359,
146
+ "step": 120
147
+ },
148
+ {
149
+ "epoch": 6.75,
150
+ "learning_rate": 1.7543859649122806e-05,
151
+ "loss": 0.032,
152
+ "step": 130
153
+ },
154
+ {
155
+ "epoch": 6.96,
156
+ "eval_accuracy": 0.9430479183032208,
157
+ "eval_f1_score": 0.9447208627751791,
158
+ "eval_loss": 0.1683335155248642,
159
+ "eval_precision": 0.9510759669338126,
160
+ "eval_runtime": 146.9976,
161
+ "eval_samples_per_second": 17.32,
162
+ "eval_steps_per_second": 0.177,
163
+ "step": 134
164
+ },
165
+ {
166
+ "epoch": 7.27,
167
+ "learning_rate": 1.4619883040935673e-05,
168
+ "loss": 0.0284,
169
+ "step": 140
170
+ },
171
+ {
172
+ "epoch": 7.79,
173
+ "learning_rate": 1.1695906432748537e-05,
174
+ "loss": 0.0225,
175
+ "step": 150
176
+ },
177
+ {
178
+ "epoch": 8.0,
179
+ "eval_accuracy": 0.9650432050274941,
180
+ "eval_f1_score": 0.9657333174830298,
181
+ "eval_loss": 0.11006712168455124,
182
+ "eval_precision": 0.9671471415955248,
183
+ "eval_runtime": 144.8303,
184
+ "eval_samples_per_second": 17.579,
185
+ "eval_steps_per_second": 0.18,
186
+ "step": 154
187
+ },
188
+ {
189
+ "epoch": 8.31,
190
+ "learning_rate": 8.771929824561403e-06,
191
+ "loss": 0.0299,
192
+ "step": 160
193
+ },
194
+ {
195
+ "epoch": 8.83,
196
+ "learning_rate": 5.8479532163742686e-06,
197
+ "loss": 0.0193,
198
+ "step": 170
199
+ },
200
+ {
201
+ "epoch": 8.99,
202
+ "eval_accuracy": 0.9532600157109191,
203
+ "eval_f1_score": 0.9543637358051864,
204
+ "eval_loss": 0.13721555471420288,
205
+ "eval_precision": 0.9584728079885907,
206
+ "eval_runtime": 148.8815,
207
+ "eval_samples_per_second": 17.101,
208
+ "eval_steps_per_second": 0.175,
209
+ "step": 173
210
+ },
211
+ {
212
+ "epoch": 9.35,
213
+ "learning_rate": 2.9239766081871343e-06,
214
+ "loss": 0.0175,
215
+ "step": 180
216
+ },
217
+ {
218
+ "epoch": 9.87,
219
+ "learning_rate": 0.0,
220
+ "loss": 0.0193,
221
+ "step": 190
222
+ },
223
+ {
224
+ "epoch": 9.87,
225
+ "eval_accuracy": 0.9591516103692066,
226
+ "eval_f1_score": 0.9600211574702097,
227
+ "eval_loss": 0.12095439434051514,
228
+ "eval_precision": 0.9627515459909033,
229
+ "eval_runtime": 143.4592,
230
+ "eval_samples_per_second": 17.747,
231
+ "eval_steps_per_second": 0.181,
232
+ "step": 190
233
+ },
234
+ {
235
+ "epoch": 9.87,
236
+ "step": 190,
237
+ "total_flos": 5.909979961466413e+18,
238
+ "train_loss": 0.1843041891330167,
239
+ "train_runtime": 18944.3436,
240
+ "train_samples_per_second": 4.031,
241
+ "train_steps_per_second": 0.01
242
+ }
243
+ ],
244
+ "max_steps": 190,
245
+ "num_train_epochs": 10,
246
+ "total_flos": 5.909979961466413e+18,
247
+ "trial_name": null,
248
+ "trial_params": null
249
+ }