suredream committed on
Commit
e4486b5
1 Parent(s): 6bf84a8

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.9691358024691358,
4
- "eval_loss": 0.08843858540058136,
5
- "eval_runtime": 4.5137,
6
- "eval_samples_per_second": 358.903,
7
- "eval_steps_per_second": 11.299,
8
- "total_flos": 1.0874439903456461e+18,
9
- "train_loss": 0.41079250579340415,
10
- "train_runtime": 248.8888,
11
- "train_samples_per_second": 175.741,
12
- "train_steps_per_second": 1.374
13
  }
 
1
  {
2
+ "epoch": 2.9822485207100593,
3
+ "eval_accuracy": 0.9755555555555555,
4
+ "eval_loss": 0.07779138535261154,
5
+ "eval_runtime": 33.0348,
6
+ "eval_samples_per_second": 163.464,
7
+ "eval_steps_per_second": 5.116,
8
+ "total_flos": 1.2017076524313477e+18,
9
+ "train_loss": 0.406993343716576,
10
+ "train_runtime": 795.2889,
11
+ "train_samples_per_second": 61.11,
12
+ "train_steps_per_second": 0.475
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.9691358024691358,
4
- "eval_loss": 0.08843858540058136,
5
- "eval_runtime": 4.5137,
6
- "eval_samples_per_second": 358.903,
7
- "eval_steps_per_second": 11.299
8
  }
 
1
  {
2
+ "epoch": 2.9822485207100593,
3
+ "eval_accuracy": 0.9755555555555555,
4
+ "eval_loss": 0.07779138535261154,
5
+ "eval_runtime": 33.0348,
6
+ "eval_samples_per_second": 163.464,
7
+ "eval_steps_per_second": 5.116
8
  }
runs/Jul05_18-22-56_65d164acd7e3/events.out.tfevents.1720204611.65d164acd7e3.2983.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:255a6348cd216dcaffd87f0a28ca565355276a1404e133dbfb8bf9eec6a3830e
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 1.0874439903456461e+18,
4
- "train_loss": 0.41079250579340415,
5
- "train_runtime": 248.8888,
6
- "train_samples_per_second": 175.741,
7
- "train_steps_per_second": 1.374
8
  }
 
1
  {
2
+ "epoch": 2.9822485207100593,
3
+ "total_flos": 1.2017076524313477e+18,
4
+ "train_loss": 0.406993343716576,
5
+ "train_runtime": 795.2889,
6
+ "train_samples_per_second": 61.11,
7
+ "train_steps_per_second": 0.475
8
  }
trainer_state.json CHANGED
@@ -1,290 +1,311 @@
1
  {
2
- "best_metric": 0.9691358024691358,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-342",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 342,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.08771929824561403,
13
- "grad_norm": 4.784806251525879,
14
- "learning_rate": 1.4285714285714285e-05,
15
- "loss": 2.2537,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.17543859649122806,
20
- "grad_norm": 7.325711727142334,
21
- "learning_rate": 2.857142857142857e-05,
22
- "loss": 1.9328,
23
  "step": 20
24
  },
25
  {
26
- "epoch": 0.2631578947368421,
27
- "grad_norm": 12.205706596374512,
28
- "learning_rate": 4.2857142857142856e-05,
29
- "loss": 1.3033,
30
  "step": 30
31
  },
32
  {
33
- "epoch": 0.3508771929824561,
34
- "grad_norm": 21.546316146850586,
35
- "learning_rate": 4.9185667752443e-05,
36
- "loss": 0.7435,
37
  "step": 40
38
  },
39
  {
40
- "epoch": 0.43859649122807015,
41
- "grad_norm": 11.416431427001953,
42
- "learning_rate": 4.755700325732899e-05,
43
- "loss": 0.5723,
44
  "step": 50
45
  },
46
  {
47
- "epoch": 0.5263157894736842,
48
- "grad_norm": 13.339532852172852,
49
- "learning_rate": 4.592833876221499e-05,
50
- "loss": 0.4688,
51
  "step": 60
52
  },
53
  {
54
- "epoch": 0.6140350877192983,
55
- "grad_norm": 18.226308822631836,
56
- "learning_rate": 4.429967426710098e-05,
57
- "loss": 0.4296,
58
  "step": 70
59
  },
60
  {
61
- "epoch": 0.7017543859649122,
62
- "grad_norm": 24.142580032348633,
63
- "learning_rate": 4.2671009771986977e-05,
64
- "loss": 0.3557,
65
  "step": 80
66
  },
67
  {
68
- "epoch": 0.7894736842105263,
69
- "grad_norm": 18.747182846069336,
70
- "learning_rate": 4.104234527687297e-05,
71
- "loss": 0.3364,
72
  "step": 90
73
  },
74
  {
75
- "epoch": 0.8771929824561403,
76
- "grad_norm": 9.604598999023438,
77
- "learning_rate": 3.941368078175896e-05,
78
- "loss": 0.379,
79
  "step": 100
80
  },
81
  {
82
- "epoch": 0.9649122807017544,
83
- "grad_norm": 9.6405668258667,
84
- "learning_rate": 3.778501628664495e-05,
85
- "loss": 0.2967,
86
  "step": 110
87
  },
88
  {
89
- "epoch": 1.0,
90
- "eval_accuracy": 0.9271604938271605,
91
- "eval_loss": 0.20734398066997528,
92
- "eval_runtime": 4.5343,
93
- "eval_samples_per_second": 357.28,
94
- "eval_steps_per_second": 11.248,
95
- "step": 114
96
  },
97
  {
98
- "epoch": 1.0526315789473684,
99
- "grad_norm": 10.606453895568848,
100
- "learning_rate": 3.615635179153095e-05,
101
- "loss": 0.2506,
102
- "step": 120
 
 
103
  },
104
  {
105
- "epoch": 1.1403508771929824,
106
- "grad_norm": 13.219770431518555,
107
- "learning_rate": 3.452768729641694e-05,
108
- "loss": 0.2646,
109
  "step": 130
110
  },
111
  {
112
- "epoch": 1.2280701754385965,
113
- "grad_norm": 14.424461364746094,
114
- "learning_rate": 3.289902280130293e-05,
115
- "loss": 0.3161,
116
  "step": 140
117
  },
118
  {
119
- "epoch": 1.3157894736842106,
120
- "grad_norm": 16.468141555786133,
121
- "learning_rate": 3.127035830618892e-05,
122
- "loss": 0.2296,
123
  "step": 150
124
  },
125
  {
126
- "epoch": 1.4035087719298245,
127
- "grad_norm": 18.474872589111328,
128
- "learning_rate": 2.9641693811074923e-05,
129
- "loss": 0.252,
130
  "step": 160
131
  },
132
  {
133
- "epoch": 1.4912280701754386,
134
- "grad_norm": 8.512451171875,
135
- "learning_rate": 2.8013029315960915e-05,
136
- "loss": 0.2526,
137
  "step": 170
138
  },
139
  {
140
- "epoch": 1.5789473684210527,
141
- "grad_norm": 10.639461517333984,
142
- "learning_rate": 2.6384364820846906e-05,
143
- "loss": 0.2218,
144
  "step": 180
145
  },
146
  {
147
- "epoch": 1.6666666666666665,
148
- "grad_norm": 10.84925651550293,
149
- "learning_rate": 2.47557003257329e-05,
150
- "loss": 0.2246,
151
  "step": 190
152
  },
153
  {
154
- "epoch": 1.7543859649122808,
155
- "grad_norm": 7.055878162384033,
156
- "learning_rate": 2.3127035830618892e-05,
157
- "loss": 0.2181,
158
  "step": 200
159
  },
160
  {
161
- "epoch": 1.8421052631578947,
162
- "grad_norm": 10.151970863342285,
163
- "learning_rate": 2.149837133550489e-05,
164
- "loss": 0.2336,
165
  "step": 210
166
  },
167
  {
168
- "epoch": 1.9298245614035088,
169
- "grad_norm": 10.90556812286377,
170
- "learning_rate": 1.986970684039088e-05,
171
- "loss": 0.2175,
172
  "step": 220
173
  },
174
  {
175
- "epoch": 2.0,
176
- "eval_accuracy": 0.9617283950617284,
177
- "eval_loss": 0.1142377108335495,
178
- "eval_runtime": 4.4649,
179
- "eval_samples_per_second": 362.828,
180
- "eval_steps_per_second": 11.422,
181
- "step": 228
182
- },
183
- {
184
- "epoch": 2.017543859649123,
185
- "grad_norm": 7.411689281463623,
186
- "learning_rate": 1.8241042345276872e-05,
187
- "loss": 0.2493,
188
  "step": 230
189
  },
190
  {
191
- "epoch": 2.1052631578947367,
192
- "grad_norm": 6.981323719024658,
193
- "learning_rate": 1.6612377850162867e-05,
194
- "loss": 0.1832,
195
  "step": 240
196
  },
197
  {
198
- "epoch": 2.192982456140351,
199
- "grad_norm": 17.770326614379883,
200
- "learning_rate": 1.4983713355048862e-05,
201
- "loss": 0.1862,
202
  "step": 250
203
  },
204
  {
205
- "epoch": 2.280701754385965,
206
- "grad_norm": 14.688613891601562,
207
- "learning_rate": 1.3355048859934855e-05,
208
- "loss": 0.1725,
 
 
 
 
 
 
 
 
 
209
  "step": 260
210
  },
211
  {
212
- "epoch": 2.3684210526315788,
213
- "grad_norm": 9.546713829040527,
214
- "learning_rate": 1.1726384364820847e-05,
215
- "loss": 0.2187,
216
  "step": 270
217
  },
218
  {
219
- "epoch": 2.456140350877193,
220
- "grad_norm": 13.742387771606445,
221
- "learning_rate": 1.009771986970684e-05,
222
- "loss": 0.211,
223
  "step": 280
224
  },
225
  {
226
- "epoch": 2.543859649122807,
227
- "grad_norm": 10.309969902038574,
228
- "learning_rate": 8.469055374592833e-06,
229
- "loss": 0.1776,
230
  "step": 290
231
  },
232
  {
233
- "epoch": 2.6315789473684212,
234
- "grad_norm": 11.343367576599121,
235
- "learning_rate": 6.840390879478828e-06,
236
- "loss": 0.1828,
237
  "step": 300
238
  },
239
  {
240
- "epoch": 2.719298245614035,
241
- "grad_norm": 12.15509033203125,
242
- "learning_rate": 5.211726384364822e-06,
243
- "loss": 0.1565,
244
  "step": 310
245
  },
246
  {
247
- "epoch": 2.807017543859649,
248
- "grad_norm": 13.258170127868652,
249
- "learning_rate": 3.5830618892508147e-06,
250
- "loss": 0.1601,
251
  "step": 320
252
  },
253
  {
254
- "epoch": 2.8947368421052633,
255
- "grad_norm": 13.760292053222656,
256
- "learning_rate": 1.9543973941368076e-06,
257
- "loss": 0.1777,
258
  "step": 330
259
  },
260
  {
261
- "epoch": 2.982456140350877,
262
- "grad_norm": 10.578232765197754,
263
- "learning_rate": 3.2573289902280136e-07,
264
- "loss": 0.1881,
265
  "step": 340
266
  },
267
  {
268
- "epoch": 3.0,
269
- "eval_accuracy": 0.9691358024691358,
270
- "eval_loss": 0.08843858540058136,
271
- "eval_runtime": 4.4533,
272
- "eval_samples_per_second": 363.776,
273
- "eval_steps_per_second": 11.452,
274
- "step": 342
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
275
  },
276
  {
277
- "epoch": 3.0,
278
- "step": 342,
279
- "total_flos": 1.0874439903456461e+18,
280
- "train_loss": 0.41079250579340415,
281
- "train_runtime": 248.8888,
282
- "train_samples_per_second": 175.741,
283
- "train_steps_per_second": 1.374
284
  }
285
  ],
286
  "logging_steps": 10,
287
- "max_steps": 342,
288
  "num_input_tokens_seen": 0,
289
  "num_train_epochs": 3,
290
  "save_steps": 500,
@@ -300,7 +321,7 @@
300
  "attributes": {}
301
  }
302
  },
303
- "total_flos": 1.0874439903456461e+18,
304
  "train_batch_size": 32,
305
  "trial_name": null,
306
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9755555555555555,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-378",
4
+ "epoch": 2.9822485207100593,
5
  "eval_steps": 500,
6
+ "global_step": 378,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.07889546351084813,
13
+ "grad_norm": 4.885411262512207,
14
+ "learning_rate": 1.3157894736842106e-05,
15
+ "loss": 2.2985,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.15779092702169625,
20
+ "grad_norm": 6.575764179229736,
21
+ "learning_rate": 2.6315789473684212e-05,
22
+ "loss": 2.0642,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 0.23668639053254437,
27
+ "grad_norm": 8.125149726867676,
28
+ "learning_rate": 3.9473684210526316e-05,
29
+ "loss": 1.5012,
30
  "step": 30
31
  },
32
  {
33
+ "epoch": 0.3155818540433925,
34
+ "grad_norm": 11.912463188171387,
35
+ "learning_rate": 4.970588235294118e-05,
36
+ "loss": 0.8692,
37
  "step": 40
38
  },
39
  {
40
+ "epoch": 0.39447731755424065,
41
+ "grad_norm": 15.561235427856445,
42
+ "learning_rate": 4.823529411764706e-05,
43
+ "loss": 0.6062,
44
  "step": 50
45
  },
46
  {
47
+ "epoch": 0.47337278106508873,
48
+ "grad_norm": 22.308109283447266,
49
+ "learning_rate": 4.6764705882352944e-05,
50
+ "loss": 0.4878,
51
  "step": 60
52
  },
53
  {
54
+ "epoch": 0.5522682445759369,
55
+ "grad_norm": 16.376893997192383,
56
+ "learning_rate": 4.5294117647058826e-05,
57
+ "loss": 0.4598,
58
  "step": 70
59
  },
60
  {
61
+ "epoch": 0.631163708086785,
62
+ "grad_norm": 20.709991455078125,
63
+ "learning_rate": 4.382352941176471e-05,
64
+ "loss": 0.3735,
65
  "step": 80
66
  },
67
  {
68
+ "epoch": 0.7100591715976331,
69
+ "grad_norm": 19.054445266723633,
70
+ "learning_rate": 4.235294117647059e-05,
71
+ "loss": 0.4128,
72
  "step": 90
73
  },
74
  {
75
+ "epoch": 0.7889546351084813,
76
+ "grad_norm": 10.85267162322998,
77
+ "learning_rate": 4.0882352941176474e-05,
78
+ "loss": 0.3343,
79
  "step": 100
80
  },
81
  {
82
+ "epoch": 0.8678500986193294,
83
+ "grad_norm": 12.394430160522461,
84
+ "learning_rate": 3.9411764705882356e-05,
85
+ "loss": 0.3172,
86
  "step": 110
87
  },
88
  {
89
+ "epoch": 0.9467455621301775,
90
+ "grad_norm": 13.280746459960938,
91
+ "learning_rate": 3.794117647058824e-05,
92
+ "loss": 0.2875,
93
+ "step": 120
 
 
94
  },
95
  {
96
+ "epoch": 0.9940828402366864,
97
+ "eval_accuracy": 0.9516666666666667,
98
+ "eval_loss": 0.15403828024864197,
99
+ "eval_runtime": 32.6659,
100
+ "eval_samples_per_second": 165.31,
101
+ "eval_steps_per_second": 5.174,
102
+ "step": 126
103
  },
104
  {
105
+ "epoch": 1.0256410256410255,
106
+ "grad_norm": 11.388362884521484,
107
+ "learning_rate": 3.6470588235294114e-05,
108
+ "loss": 0.2601,
109
  "step": 130
110
  },
111
  {
112
+ "epoch": 1.1045364891518739,
113
+ "grad_norm": 21.39406394958496,
114
+ "learning_rate": 3.5e-05,
115
+ "loss": 0.287,
116
  "step": 140
117
  },
118
  {
119
+ "epoch": 1.183431952662722,
120
+ "grad_norm": 14.232524871826172,
121
+ "learning_rate": 3.352941176470588e-05,
122
+ "loss": 0.2604,
123
  "step": 150
124
  },
125
  {
126
+ "epoch": 1.26232741617357,
127
+ "grad_norm": 9.439920425415039,
128
+ "learning_rate": 3.205882352941177e-05,
129
+ "loss": 0.2563,
130
  "step": 160
131
  },
132
  {
133
+ "epoch": 1.3412228796844181,
134
+ "grad_norm": 22.91378402709961,
135
+ "learning_rate": 3.058823529411765e-05,
136
+ "loss": 0.2376,
137
  "step": 170
138
  },
139
  {
140
+ "epoch": 1.4201183431952662,
141
+ "grad_norm": 26.201648712158203,
142
+ "learning_rate": 2.9117647058823534e-05,
143
+ "loss": 0.2354,
144
  "step": 180
145
  },
146
  {
147
+ "epoch": 1.4990138067061145,
148
+ "grad_norm": 11.116905212402344,
149
+ "learning_rate": 2.7647058823529416e-05,
150
+ "loss": 0.2424,
151
  "step": 190
152
  },
153
  {
154
+ "epoch": 1.5779092702169626,
155
+ "grad_norm": 9.413314819335938,
156
+ "learning_rate": 2.6176470588235295e-05,
157
+ "loss": 0.2572,
158
  "step": 200
159
  },
160
  {
161
+ "epoch": 1.6568047337278107,
162
+ "grad_norm": 11.392881393432617,
163
+ "learning_rate": 2.4705882352941178e-05,
164
+ "loss": 0.227,
165
  "step": 210
166
  },
167
  {
168
+ "epoch": 1.7357001972386588,
169
+ "grad_norm": 8.600625038146973,
170
+ "learning_rate": 2.323529411764706e-05,
171
+ "loss": 0.2078,
172
  "step": 220
173
  },
174
  {
175
+ "epoch": 1.8145956607495068,
176
+ "grad_norm": 11.280962944030762,
177
+ "learning_rate": 2.1764705882352943e-05,
178
+ "loss": 0.2259,
 
 
 
 
 
 
 
 
 
179
  "step": 230
180
  },
181
  {
182
+ "epoch": 1.893491124260355,
183
+ "grad_norm": 5.870893955230713,
184
+ "learning_rate": 2.0294117647058825e-05,
185
+ "loss": 0.1989,
186
  "step": 240
187
  },
188
  {
189
+ "epoch": 1.972386587771203,
190
+ "grad_norm": 12.228656768798828,
191
+ "learning_rate": 1.8823529411764708e-05,
192
+ "loss": 0.2201,
193
  "step": 250
194
  },
195
  {
196
+ "epoch": 1.9960552268244576,
197
+ "eval_accuracy": 0.975,
198
+ "eval_loss": 0.08536241203546524,
199
+ "eval_runtime": 32.8385,
200
+ "eval_samples_per_second": 164.441,
201
+ "eval_steps_per_second": 5.146,
202
+ "step": 253
203
+ },
204
+ {
205
+ "epoch": 2.051282051282051,
206
+ "grad_norm": 7.734664440155029,
207
+ "learning_rate": 1.735294117647059e-05,
208
+ "loss": 0.1785,
209
  "step": 260
210
  },
211
  {
212
+ "epoch": 2.1301775147928996,
213
+ "grad_norm": 13.498882293701172,
214
+ "learning_rate": 1.588235294117647e-05,
215
+ "loss": 0.2043,
216
  "step": 270
217
  },
218
  {
219
+ "epoch": 2.2090729783037477,
220
+ "grad_norm": 11.542675971984863,
221
+ "learning_rate": 1.4411764705882352e-05,
222
+ "loss": 0.1842,
223
  "step": 280
224
  },
225
  {
226
+ "epoch": 2.287968441814596,
227
+ "grad_norm": 10.036293029785156,
228
+ "learning_rate": 1.2941176470588238e-05,
229
+ "loss": 0.1996,
230
  "step": 290
231
  },
232
  {
233
+ "epoch": 2.366863905325444,
234
+ "grad_norm": 8.317439079284668,
235
+ "learning_rate": 1.1470588235294118e-05,
236
+ "loss": 0.1573,
237
  "step": 300
238
  },
239
  {
240
+ "epoch": 2.445759368836292,
241
+ "grad_norm": 6.859732627868652,
242
+ "learning_rate": 1e-05,
243
+ "loss": 0.1835,
244
  "step": 310
245
  },
246
  {
247
+ "epoch": 2.52465483234714,
248
+ "grad_norm": 13.328524589538574,
249
+ "learning_rate": 8.529411764705883e-06,
250
+ "loss": 0.187,
251
  "step": 320
252
  },
253
  {
254
+ "epoch": 2.603550295857988,
255
+ "grad_norm": 7.502381801605225,
256
+ "learning_rate": 7.058823529411765e-06,
257
+ "loss": 0.1502,
258
  "step": 330
259
  },
260
  {
261
+ "epoch": 2.6824457593688362,
262
+ "grad_norm": 14.761018753051758,
263
+ "learning_rate": 5.588235294117647e-06,
264
+ "loss": 0.193,
265
  "step": 340
266
  },
267
  {
268
+ "epoch": 2.7613412228796843,
269
+ "grad_norm": 10.346915245056152,
270
+ "learning_rate": 4.11764705882353e-06,
271
+ "loss": 0.1617,
272
+ "step": 350
273
+ },
274
+ {
275
+ "epoch": 2.8402366863905324,
276
+ "grad_norm": 12.84180736541748,
277
+ "learning_rate": 2.647058823529412e-06,
278
+ "loss": 0.1645,
279
+ "step": 360
280
+ },
281
+ {
282
+ "epoch": 2.9191321499013805,
283
+ "grad_norm": 7.301783561706543,
284
+ "learning_rate": 1.1764705882352942e-06,
285
+ "loss": 0.1714,
286
+ "step": 370
287
+ },
288
+ {
289
+ "epoch": 2.9822485207100593,
290
+ "eval_accuracy": 0.9755555555555555,
291
+ "eval_loss": 0.07779138535261154,
292
+ "eval_runtime": 33.1571,
293
+ "eval_samples_per_second": 162.861,
294
+ "eval_steps_per_second": 5.097,
295
+ "step": 378
296
  },
297
  {
298
+ "epoch": 2.9822485207100593,
299
+ "step": 378,
300
+ "total_flos": 1.2017076524313477e+18,
301
+ "train_loss": 0.406993343716576,
302
+ "train_runtime": 795.2889,
303
+ "train_samples_per_second": 61.11,
304
+ "train_steps_per_second": 0.475
305
  }
306
  ],
307
  "logging_steps": 10,
308
+ "max_steps": 378,
309
  "num_input_tokens_seen": 0,
310
  "num_train_epochs": 3,
311
  "save_steps": 500,
 
321
  "attributes": {}
322
  }
323
  },
324
+ "total_flos": 1.2017076524313477e+18,
325
  "train_batch_size": 32,
326
  "trial_name": null,
327
  "trial_params": null