AykeeSalazar commited on
Commit
1b0965a
1 Parent(s): e7a987e

Training in progress, step 100

Browse files
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 12.05,
3
+ "eval_accuracy": 0.8737166324435318,
4
+ "eval_loss": 0.36519739031791687,
5
+ "eval_runtime": 11.444,
6
+ "eval_samples_per_second": 170.221,
7
+ "eval_steps_per_second": 5.33,
8
+ "train_loss": 0.18408180872599283,
9
+ "train_runtime": 1888.403,
10
+ "train_samples_per_second": 841.24,
11
+ "train_steps_per_second": 26.371
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 12.05,
3
+ "eval_accuracy": 0.8737166324435318,
4
+ "eval_loss": 0.36519739031791687,
5
+ "eval_runtime": 11.444,
6
+ "eval_samples_per_second": 170.221,
7
+ "eval_steps_per_second": 5.33
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:069e2adc72867c50c005ebd0f9dad1ce0849301d0d5d936c3a187811bde41d55
3
  size 343270065
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab5bb37482625a42bff52434a68253cccf5ed30ac437ab5cdb8c12da546eea61
3
  size 343270065
runs/Jul28_09-14-53_bantai-X570S-AORUS-PRO-AX/events.out.tfevents.1658972954.bantai-X570S-AORUS-PRO-AX.16115.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e2edc164d9b0af2836516848af3292ff677fc20f7629fa3b6209e7ed21ce444
3
+ size 363
runs/Jul28_09-51-05_bantai-X570S-AORUS-PRO-AX/1658973073.0384011/events.out.tfevents.1658973073.bantai-X570S-AORUS-PRO-AX.20824.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f51af9733987f7ac7ae11d79610e7660f706c3a8d13b042fc9fea777121890ea
3
+ size 5407
runs/Jul28_09-51-05_bantai-X570S-AORUS-PRO-AX/events.out.tfevents.1658973073.bantai-X570S-AORUS-PRO-AX.20824.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2b9d942e52589320a9f9cb2643f835e0c5876f3696b8b9ed08c89499323568b
3
+ size 4074
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 12.05,
3
+ "train_loss": 0.18408180872599283,
4
+ "train_runtime": 1888.403,
5
+ "train_samples_per_second": 841.24,
6
+ "train_steps_per_second": 26.371
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8737166324435318,
3
+ "best_model_checkpoint": "vc-bantai-vit-withoutAMBI-adunest-v1/checkpoint-1800",
4
+ "epoch": 12.048192771084338,
5
+ "global_step": 3000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.4,
12
+ "eval_accuracy": 0.40811088295687886,
13
+ "eval_loss": 1.2037091255187988,
14
+ "eval_runtime": 11.1902,
15
+ "eval_samples_per_second": 174.08,
16
+ "eval_steps_per_second": 5.451,
17
+ "step": 100
18
+ },
19
+ {
20
+ "epoch": 0.8,
21
+ "eval_accuracy": 0.44096509240246407,
22
+ "eval_loss": 0.9935279488563538,
23
+ "eval_runtime": 11.2125,
24
+ "eval_samples_per_second": 173.734,
25
+ "eval_steps_per_second": 5.44,
26
+ "step": 200
27
+ },
28
+ {
29
+ "epoch": 1.2,
30
+ "eval_accuracy": 0.6914784394250514,
31
+ "eval_loss": 0.6460596323013306,
32
+ "eval_runtime": 11.4894,
33
+ "eval_samples_per_second": 169.547,
34
+ "eval_steps_per_second": 5.309,
35
+ "step": 300
36
+ },
37
+ {
38
+ "epoch": 1.61,
39
+ "eval_accuracy": 0.7705338809034907,
40
+ "eval_loss": 0.49376896023750305,
41
+ "eval_runtime": 11.1511,
42
+ "eval_samples_per_second": 174.691,
43
+ "eval_steps_per_second": 5.47,
44
+ "step": 400
45
+ },
46
+ {
47
+ "epoch": 2.01,
48
+ "learning_rate": 0.0004949799196787149,
49
+ "loss": 0.357,
50
+ "step": 500
51
+ },
52
+ {
53
+ "epoch": 2.01,
54
+ "eval_accuracy": 0.784394250513347,
55
+ "eval_loss": 0.4601840376853943,
56
+ "eval_runtime": 11.4476,
57
+ "eval_samples_per_second": 170.167,
58
+ "eval_steps_per_second": 5.329,
59
+ "step": 500
60
+ },
61
+ {
62
+ "epoch": 2.41,
63
+ "eval_accuracy": 0.7294661190965093,
64
+ "eval_loss": 0.5220066905021667,
65
+ "eval_runtime": 11.1921,
66
+ "eval_samples_per_second": 174.052,
67
+ "eval_steps_per_second": 5.45,
68
+ "step": 600
69
+ },
70
+ {
71
+ "epoch": 2.81,
72
+ "eval_accuracy": 0.7782340862422998,
73
+ "eval_loss": 0.46649423241615295,
74
+ "eval_runtime": 11.2377,
75
+ "eval_samples_per_second": 173.346,
76
+ "eval_steps_per_second": 5.428,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 3.21,
81
+ "eval_accuracy": 0.830082135523614,
82
+ "eval_loss": 0.44400569796562195,
83
+ "eval_runtime": 11.2183,
84
+ "eval_samples_per_second": 173.645,
85
+ "eval_steps_per_second": 5.438,
86
+ "step": 800
87
+ },
88
+ {
89
+ "epoch": 3.61,
90
+ "eval_accuracy": 0.7176591375770021,
91
+ "eval_loss": 0.5121513605117798,
92
+ "eval_runtime": 11.196,
93
+ "eval_samples_per_second": 173.991,
94
+ "eval_steps_per_second": 5.448,
95
+ "step": 900
96
+ },
97
+ {
98
+ "epoch": 4.02,
99
+ "learning_rate": 0.0004899598393574297,
100
+ "loss": 0.2437,
101
+ "step": 1000
102
+ },
103
+ {
104
+ "epoch": 4.02,
105
+ "eval_accuracy": 0.7320328542094456,
106
+ "eval_loss": 0.6155115962028503,
107
+ "eval_runtime": 11.2061,
108
+ "eval_samples_per_second": 173.833,
109
+ "eval_steps_per_second": 5.443,
110
+ "step": 1000
111
+ },
112
+ {
113
+ "epoch": 4.42,
114
+ "eval_accuracy": 0.7684804928131417,
115
+ "eval_loss": 0.5802133679389954,
116
+ "eval_runtime": 11.2176,
117
+ "eval_samples_per_second": 173.655,
118
+ "eval_steps_per_second": 5.438,
119
+ "step": 1100
120
+ },
121
+ {
122
+ "epoch": 4.82,
123
+ "eval_accuracy": 0.8028747433264887,
124
+ "eval_loss": 0.47085943818092346,
125
+ "eval_runtime": 11.2201,
126
+ "eval_samples_per_second": 173.617,
127
+ "eval_steps_per_second": 5.437,
128
+ "step": 1200
129
+ },
130
+ {
131
+ "epoch": 5.22,
132
+ "eval_accuracy": 0.8352156057494866,
133
+ "eval_loss": 0.4694225490093231,
134
+ "eval_runtime": 11.2031,
135
+ "eval_samples_per_second": 173.881,
136
+ "eval_steps_per_second": 5.445,
137
+ "step": 1300
138
+ },
139
+ {
140
+ "epoch": 5.62,
141
+ "eval_accuracy": 0.8203285420944558,
142
+ "eval_loss": 0.46516597270965576,
143
+ "eval_runtime": 11.1655,
144
+ "eval_samples_per_second": 174.467,
145
+ "eval_steps_per_second": 5.463,
146
+ "step": 1400
147
+ },
148
+ {
149
+ "epoch": 6.02,
150
+ "learning_rate": 0.0004849397590361446,
151
+ "loss": 0.1841,
152
+ "step": 1500
153
+ },
154
+ {
155
+ "epoch": 6.02,
156
+ "eval_accuracy": 0.7648870636550308,
157
+ "eval_loss": 0.5424289107322693,
158
+ "eval_runtime": 11.2414,
159
+ "eval_samples_per_second": 173.288,
160
+ "eval_steps_per_second": 5.426,
161
+ "step": 1500
162
+ },
163
+ {
164
+ "epoch": 6.43,
165
+ "eval_accuracy": 0.8059548254620124,
166
+ "eval_loss": 0.46159353852272034,
167
+ "eval_runtime": 11.1678,
168
+ "eval_samples_per_second": 174.43,
169
+ "eval_steps_per_second": 5.462,
170
+ "step": 1600
171
+ },
172
+ {
173
+ "epoch": 6.83,
174
+ "eval_accuracy": 0.8547227926078029,
175
+ "eval_loss": 0.35685229301452637,
176
+ "eval_runtime": 11.2186,
177
+ "eval_samples_per_second": 173.64,
178
+ "eval_steps_per_second": 5.437,
179
+ "step": 1700
180
+ },
181
+ {
182
+ "epoch": 7.23,
183
+ "eval_accuracy": 0.8737166324435318,
184
+ "eval_loss": 0.36519739031791687,
185
+ "eval_runtime": 11.1645,
186
+ "eval_samples_per_second": 174.481,
187
+ "eval_steps_per_second": 5.464,
188
+ "step": 1800
189
+ },
190
+ {
191
+ "epoch": 7.63,
192
+ "eval_accuracy": 0.7438398357289527,
193
+ "eval_loss": 0.7777961492538452,
194
+ "eval_runtime": 11.2328,
195
+ "eval_samples_per_second": 173.421,
196
+ "eval_steps_per_second": 5.431,
197
+ "step": 1900
198
+ },
199
+ {
200
+ "epoch": 8.03,
201
+ "learning_rate": 0.0004799196787148594,
202
+ "loss": 0.1328,
203
+ "step": 2000
204
+ },
205
+ {
206
+ "epoch": 8.03,
207
+ "eval_accuracy": 0.8162217659137577,
208
+ "eval_loss": 0.546014666557312,
209
+ "eval_runtime": 11.2154,
210
+ "eval_samples_per_second": 173.689,
211
+ "eval_steps_per_second": 5.439,
212
+ "step": 2000
213
+ },
214
+ {
215
+ "epoch": 8.43,
216
+ "eval_accuracy": 0.776694045174538,
217
+ "eval_loss": 0.8070306777954102,
218
+ "eval_runtime": 11.1916,
219
+ "eval_samples_per_second": 174.06,
220
+ "eval_steps_per_second": 5.451,
221
+ "step": 2100
222
+ },
223
+ {
224
+ "epoch": 8.84,
225
+ "eval_accuracy": 0.7797741273100616,
226
+ "eval_loss": 0.6872759461402893,
227
+ "eval_runtime": 11.206,
228
+ "eval_samples_per_second": 173.835,
229
+ "eval_steps_per_second": 5.444,
230
+ "step": 2200
231
+ },
232
+ {
233
+ "epoch": 9.24,
234
+ "eval_accuracy": 0.7782340862422998,
235
+ "eval_loss": 0.8942956328392029,
236
+ "eval_runtime": 11.1451,
237
+ "eval_samples_per_second": 174.785,
238
+ "eval_steps_per_second": 5.473,
239
+ "step": 2300
240
+ },
241
+ {
242
+ "epoch": 9.64,
243
+ "eval_accuracy": 0.8552361396303901,
244
+ "eval_loss": 0.5378373265266418,
245
+ "eval_runtime": 11.1452,
246
+ "eval_samples_per_second": 174.784,
247
+ "eval_steps_per_second": 5.473,
248
+ "step": 2400
249
+ },
250
+ {
251
+ "epoch": 10.04,
252
+ "learning_rate": 0.0004748995983935743,
253
+ "loss": 0.1059,
254
+ "step": 2500
255
+ },
256
+ {
257
+ "epoch": 10.04,
258
+ "eval_accuracy": 0.8069815195071869,
259
+ "eval_loss": 0.7080937623977661,
260
+ "eval_runtime": 11.2065,
261
+ "eval_samples_per_second": 173.828,
262
+ "eval_steps_per_second": 5.443,
263
+ "step": 2500
264
+ },
265
+ {
266
+ "epoch": 10.44,
267
+ "eval_accuracy": 0.7012320328542094,
268
+ "eval_loss": 0.994149923324585,
269
+ "eval_runtime": 11.1681,
270
+ "eval_samples_per_second": 174.426,
271
+ "eval_steps_per_second": 5.462,
272
+ "step": 2600
273
+ },
274
+ {
275
+ "epoch": 10.84,
276
+ "eval_accuracy": 0.7900410677618069,
277
+ "eval_loss": 0.9151853919029236,
278
+ "eval_runtime": 11.2106,
279
+ "eval_samples_per_second": 173.764,
280
+ "eval_steps_per_second": 5.441,
281
+ "step": 2700
282
+ },
283
+ {
284
+ "epoch": 11.24,
285
+ "eval_accuracy": 0.7736139630390144,
286
+ "eval_loss": 0.7493842244148254,
287
+ "eval_runtime": 11.1841,
288
+ "eval_samples_per_second": 174.175,
289
+ "eval_steps_per_second": 5.454,
290
+ "step": 2800
291
+ },
292
+ {
293
+ "epoch": 11.65,
294
+ "eval_accuracy": 0.7869609856262834,
295
+ "eval_loss": 0.7680638432502747,
296
+ "eval_runtime": 11.2188,
297
+ "eval_samples_per_second": 173.636,
298
+ "eval_steps_per_second": 5.437,
299
+ "step": 2900
300
+ },
301
+ {
302
+ "epoch": 12.05,
303
+ "learning_rate": 0.0004698795180722892,
304
+ "loss": 0.081,
305
+ "step": 3000
306
+ },
307
+ {
308
+ "epoch": 12.05,
309
+ "eval_accuracy": 0.8039014373716632,
310
+ "eval_loss": 0.7735891342163086,
311
+ "eval_runtime": 11.4086,
312
+ "eval_samples_per_second": 170.748,
313
+ "eval_steps_per_second": 5.347,
314
+ "step": 3000
315
+ },
316
+ {
317
+ "epoch": 12.05,
318
+ "step": 3000,
319
+ "total_flos": 7.416049873230029e+18,
320
+ "train_loss": 0.18408180872599283,
321
+ "train_runtime": 1888.403,
322
+ "train_samples_per_second": 841.24,
323
+ "train_steps_per_second": 26.371
324
+ }
325
+ ],
326
+ "max_steps": 49800,
327
+ "num_train_epochs": 200,
328
+ "total_flos": 7.416049873230029e+18,
329
+ "trial_name": null,
330
+ "trial_params": null
331
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffdc43a3e2d89349e02c90b2d24b4ee079178706583dce50e8db9b8ce898acc1
3
  size 3375
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14fdee491c04a01e9074ffcd862bd86557fe11ab5864ceed82f941032cf4df9a
3
  size 3375