File size: 9,396 Bytes
fc23c86
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
{
  "best_metric": 0.29332470893859863,
  "best_model_checkpoint": "medicinal_plants_image_detection/checkpoint-6690",
  "epoch": 30.0,
  "eval_steps": 500,
  "global_step": 6690,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_accuracy": 0.4994388327721661,
      "eval_loss": 3.614454984664917,
      "eval_runtime": 48.2613,
      "eval_samples_per_second": 36.924,
      "eval_steps_per_second": 4.621,
      "step": 223
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.7918069584736251,
      "eval_loss": 3.1569712162017822,
      "eval_runtime": 49.1349,
      "eval_samples_per_second": 36.267,
      "eval_steps_per_second": 4.539,
      "step": 446
    },
    {
      "epoch": 2.24,
      "learning_rate": 9.322289156626508e-06,
      "loss": 3.5047,
      "step": 500
    },
    {
      "epoch": 3.0,
      "eval_accuracy": 0.8597081930415263,
      "eval_loss": 2.7521684169769287,
      "eval_runtime": 50.645,
      "eval_samples_per_second": 35.186,
      "eval_steps_per_second": 4.403,
      "step": 669
    },
    {
      "epoch": 4.0,
      "eval_accuracy": 0.8978675645342312,
      "eval_loss": 2.4042551517486572,
      "eval_runtime": 51.9856,
      "eval_samples_per_second": 34.279,
      "eval_steps_per_second": 4.29,
      "step": 892
    },
    {
      "epoch": 4.48,
      "learning_rate": 8.569277108433736e-06,
      "loss": 2.5032,
      "step": 1000
    },
    {
      "epoch": 5.0,
      "eval_accuracy": 0.9231200897867564,
      "eval_loss": 2.115753412246704,
      "eval_runtime": 48.1602,
      "eval_samples_per_second": 37.002,
      "eval_steps_per_second": 4.63,
      "step": 1115
    },
    {
      "epoch": 6.0,
      "eval_accuracy": 0.9444444444444444,
      "eval_loss": 1.8598074913024902,
      "eval_runtime": 48.8256,
      "eval_samples_per_second": 36.497,
      "eval_steps_per_second": 4.567,
      "step": 1338
    },
    {
      "epoch": 6.73,
      "learning_rate": 7.816265060240964e-06,
      "loss": 1.8072,
      "step": 1500
    },
    {
      "epoch": 7.0,
      "eval_accuracy": 0.957351290684624,
      "eval_loss": 1.6446038484573364,
      "eval_runtime": 48.2656,
      "eval_samples_per_second": 36.921,
      "eval_steps_per_second": 4.62,
      "step": 1561
    },
    {
      "epoch": 8.0,
      "eval_accuracy": 0.9618406285072951,
      "eval_loss": 1.461050033569336,
      "eval_runtime": 48.1324,
      "eval_samples_per_second": 37.023,
      "eval_steps_per_second": 4.633,
      "step": 1784
    },
    {
      "epoch": 8.97,
      "learning_rate": 7.063253012048194e-06,
      "loss": 1.3122,
      "step": 2000
    },
    {
      "epoch": 9.0,
      "eval_accuracy": 0.9685746352413019,
      "eval_loss": 1.287758469581604,
      "eval_runtime": 48.8178,
      "eval_samples_per_second": 36.503,
      "eval_steps_per_second": 4.568,
      "step": 2007
    },
    {
      "epoch": 10.0,
      "eval_accuracy": 0.9719416386083053,
      "eval_loss": 1.1408909559249878,
      "eval_runtime": 49.7454,
      "eval_samples_per_second": 35.822,
      "eval_steps_per_second": 4.483,
      "step": 2230
    },
    {
      "epoch": 11.0,
      "eval_accuracy": 0.9758698092031426,
      "eval_loss": 1.0084798336029053,
      "eval_runtime": 48.8764,
      "eval_samples_per_second": 36.459,
      "eval_steps_per_second": 4.563,
      "step": 2453
    },
    {
      "epoch": 11.21,
      "learning_rate": 6.310240963855422e-06,
      "loss": 0.9553,
      "step": 2500
    },
    {
      "epoch": 12.0,
      "eval_accuracy": 0.9803591470258137,
      "eval_loss": 0.8966515064239502,
      "eval_runtime": 47.3671,
      "eval_samples_per_second": 37.621,
      "eval_steps_per_second": 4.708,
      "step": 2676
    },
    {
      "epoch": 13.0,
      "eval_accuracy": 0.9826038159371493,
      "eval_loss": 0.7965953350067139,
      "eval_runtime": 47.0538,
      "eval_samples_per_second": 37.872,
      "eval_steps_per_second": 4.739,
      "step": 2899
    },
    {
      "epoch": 13.45,
      "learning_rate": 5.5572289156626515e-06,
      "loss": 0.7044,
      "step": 3000
    },
    {
      "epoch": 14.0,
      "eval_accuracy": 0.9842873176206509,
      "eval_loss": 0.7103424668312073,
      "eval_runtime": 46.1432,
      "eval_samples_per_second": 38.619,
      "eval_steps_per_second": 4.833,
      "step": 3122
    },
    {
      "epoch": 15.0,
      "eval_accuracy": 0.9859708193041526,
      "eval_loss": 0.6361219882965088,
      "eval_runtime": 46.1364,
      "eval_samples_per_second": 38.625,
      "eval_steps_per_second": 4.833,
      "step": 3345
    },
    {
      "epoch": 15.7,
      "learning_rate": 4.80421686746988e-06,
      "loss": 0.5256,
      "step": 3500
    },
    {
      "epoch": 16.0,
      "eval_accuracy": 0.9854096520763187,
      "eval_loss": 0.5733931064605713,
      "eval_runtime": 46.2916,
      "eval_samples_per_second": 38.495,
      "eval_steps_per_second": 4.817,
      "step": 3568
    },
    {
      "epoch": 17.0,
      "eval_accuracy": 0.9859708193041526,
      "eval_loss": 0.5201807022094727,
      "eval_runtime": 46.3808,
      "eval_samples_per_second": 38.421,
      "eval_steps_per_second": 4.808,
      "step": 3791
    },
    {
      "epoch": 17.94,
      "learning_rate": 4.051204819277109e-06,
      "loss": 0.4008,
      "step": 4000
    },
    {
      "epoch": 18.0,
      "eval_accuracy": 0.9870931537598204,
      "eval_loss": 0.47677987813949585,
      "eval_runtime": 46.3137,
      "eval_samples_per_second": 38.477,
      "eval_steps_per_second": 4.815,
      "step": 4014
    },
    {
      "epoch": 19.0,
      "eval_accuracy": 0.9870931537598204,
      "eval_loss": 0.4372333884239197,
      "eval_runtime": 46.0508,
      "eval_samples_per_second": 38.696,
      "eval_steps_per_second": 4.842,
      "step": 4237
    },
    {
      "epoch": 20.0,
      "eval_accuracy": 0.9865319865319865,
      "eval_loss": 0.40752825140953064,
      "eval_runtime": 46.1411,
      "eval_samples_per_second": 38.621,
      "eval_steps_per_second": 4.833,
      "step": 4460
    },
    {
      "epoch": 20.18,
      "learning_rate": 3.2981927710843376e-06,
      "loss": 0.3219,
      "step": 4500
    },
    {
      "epoch": 21.0,
      "eval_accuracy": 0.9859708193041526,
      "eval_loss": 0.38523805141448975,
      "eval_runtime": 46.0733,
      "eval_samples_per_second": 38.678,
      "eval_steps_per_second": 4.84,
      "step": 4683
    },
    {
      "epoch": 22.0,
      "eval_accuracy": 0.9865319865319865,
      "eval_loss": 0.3623017370700836,
      "eval_runtime": 45.8883,
      "eval_samples_per_second": 38.833,
      "eval_steps_per_second": 4.86,
      "step": 4906
    },
    {
      "epoch": 22.42,
      "learning_rate": 2.5451807228915665e-06,
      "loss": 0.2714,
      "step": 5000
    },
    {
      "epoch": 23.0,
      "eval_accuracy": 0.9859708193041526,
      "eval_loss": 0.3463130593299866,
      "eval_runtime": 46.8136,
      "eval_samples_per_second": 38.066,
      "eval_steps_per_second": 4.764,
      "step": 5129
    },
    {
      "epoch": 24.0,
      "eval_accuracy": 0.9859708193041526,
      "eval_loss": 0.33292245864868164,
      "eval_runtime": 49.1048,
      "eval_samples_per_second": 36.29,
      "eval_steps_per_second": 4.541,
      "step": 5352
    },
    {
      "epoch": 24.66,
      "learning_rate": 1.7921686746987955e-06,
      "loss": 0.2378,
      "step": 5500
    },
    {
      "epoch": 25.0,
      "eval_accuracy": 0.9865319865319865,
      "eval_loss": 0.31982797384262085,
      "eval_runtime": 46.2965,
      "eval_samples_per_second": 38.491,
      "eval_steps_per_second": 4.817,
      "step": 5575
    },
    {
      "epoch": 26.0,
      "eval_accuracy": 0.9870931537598204,
      "eval_loss": 0.31251493096351624,
      "eval_runtime": 45.905,
      "eval_samples_per_second": 38.819,
      "eval_steps_per_second": 4.858,
      "step": 5798
    },
    {
      "epoch": 26.91,
      "learning_rate": 1.0391566265060242e-06,
      "loss": 0.2165,
      "step": 6000
    },
    {
      "epoch": 27.0,
      "eval_accuracy": 0.9870931537598204,
      "eval_loss": 0.3037458658218384,
      "eval_runtime": 47.4495,
      "eval_samples_per_second": 37.556,
      "eval_steps_per_second": 4.7,
      "step": 6021
    },
    {
      "epoch": 28.0,
      "eval_accuracy": 0.9876543209876543,
      "eval_loss": 0.29743924736976624,
      "eval_runtime": 47.6086,
      "eval_samples_per_second": 37.43,
      "eval_steps_per_second": 4.684,
      "step": 6244
    },
    {
      "epoch": 29.0,
      "eval_accuracy": 0.9876543209876543,
      "eval_loss": 0.2938971519470215,
      "eval_runtime": 47.4632,
      "eval_samples_per_second": 37.545,
      "eval_steps_per_second": 4.698,
      "step": 6467
    },
    {
      "epoch": 29.15,
      "learning_rate": 2.8614457831325304e-07,
      "loss": 0.2047,
      "step": 6500
    },
    {
      "epoch": 30.0,
      "eval_accuracy": 0.9876543209876543,
      "eval_loss": 0.29332470893859863,
      "eval_runtime": 46.6765,
      "eval_samples_per_second": 38.178,
      "eval_steps_per_second": 4.778,
      "step": 6690
    }
  ],
  "logging_steps": 500,
  "max_steps": 6690,
  "num_train_epochs": 30,
  "save_steps": 500,
  "total_flos": 1.6569009834178314e+19,
  "trial_name": null,
  "trial_params": null
}