File size: 8,727 Bytes
fa979c4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
{
  "best_metric": 0.024307304993271828,
  "best_model_checkpoint": "./dinov2_LoRA_Liveness_detection_v1.1/checkpoint-448",
  "epoch": 3.0,
  "eval_steps": 64,
  "global_step": 471,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.10191082802547771,
      "grad_norm": 3.3717641830444336,
      "learning_rate": 4.840764331210191e-05,
      "loss": 0.3564,
      "step": 16
    },
    {
      "epoch": 0.20382165605095542,
      "grad_norm": 1.4053750038146973,
      "learning_rate": 4.6709129511677285e-05,
      "loss": 0.1026,
      "step": 32
    },
    {
      "epoch": 0.3057324840764331,
      "grad_norm": 1.2090115547180176,
      "learning_rate": 4.501061571125266e-05,
      "loss": 0.0606,
      "step": 48
    },
    {
      "epoch": 0.40764331210191085,
      "grad_norm": 2.0192923545837402,
      "learning_rate": 4.331210191082803e-05,
      "loss": 0.0501,
      "step": 64
    },
    {
      "epoch": 0.40764331210191085,
      "eval_accuracy": 0.9841349785948124,
      "eval_f1": 0.9841073630518083,
      "eval_loss": 0.04576801881194115,
      "eval_precision": 0.9842311607904581,
      "eval_recall": 0.9841349785948124,
      "eval_runtime": 317.7291,
      "eval_samples_per_second": 62.947,
      "eval_steps_per_second": 7.868,
      "step": 64
    },
    {
      "epoch": 0.5095541401273885,
      "grad_norm": 1.1693896055221558,
      "learning_rate": 4.1613588110403404e-05,
      "loss": 0.0437,
      "step": 80
    },
    {
      "epoch": 0.6114649681528662,
      "grad_norm": 1.2890028953552246,
      "learning_rate": 3.991507430997877e-05,
      "loss": 0.0472,
      "step": 96
    },
    {
      "epoch": 0.7133757961783439,
      "grad_norm": 1.012406826019287,
      "learning_rate": 3.821656050955414e-05,
      "loss": 0.0388,
      "step": 112
    },
    {
      "epoch": 0.8152866242038217,
      "grad_norm": 1.3089163303375244,
      "learning_rate": 3.651804670912951e-05,
      "loss": 0.0355,
      "step": 128
    },
    {
      "epoch": 0.8152866242038217,
      "eval_accuracy": 0.9879627297909847,
      "eval_f1": 0.9879658772630169,
      "eval_loss": 0.034234367311000824,
      "eval_precision": 0.9879573976357167,
      "eval_recall": 0.9879627297909847,
      "eval_runtime": 309.1521,
      "eval_samples_per_second": 64.693,
      "eval_steps_per_second": 8.087,
      "step": 128
    },
    {
      "epoch": 0.9171974522292994,
      "grad_norm": 1.0827258825302124,
      "learning_rate": 3.481953290870488e-05,
      "loss": 0.0327,
      "step": 144
    },
    {
      "epoch": 1.019108280254777,
      "grad_norm": 1.2000535726547241,
      "learning_rate": 3.3121019108280256e-05,
      "loss": 0.035,
      "step": 160
    },
    {
      "epoch": 1.1210191082802548,
      "grad_norm": 2.487323045730591,
      "learning_rate": 3.142250530785563e-05,
      "loss": 0.0275,
      "step": 176
    },
    {
      "epoch": 1.2229299363057324,
      "grad_norm": 2.1451828479766846,
      "learning_rate": 2.9723991507431e-05,
      "loss": 0.0253,
      "step": 192
    },
    {
      "epoch": 1.2229299363057324,
      "eval_accuracy": 0.990078065978343,
      "eval_f1": 0.9900620320034099,
      "eval_loss": 0.030784847214818,
      "eval_precision": 0.9901457841504492,
      "eval_recall": 0.990078065978343,
      "eval_runtime": 313.1272,
      "eval_samples_per_second": 63.872,
      "eval_steps_per_second": 7.984,
      "step": 192
    },
    {
      "epoch": 1.3248407643312101,
      "grad_norm": 1.699660062789917,
      "learning_rate": 2.802547770700637e-05,
      "loss": 0.0241,
      "step": 208
    },
    {
      "epoch": 1.426751592356688,
      "grad_norm": 1.5516241788864136,
      "learning_rate": 2.632696390658174e-05,
      "loss": 0.0186,
      "step": 224
    },
    {
      "epoch": 1.5286624203821657,
      "grad_norm": 1.0598669052124023,
      "learning_rate": 2.4628450106157114e-05,
      "loss": 0.0198,
      "step": 240
    },
    {
      "epoch": 1.6305732484076434,
      "grad_norm": 1.8472939729690552,
      "learning_rate": 2.2929936305732484e-05,
      "loss": 0.0226,
      "step": 256
    },
    {
      "epoch": 1.6305732484076434,
      "eval_accuracy": 0.990984638630068,
      "eval_f1": 0.9909855466235222,
      "eval_loss": 0.026686813682317734,
      "eval_precision": 0.9909829656263511,
      "eval_recall": 0.990984638630068,
      "eval_runtime": 311.8552,
      "eval_samples_per_second": 64.132,
      "eval_steps_per_second": 8.017,
      "step": 256
    },
    {
      "epoch": 1.732484076433121,
      "grad_norm": 1.6193630695343018,
      "learning_rate": 2.1231422505307857e-05,
      "loss": 0.021,
      "step": 272
    },
    {
      "epoch": 1.8343949044585988,
      "grad_norm": 1.1963945627212524,
      "learning_rate": 1.953290870488323e-05,
      "loss": 0.0196,
      "step": 288
    },
    {
      "epoch": 1.9363057324840764,
      "grad_norm": 1.3636715412139893,
      "learning_rate": 1.78343949044586e-05,
      "loss": 0.0231,
      "step": 304
    },
    {
      "epoch": 2.038216560509554,
      "grad_norm": 1.2037672996520996,
      "learning_rate": 1.613588110403397e-05,
      "loss": 0.0264,
      "step": 320
    },
    {
      "epoch": 2.038216560509554,
      "eval_accuracy": 0.9911860992193402,
      "eval_f1": 0.9911791189750626,
      "eval_loss": 0.02550842985510826,
      "eval_precision": 0.9912087608299792,
      "eval_recall": 0.9911860992193402,
      "eval_runtime": 310.9636,
      "eval_samples_per_second": 64.316,
      "eval_steps_per_second": 8.04,
      "step": 320
    },
    {
      "epoch": 2.140127388535032,
      "grad_norm": 1.120186448097229,
      "learning_rate": 1.4437367303609342e-05,
      "loss": 0.0143,
      "step": 336
    },
    {
      "epoch": 2.2420382165605095,
      "grad_norm": 1.6843891143798828,
      "learning_rate": 1.2738853503184714e-05,
      "loss": 0.0148,
      "step": 352
    },
    {
      "epoch": 2.343949044585987,
      "grad_norm": 1.4458714723587036,
      "learning_rate": 1.1040339702760085e-05,
      "loss": 0.0179,
      "step": 368
    },
    {
      "epoch": 2.445859872611465,
      "grad_norm": 1.239098310470581,
      "learning_rate": 9.341825902335457e-06,
      "loss": 0.0168,
      "step": 384
    },
    {
      "epoch": 2.445859872611465,
      "eval_accuracy": 0.9921934021657013,
      "eval_f1": 0.9921865805615873,
      "eval_loss": 0.02449687570333481,
      "eval_precision": 0.992217636683327,
      "eval_recall": 0.9921934021657013,
      "eval_runtime": 309.071,
      "eval_samples_per_second": 64.71,
      "eval_steps_per_second": 8.089,
      "step": 384
    },
    {
      "epoch": 2.5477707006369426,
      "grad_norm": 1.4529588222503662,
      "learning_rate": 7.643312101910828e-06,
      "loss": 0.0152,
      "step": 400
    },
    {
      "epoch": 2.6496815286624202,
      "grad_norm": 1.1592313051223755,
      "learning_rate": 5.9447983014862e-06,
      "loss": 0.0127,
      "step": 416
    },
    {
      "epoch": 2.7515923566878984,
      "grad_norm": 1.4602242708206177,
      "learning_rate": 4.246284501061571e-06,
      "loss": 0.0166,
      "step": 432
    },
    {
      "epoch": 2.853503184713376,
      "grad_norm": 1.3949599266052246,
      "learning_rate": 2.547770700636943e-06,
      "loss": 0.0144,
      "step": 448
    },
    {
      "epoch": 2.853503184713376,
      "eval_accuracy": 0.9917401158398388,
      "eval_f1": 0.9917381130215306,
      "eval_loss": 0.024307304993271828,
      "eval_precision": 0.9917449458573591,
      "eval_recall": 0.9917401158398388,
      "eval_runtime": 304.7867,
      "eval_samples_per_second": 65.62,
      "eval_steps_per_second": 8.202,
      "step": 448
    },
    {
      "epoch": 2.9554140127388537,
      "grad_norm": 0.5842750668525696,
      "learning_rate": 8.492569002123142e-07,
      "loss": 0.0177,
      "step": 464
    },
    {
      "epoch": 3.0,
      "step": 471,
      "total_flos": 4.878503731310727e+18,
      "train_loss": 0.040008016563398315,
      "train_runtime": 8568.9568,
      "train_samples_per_second": 28.008,
      "train_steps_per_second": 0.055
    }
  ],
  "logging_steps": 16,
  "max_steps": 471,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 3,
  "save_steps": 64,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 4.878503731310727e+18,
  "train_batch_size": 512,
  "trial_name": null,
  "trial_params": null
}