polejowska committed on
Commit
d4be0bc
1 Parent(s): cd66a5f

End of training

Browse files
Files changed (1) hide show
  1. trainer_state.json +90 -20
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.5988867282867432,
3
- "best_model_checkpoint": "detr-r50-cd45rb-8ah-6l-gelu-corrected\\checkpoint-87514",
4
- "epoch": 20.0,
5
- "global_step": 92120,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -275,31 +275,101 @@
275
  },
276
  {
277
  "epoch": 20.0,
278
- "learning_rate": 4.559270516717325e-09,
279
- "loss": 2.0084,
280
  "step": 92120
281
  },
282
  {
283
  "epoch": 20.0,
284
- "eval_loss": 1.599236011505127,
285
- "eval_runtime": 202.2872,
286
- "eval_samples_per_second": 8.804,
287
- "eval_steps_per_second": 1.102,
288
  "step": 92120
289
  },
290
  {
291
- "epoch": 20.0,
292
- "step": 92120,
293
- "total_flos": 1.7606512956165125e+20,
294
- "train_loss": 1.0303937374484369,
295
- "train_runtime": 29465.5365,
296
- "train_samples_per_second": 12.503,
297
- "train_steps_per_second": 3.126
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
298
  }
299
  ],
300
- "max_steps": 92120,
301
- "num_train_epochs": 20,
302
- "total_flos": 1.7606512956165125e+20,
303
  "trial_name": null,
304
  "trial_params": null
305
  }
 
1
  {
2
+ "best_metric": 1.5861479043960571,
3
+ "best_model_checkpoint": "detr-r50-cd45rb-8ah-6l-gelu-corrected\\checkpoint-115150",
4
+ "epoch": 25.0,
5
+ "global_step": 115150,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
275
  },
276
  {
277
  "epoch": 20.0,
278
+ "learning_rate": 2.0037342596613115e-06,
279
+ "loss": 2.0206,
280
  "step": 92120
281
  },
282
  {
283
  "epoch": 20.0,
284
+ "eval_loss": 1.6168476343154907,
285
+ "eval_runtime": 207.1893,
286
+ "eval_samples_per_second": 8.596,
287
+ "eval_steps_per_second": 1.076,
288
  "step": 92120
289
  },
290
  {
291
+ "epoch": 21.0,
292
+ "learning_rate": 1.6039947894051239e-06,
293
+ "loss": 2.026,
294
+ "step": 96726
295
+ },
296
+ {
297
+ "epoch": 21.0,
298
+ "eval_loss": 1.6022319793701172,
299
+ "eval_runtime": 206.9802,
300
+ "eval_samples_per_second": 8.605,
301
+ "eval_steps_per_second": 1.077,
302
+ "step": 96726
303
+ },
304
+ {
305
+ "epoch": 22.0,
306
+ "learning_rate": 1.2041684759009988e-06,
307
+ "loss": 2.0109,
308
+ "step": 101332
309
+ },
310
+ {
311
+ "epoch": 22.0,
312
+ "eval_loss": 1.5995537042617798,
313
+ "eval_runtime": 206.8836,
314
+ "eval_samples_per_second": 8.609,
315
+ "eval_steps_per_second": 1.078,
316
+ "step": 101332
317
+ },
318
+ {
319
+ "epoch": 23.0,
320
+ "learning_rate": 8.042553191489362e-07,
321
+ "loss": 2.0133,
322
+ "step": 105938
323
+ },
324
+ {
325
+ "epoch": 23.0,
326
+ "eval_loss": 1.5983381271362305,
327
+ "eval_runtime": 206.4758,
328
+ "eval_samples_per_second": 8.626,
329
+ "eval_steps_per_second": 1.08,
330
+ "step": 105938
331
+ },
332
+ {
333
+ "epoch": 24.0,
334
+ "learning_rate": 4.043421623968737e-07,
335
+ "loss": 2.0081,
336
+ "step": 110544
337
+ },
338
+ {
339
+ "epoch": 24.0,
340
+ "eval_loss": 1.5887646675109863,
341
+ "eval_runtime": 203.9191,
342
+ "eval_samples_per_second": 8.734,
343
+ "eval_steps_per_second": 1.094,
344
+ "step": 110544
345
+ },
346
+ {
347
+ "epoch": 25.0,
348
+ "learning_rate": 4.515848892748589e-09,
349
+ "loss": 1.9975,
350
+ "step": 115150
351
+ },
352
+ {
353
+ "epoch": 25.0,
354
+ "eval_loss": 1.5861479043960571,
355
+ "eval_runtime": 204.8681,
356
+ "eval_samples_per_second": 8.693,
357
+ "eval_steps_per_second": 1.089,
358
+ "step": 115150
359
+ },
360
+ {
361
+ "epoch": 25.0,
362
+ "step": 115150,
363
+ "total_flos": 2.2008141195206407e+20,
364
+ "train_loss": 0.4830571452317629,
365
+ "train_runtime": 17891.958,
366
+ "train_samples_per_second": 25.739,
367
+ "train_steps_per_second": 6.436
368
  }
369
  ],
370
+ "max_steps": 115150,
371
+ "num_train_epochs": 25,
372
+ "total_flos": 2.2008141195206407e+20,
373
  "trial_name": null,
374
  "trial_params": null
375
  }