polejowska committed on
Commit
852b688
1 Parent(s): c9f2d67

End of training

Browse files
runs/Feb26_19-45-51_952abec28ae3/events.out.tfevents.1677440757.952abec28ae3.204.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:772d1a2b6349d174f4f593ba723419561901737442b8cbdfd1a112308e0cb08f
3
- size 6618
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbbf275ad546f0ef5560e410b86461273d6b7e360bd5a8a783e1b2fe5429877c
3
+ size 6972
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 20.0,
5
- "global_step": 1880,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -288,18 +288,88 @@
288
  "step": 1880
289
  },
290
  {
291
- "epoch": 20.0,
292
- "step": 1880,
293
- "total_flos": 7.1683864704e+18,
294
- "train_loss": 0.5733721875129862,
295
- "train_runtime": 1226.2208,
296
- "train_samples_per_second": 12.233,
297
- "train_steps_per_second": 1.533
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
298
  }
299
  ],
300
- "max_steps": 1880,
301
- "num_train_epochs": 20,
302
- "total_flos": 7.1683864704e+18,
303
  "trial_name": null,
304
  "trial_params": null
305
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 25.0,
5
+ "global_step": 2350,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
288
  "step": 1880
289
  },
290
  {
291
+ "epoch": 21.0,
292
+ "learning_rate": 1.6000000000000003e-05,
293
+ "loss": 2.3083,
294
+ "step": 1974
295
+ },
296
+ {
297
+ "epoch": 21.0,
298
+ "eval_loss": 1.7549386024475098,
299
+ "eval_runtime": 37.0581,
300
+ "eval_samples_per_second": 5.397,
301
+ "eval_steps_per_second": 0.675,
302
+ "step": 1974
303
+ },
304
+ {
305
+ "epoch": 22.0,
306
+ "learning_rate": 1.2e-05,
307
+ "loss": 2.2542,
308
+ "step": 2068
309
+ },
310
+ {
311
+ "epoch": 22.0,
312
+ "eval_loss": 1.7174808979034424,
313
+ "eval_runtime": 36.8163,
314
+ "eval_samples_per_second": 5.432,
315
+ "eval_steps_per_second": 0.679,
316
+ "step": 2068
317
+ },
318
+ {
319
+ "epoch": 23.0,
320
+ "learning_rate": 8.000000000000001e-06,
321
+ "loss": 2.2262,
322
+ "step": 2162
323
+ },
324
+ {
325
+ "epoch": 23.0,
326
+ "eval_loss": 1.699831485748291,
327
+ "eval_runtime": 36.7706,
328
+ "eval_samples_per_second": 5.439,
329
+ "eval_steps_per_second": 0.68,
330
+ "step": 2162
331
+ },
332
+ {
333
+ "epoch": 24.0,
334
+ "learning_rate": 4.000000000000001e-06,
335
+ "loss": 2.2644,
336
+ "step": 2256
337
+ },
338
+ {
339
+ "epoch": 24.0,
340
+ "eval_loss": 1.7019526958465576,
341
+ "eval_runtime": 37.036,
342
+ "eval_samples_per_second": 5.4,
343
+ "eval_steps_per_second": 0.675,
344
+ "step": 2256
345
+ },
346
+ {
347
+ "epoch": 25.0,
348
+ "learning_rate": 0.0,
349
+ "loss": 2.2392,
350
+ "step": 2350
351
+ },
352
+ {
353
+ "epoch": 25.0,
354
+ "eval_loss": 1.6933141946792603,
355
+ "eval_runtime": 36.9874,
356
+ "eval_samples_per_second": 5.407,
357
+ "eval_steps_per_second": 0.676,
358
+ "step": 2350
359
+ },
360
+ {
361
+ "epoch": 25.0,
362
+ "step": 2350,
363
+ "total_flos": 8.960483088e+18,
364
+ "train_loss": 0.45169270616896606,
365
+ "train_runtime": 1228.9697,
366
+ "train_samples_per_second": 15.257,
367
+ "train_steps_per_second": 1.912
368
  }
369
  ],
370
+ "max_steps": 2350,
371
+ "num_train_epochs": 25,
372
+ "total_flos": 8.960483088e+18,
373
  "trial_name": null,
374
  "trial_params": null
375
  }