Kasper7953 committed on
Commit
7f41c81
1 Parent(s): c964019

Training in progress, step 19000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845c13e137da03553b05598129da4a8674d9e0b1a7f13d45b2029c4e560c0674
3
  size 2847145157
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18542fb0f0ca8c5209e2b93103f1880c50a53c82c7835aa17cc9be5a52878bde
3
  size 2847145157
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98e64d9e3ec5e4e45f03e6e983897c802b870e1747cae8af2c34bdeb835bbcbe
3
  size 1524261149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a55bd617d7f0551be9aa43e265f8d49f618cdf19eed0897711e26055a6662e99
3
  size 1524261149
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8906e4503e5e52d1eb508d6d922f99d3cb6d5caafa2b7778f4a4873479d6785
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec49eaf93dbcc4a7020eab69f82e4825b6de00732c3380cc93bef441b24d358
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2364d0eed038a9d0d4a87a052e7a1739b5247b2fbf2962d4f2b4b62f09c6e9d9
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ebdd7eec22dd0eaa942c09b9d66a5b538c98524805051b53c9cae7c97f8241a
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.698246140008994,
5
- "global_step": 18000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -422,11 +422,39 @@
422
  "learning_rate": 3.6508769299955035e-05,
423
  "loss": 2.1897,
424
  "step": 18000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
425
  }
426
  ],
427
  "max_steps": 66710,
428
  "num_train_epochs": 10,
429
- "total_flos": 2.4486318409728e+16,
430
  "trial_name": null,
431
  "trial_params": null
432
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.848148703342827,
5
+ "global_step": 19000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
422
  "learning_rate": 3.6508769299955035e-05,
423
  "loss": 2.1897,
424
  "step": 18000
425
+ },
426
+ {
427
+ "epoch": 2.73,
428
+ "eval_loss": 2.646106719970703,
429
+ "eval_runtime": 209.741,
430
+ "eval_samples_per_second": 16.84,
431
+ "eval_steps_per_second": 5.616,
432
+ "step": 18200
433
+ },
434
+ {
435
+ "epoch": 2.77,
436
+ "learning_rate": 3.613401289162045e-05,
437
+ "loss": 2.181,
438
+ "step": 18500
439
+ },
440
+ {
441
+ "epoch": 2.83,
442
+ "eval_loss": 2.6370952129364014,
443
+ "eval_runtime": 210.1426,
444
+ "eval_samples_per_second": 16.808,
445
+ "eval_steps_per_second": 5.606,
446
+ "step": 18900
447
+ },
448
+ {
449
+ "epoch": 2.85,
450
+ "learning_rate": 3.5759256483285864e-05,
451
+ "loss": 2.2077,
452
+ "step": 19000
453
  }
454
  ],
455
  "max_steps": 66710,
456
  "num_train_epochs": 10,
457
+ "total_flos": 2.5846719817728e+16,
458
  "trial_name": null,
459
  "trial_params": null
460
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98e64d9e3ec5e4e45f03e6e983897c802b870e1747cae8af2c34bdeb835bbcbe
3
  size 1524261149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a55bd617d7f0551be9aa43e265f8d49f618cdf19eed0897711e26055a6662e99
3
  size 1524261149
runs/Mar11_11-28-52_b25631785753/events.out.tfevents.1678534153.b25631785753.957.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54e79f5a2b923c081ea13c8772ce423bd840d2defafdbe1fa34fff717394491c
3
- size 7092
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2c6ce822c57a865d868ca2b1ccf414559c129b6fe06a79313875782f814b876
3
+ size 7964