Nekofox commited on
Commit
1a74eb7
1 Parent(s): 10cf62f

Training in progress, step 56000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d732736de6501f4899754db0c10e4570a7fe2fa3ac8b9511bcea1224fb0cd3f5
3
  size 3871543575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f60349f7766510102278629c2843f7b172c8d269ab71299853bf7d28b34c7f3c
3
  size 3871543575
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a305ef9c307c5169cce5f064424696b26f73c6db38d14bf539dd6e0d005ea169
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8496b300c153eda223d64ce6ae8d9b85a0b85fbf04784c5f7f9870564dd2d0
3
  size 1944201353
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e66928c63fad4b4599d1ab60d609e927e7ea8e3552c715ad8baff6ed9f3f4bbb
3
- size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f322551d5dbc26a22a31f8ddc9da458bedc2e38dc7d116217d0c411ed1e9ed7
3
+ size 14511
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:042c44b032d6bdd4466f03a28e4b55638760717a01ada6222dbb596f3a3bfc8d
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5ecbe8e8e0cd94fc7935cc448aa50e35fab0ed1e11419e7e3c7f29c567044d
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f383fd584c5ee76e07a987b34c6a36868eb4f11d22aa3c2299d21c5081aef278
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a050ce0f4a32bb580c5f82cff9cdb29e8cb3d0f09c683f3a23deca0c0b8df1
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5511919525974921,
5
- "global_step": 52000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -630,11 +630,59 @@
630
  "learning_rate": 4.962640872518639e-06,
631
  "loss": 1.7226,
632
  "step": 52000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
633
  }
634
  ],
635
  "max_steps": 943410,
636
  "num_train_epochs": 10,
637
- "total_flos": 2.9278349279870976e+16,
638
  "trial_name": null,
639
  "trial_params": null
640
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.5935913335665299,
5
+ "global_step": 56000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
630
  "learning_rate": 4.962640872518639e-06,
631
  "loss": 1.7226,
632
  "step": 52000
633
+ },
634
+ {
635
+ "epoch": 0.56,
636
+ "learning_rate": 4.961920533507775e-06,
637
+ "loss": 1.7142,
638
+ "step": 52500
639
+ },
640
+ {
641
+ "epoch": 0.56,
642
+ "learning_rate": 4.961193369338535e-06,
643
+ "loss": 1.7193,
644
+ "step": 53000
645
+ },
646
+ {
647
+ "epoch": 0.57,
648
+ "learning_rate": 4.960460856809599e-06,
649
+ "loss": 1.7472,
650
+ "step": 53500
651
+ },
652
+ {
653
+ "epoch": 0.57,
654
+ "learning_rate": 4.9597200620304265e-06,
655
+ "loss": 1.7407,
656
+ "step": 54000
657
+ },
658
+ {
659
+ "epoch": 0.58,
660
+ "learning_rate": 4.958972448193223e-06,
661
+ "loss": 1.741,
662
+ "step": 54500
663
+ },
664
+ {
665
+ "epoch": 0.58,
666
+ "learning_rate": 4.958218017370592e-06,
667
+ "loss": 1.7572,
668
+ "step": 55000
669
+ },
670
+ {
671
+ "epoch": 0.59,
672
+ "learning_rate": 4.957458300945332e-06,
673
+ "loss": 1.7177,
674
+ "step": 55500
675
+ },
676
+ {
677
+ "epoch": 0.59,
678
+ "learning_rate": 4.9566902560686915e-06,
679
+ "loss": 1.7255,
680
+ "step": 56000
681
  }
682
  ],
683
  "max_steps": 943410,
684
  "num_train_epochs": 10,
685
+ "total_flos": 3.15281974910976e+16,
686
  "trial_name": null,
687
  "trial_params": null
688
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a305ef9c307c5169cce5f064424696b26f73c6db38d14bf539dd6e0d005ea169
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8496b300c153eda223d64ce6ae8d9b85a0b85fbf04784c5f7f9870564dd2d0
3
  size 1944201353
runs/May14_15-54-58_fce7ca761ee9/events.out.tfevents.1684081292.fce7ca761ee9.347.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6022b19808a5b1c1becd15f0e3a653d2b7f29f01c522b6e28688114bff28c7f1
3
- size 9583
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6da5c4ee3bf608db87622a1727ed032f59decd9ff80a8d0ed29d509a99c4a91
3
+ size 10863