Nekofox commited on
Commit
4097eae
1 Parent(s): 9f788ed

Training in progress, step 64000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4308792b2a033acdce96ce47703119686ade603de91305623f9a41bb3db8197d
3
  size 3871543575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fe8795e671335d7bddeedb39821f0948379d742e636bab99e4d84da9158869a
3
  size 3871543575
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24918df0f1f9d1f5aadf7b8e4933628be882e87804ac0114cbca0ad2c83737f7
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c80a0783dcb4761d467c9fccd3ad9305d694cfd8a74940361136dfaf12ce4dfa
3
  size 1944201353
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:836afdbaf7ed0232c311bb2609eff325953c229bbc4edb90bdadf6a7412ce2aa
3
  size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e989135ee750e533a2b907997960a8cf01e270032e6a00adbd8dce6e9b4179f2
3
  size 14511
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df056184eca867a0b00a4f1fa76891f3c4f5cedd6a7d840fcd41506dafeb0b63
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8474830dbb0ee2555c7fca1ddb59c3a8703100405178d69f471e9f9597100d49
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ae4577bcc43ac54c56a413372da787f2adba41ace305a09ecc065c5e91b0b80
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7ba5db5b81b6826d9b84207559dd8cdb0b9297845fc72cde43cb565faf3a995
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.6359907145355678,
5
- "global_step": 60000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -726,11 +726,59 @@
726
  "learning_rate": 4.95030419957734e-06,
727
  "loss": 1.7637,
728
  "step": 60000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
729
  }
730
  ],
731
  "max_steps": 943410,
732
  "num_train_epochs": 10,
733
- "total_flos": 3.379573384711373e+16,
734
  "trial_name": null,
735
  "trial_params": null
736
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.6783900955046056,
5
+ "global_step": 64000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
726
  "learning_rate": 4.95030419957734e-06,
727
  "loss": 1.7637,
728
  "step": 60000
729
+ },
730
+ {
731
+ "epoch": 0.64,
732
+ "learning_rate": 4.9494749648583875e-06,
733
+ "loss": 1.7161,
734
+ "step": 60500
735
+ },
736
+ {
737
+ "epoch": 0.65,
738
+ "learning_rate": 4.94863893948379e-06,
739
+ "loss": 1.7069,
740
+ "step": 61000
741
+ },
742
+ {
743
+ "epoch": 0.65,
744
+ "learning_rate": 4.9477978181718865e-06,
745
+ "loss": 1.7084,
746
+ "step": 61500
747
+ },
748
+ {
749
+ "epoch": 0.66,
750
+ "learning_rate": 4.946949937970748e-06,
751
+ "loss": 1.7007,
752
+ "step": 62000
753
+ },
754
+ {
755
+ "epoch": 0.66,
756
+ "learning_rate": 4.946093581740578e-06,
757
+ "loss": 1.714,
758
+ "step": 62500
759
+ },
760
+ {
761
+ "epoch": 0.67,
762
+ "learning_rate": 4.9452304442289365e-06,
763
+ "loss": 1.7228,
764
+ "step": 63000
765
+ },
766
+ {
767
+ "epoch": 0.67,
768
+ "learning_rate": 4.944360527828692e-06,
769
+ "loss": 1.7279,
770
+ "step": 63500
771
+ },
772
+ {
773
+ "epoch": 0.68,
774
+ "learning_rate": 4.943483834951505e-06,
775
+ "loss": 1.7026,
776
+ "step": 64000
777
  }
778
  ],
779
  "max_steps": 943410,
780
  "num_train_epochs": 10,
781
+ "total_flos": 3.605231193396019e+16,
782
  "trial_name": null,
783
  "trial_params": null
784
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24918df0f1f9d1f5aadf7b8e4933628be882e87804ac0114cbca0ad2c83737f7
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c80a0783dcb4761d467c9fccd3ad9305d694cfd8a74940361136dfaf12ce4dfa
3
  size 1944201353
runs/May14_19-37-01_15e842f7c026/events.out.tfevents.1684094526.15e842f7c026.771.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de578695d7b19188bd6bbd53f9a0638874a8dcac4a1771e6bcf927b6589c26eb
3
- size 5743
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77b91fb82c97d3bca0eb4dfcc9806cd209db085bb56a651dc6901c0500042a65
3
+ size 7023