Nekofox commited on
Commit
aad68f2
1 Parent(s): ec3d8f5

Training in progress, step 654000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49722fb4525cdfb5db10b91cc9964d6d93d53a3f624d39e81da612430ad473a1
3
  size 3871544599
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46484171f9b6c5ac946d864e246abccda92dd4f25ee62ce6099d28cc729da487
3
  size 3871544599
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca9a9edb197fdbdf00385a4c3210b7e932baf72faf125a9727ef9e5c30f08804
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86b09a69f43945d8bf2d66867995e93a245540aa345dcd0cd225e099d63d33e
3
  size 1944201353
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0e68f9154824758e939f3f203bd07329f72d1b44231a034da24c8f1b729ad93
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:936cadd1d64a617d3c80546b4e9ae3b5969c939f4794ae3e639825fdaca492b9
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f803e795f13c2c61f76367562826b3d0d4c17b6383f5b4bcdb43021fd0dba972
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9763dfb7cc467a3044703e2e59550f35dc18ba90b54d9372192d8a07f59078ce
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f3d07c5e6735b6a42b3fb3c809508eeb0916a9cf2438aa81c83c4bba3bf70b8
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da4e619cef69a82f65fefd8d8bf453d1ca59509aaa3224e842dd273c6e04dad3
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 17.065103647859413,
5
- "global_step": 651000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -7818,11 +7818,47 @@
7818
  "learning_rate": 2.621422471037019e-07,
7819
  "loss": 1.0198,
7820
  "step": 651000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7821
  }
7822
  ],
7823
  "max_steps": 762960,
7824
  "num_train_epochs": 20,
7825
- "total_flos": 7.731104357603082e+17,
7826
  "trial_name": null,
7827
  "trial_params": null
7828
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 17.143754390747713,
5
+ "global_step": 654000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
7818
  "learning_rate": 2.621422471037019e-07,
7819
  "loss": 1.0198,
7820
  "step": 651000
7821
+ },
7822
+ {
7823
+ "epoch": 17.08,
7824
+ "learning_rate": 2.598525467057997e-07,
7825
+ "loss": 1.0052,
7826
+ "step": 651500
7827
+ },
7828
+ {
7829
+ "epoch": 17.09,
7830
+ "learning_rate": 2.575723416948414e-07,
7831
+ "loss": 1.0092,
7832
+ "step": 652000
7833
+ },
7834
+ {
7835
+ "epoch": 17.1,
7836
+ "learning_rate": 2.553061736434792e-07,
7837
+ "loss": 1.0156,
7838
+ "step": 652500
7839
+ },
7840
+ {
7841
+ "epoch": 17.12,
7842
+ "learning_rate": 2.5304496932272714e-07,
7843
+ "loss": 1.012,
7844
+ "step": 653000
7845
+ },
7846
+ {
7847
+ "epoch": 17.13,
7848
+ "learning_rate": 2.507932892444226e-07,
7849
+ "loss": 1.0073,
7850
+ "step": 653500
7851
+ },
7852
+ {
7853
+ "epoch": 17.14,
7854
+ "learning_rate": 2.485511429528359e-07,
7855
+ "loss": 1.0151,
7856
+ "step": 654000
7857
  }
7858
  ],
7859
  "max_steps": 762960,
7860
  "num_train_epochs": 20,
7861
+ "total_flos": 7.764147094555607e+17,
7862
  "trial_name": null,
7863
  "trial_params": null
7864
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a817e83c25ddaa8901cfc233f35e575b7ed2a8f04ee848f1df7a6ce2254ee042
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c4f6b95116fa2850a3e79a5e5ca987117cd0c0e048d0df05238b7b9d1e075f
3
  size 3771
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca9a9edb197fdbdf00385a4c3210b7e932baf72faf125a9727ef9e5c30f08804
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86b09a69f43945d8bf2d66867995e93a245540aa345dcd0cd225e099d63d33e
3
  size 1944201353
runs/Jun05_15-17-53_cc80fbc5a73c/1685978328.9691155/events.out.tfevents.1685978328.cc80fbc5a73c.10476.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:505a1766d67e9068b9918997269f5b796ea17b141c75f3f422b1fb17b0f33578
3
+ size 6184
runs/Jun05_15-17-53_cc80fbc5a73c/events.out.tfevents.1685978328.cc80fbc5a73c.10476.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed547c48fad89210b9e31ef59c6b25636e6f3b92fc69406276f50df01a67c22b
3
+ size 4461
runs/Jun05_15-52-52_cc80fbc5a73c/1685980427.3172033/events.out.tfevents.1685980427.cc80fbc5a73c.10476.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57f6bc42b9c797a3b761d2faff81b1a6a90fc0e136e94de2aa8e3d34a7f55105
3
+ size 6184
runs/Jun05_15-52-52_cc80fbc5a73c/events.out.tfevents.1685980427.cc80fbc5a73c.10476.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8043880ae85a6e32e1326bf6b812681b2b5ebe8b05f856a8bc0415f862862253
3
+ size 5421
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a817e83c25ddaa8901cfc233f35e575b7ed2a8f04ee848f1df7a6ce2254ee042
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c4f6b95116fa2850a3e79a5e5ca987117cd0c0e048d0df05238b7b9d1e075f
3
  size 3771