Nekofox commited on
Commit
c4e49e7
1 Parent(s): ac89ad4

Training in progress, step 585000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f1a48804678162ab3aecf919d1b706d10ef7258fab83c58318f53ff5a3fa94b
3
  size 3871544599
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:800f47d6c105599f23476b36ba02ef6cd898b37ec9f6ea6c11464b383ba2cbd7
3
  size 3871544599
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ddb0d445df94c4cc297a21738ebeae7340f5cb1491611529b9010ef16e2285e
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ade14b8fcd7033799d31d7c0b3638db665d1101ba6c901b224e22e4630967f0f
3
  size 1944201353
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1be13f5c1447e7a1f0c568d6b3ce9d67f06043aea7e6a6adb6d516e1a9e08df
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d89a086ff98497212b3403fb71dd7cca09fd28ce2e72380eabd270a7198bf63d
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88f64a459349cb576f0b208442db510e681babf73815faf743d1f75670b079e6
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a56e5f53e3690fa8d88396102c5e72891424a69c9adf23f31ba1d7ae3b5bd5e
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0011f6c0eaad524da3d93ee2e4f36118921f7fbfc672d8200c6cde5159731c7
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd7e558efc05c7857c55680cae30ef0a4d65e8d9cbb5e001241cc014941d7312
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 15.256356754149584,
5
- "global_step": 582000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -6990,11 +6990,47 @@
6990
  "learning_rate": 6.640749410559011e-07,
6991
  "loss": 1.0248,
6992
  "step": 582000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6993
  }
6994
  ],
6995
  "max_steps": 762960,
6996
  "num_train_epochs": 20,
6997
- "total_flos": 6.971082996612465e+17,
6998
  "trial_name": null,
6999
  "trial_params": null
7000
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.334997011670215,
5
+ "global_step": 585000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
6990
  "learning_rate": 6.640749410559011e-07,
6991
  "loss": 1.0248,
6992
  "step": 582000
6993
+ },
6994
+ {
6995
+ "epoch": 15.27,
6996
+ "learning_rate": 6.605922514508042e-07,
6997
+ "loss": 1.0305,
6998
+ "step": 582500
6999
+ },
7000
+ {
7001
+ "epoch": 15.28,
7002
+ "learning_rate": 6.571103714792401e-07,
7003
+ "loss": 1.0334,
7004
+ "step": 583000
7005
+ },
7006
+ {
7007
+ "epoch": 15.3,
7008
+ "learning_rate": 6.536363030247672e-07,
7009
+ "loss": 1.0313,
7010
+ "step": 583500
7011
+ },
7012
+ {
7013
+ "epoch": 15.31,
7014
+ "learning_rate": 6.501700608130337e-07,
7015
+ "loss": 1.0269,
7016
+ "step": 584000
7017
+ },
7018
+ {
7019
+ "epoch": 15.32,
7020
+ "learning_rate": 6.467116595365149e-07,
7021
+ "loss": 1.0397,
7022
+ "step": 584500
7023
+ },
7024
+ {
7025
+ "epoch": 15.33,
7026
+ "learning_rate": 6.432680070962052e-07,
7027
+ "loss": 1.0271,
7028
+ "step": 585000
7029
  }
7030
  ],
7031
  "max_steps": 762960,
7032
  "num_train_epochs": 20,
7033
+ "total_flos": 7.004102496447283e+17,
7034
  "trial_name": null,
7035
  "trial_params": null
7036
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ddb0d445df94c4cc297a21738ebeae7340f5cb1491611529b9010ef16e2285e
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ade14b8fcd7033799d31d7c0b3638db665d1101ba6c901b224e22e4630967f0f
3
  size 1944201353
runs/Jun01_02-00-15_72d6bfb1a401/events.out.tfevents.1685586378.72d6bfb1a401.2268.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ae362c64a1320faae29882bc06c0bf84eeb1edd292e0baf069f637fc22f4975
3
- size 9261
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:289f05ba23629ccf8a109c80a0479b07884acff653ab97fe91883a05fb591060
3
+ size 10221