Nekofox commited on
Commit
3db83ca
1 Parent(s): aa8a810

Training in progress, step 82000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fda0e5fe549ec2bbd6b44b861b4240b2b8eb1b05c2b398b62e81cb4cec45858
3
  size 3871544599
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5a5b2493529df71a379e03aceed1ddf08858862981c8490b324f0d677b2c8ab
3
  size 3871544599
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce81deabfd18bbdab45e183fa2de8b4bb3e861afc2a7cf21748e8659e78689e0
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6f94fa1057b251e6a9c0d42c7e10e9758a59d645321d1cc9582f8d2a2e2df2d
3
  size 1944201353
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ee84876c7f2a656d566aee4b35660bd05f55d08a876847f7a9618373980c3f3
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac9bcd02cdc1b6c7cac5869d3509f7b05a1d2086795c55cac28ba45375a25f1f
3
  size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb331a19c0420810069d00793f1cb8d9dc4cc1b1645fc6215ba6d2d671f7cc8b
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47de88e32f411b951afd40673c7113ea3a9e24d8093a06f3d88682cdb20e034e
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:363dc8c23d6d69c9d91cbb8e418340018389226bcce8507f5129d9e7f829d211
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85647a99ed4bf5c0c797c9cd93a757114f5be791f28752f8b894b2456864bb55
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5653230821414439,
5
- "global_step": 80000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -966,11 +966,35 @@
966
  "learning_rate": 4.96070703971027e-06,
967
  "loss": 1.6206,
968
  "step": 80000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
969
  }
970
  ],
971
  "max_steps": 1415120,
972
  "num_train_epochs": 10,
973
- "total_flos": 4.173651302439322e+16,
974
  "trial_name": null,
975
  "trial_params": null
976
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.57945615919498,
5
+ "global_step": 82000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
966
  "learning_rate": 4.96070703971027e-06,
967
  "loss": 1.6206,
968
  "step": 80000
969
+ },
970
+ {
971
+ "epoch": 0.57,
972
+ "learning_rate": 4.960215456513178e-06,
973
+ "loss": 1.5827,
974
+ "step": 80500
975
+ },
976
+ {
977
+ "epoch": 0.57,
978
+ "learning_rate": 4.959721834288042e-06,
979
+ "loss": 1.6156,
980
+ "step": 81000
981
+ },
982
+ {
983
+ "epoch": 0.58,
984
+ "learning_rate": 4.959224195197477e-06,
985
+ "loss": 1.5982,
986
+ "step": 81500
987
+ },
988
+ {
989
+ "epoch": 0.58,
990
+ "learning_rate": 4.95872352604645e-06,
991
+ "loss": 1.6165,
992
+ "step": 82000
993
  }
994
  ],
995
  "max_steps": 1415120,
996
  "num_train_epochs": 10,
997
+ "total_flos": 4.237671466401792e+16,
998
  "trial_name": null,
999
  "trial_params": null
1000
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce81deabfd18bbdab45e183fa2de8b4bb3e861afc2a7cf21748e8659e78689e0
3
  size 1944201353
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6f94fa1057b251e6a9c0d42c7e10e9758a59d645321d1cc9582f8d2a2e2df2d
3
  size 1944201353
runs/May15_09-17-05_1fe6bbfe264a/events.out.tfevents.1684142280.1fe6bbfe264a.10378.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb6a895acdf8c4c62e210f0f27ac4d59e0a3b7d96e5ee7acd0552b2f96602750
3
- size 8943
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1387b94b0524f24c8670f43148c1ed8883a648b0a239475a839c0b02f117890c
3
+ size 9583