ncbateman committed on
Commit
5fba230
·
verified ·
1 Parent(s): c460b3e

Training in progress, step 720, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52ab772a3d2f29871c5b33edf53b3357c7f213d43a3b6c7fe3da00f9e9e266b8
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a4972d945aaf79f38a6385891c2c6bf16c9ab13d1387a9a314a9ae88e2af9d7
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0019585f029b5baa58be8cfe62931034d42db0a67d35a6a218c83edc08d495f6
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:263b3898d405f513a3d751718a8e4459efbe49762bd2d59a834f0b0bd5f9c305
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cf483ccbcb523a1ae54b6742d201e95685c3798b63064fda748091e660916fb
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92e2bed38537091b1b6847ec894ec446f212f658d47a8eafa5ceedcd4769dcc4
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68087e6a2853e7290ab7c85e019dd29d494adf51d146626f9b298ee98b25dc83
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa5e57bbef4d99689575267a9a61782e3d42e915f722a8a205895c6faf79e5c7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9252669039145908,
5
  "eval_steps": 386,
6
- "global_step": 715,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5028,6 +5028,41 @@
5028
  "learning_rate": 9.266966179767538e-05,
5029
  "loss": 0.7856,
5030
  "step": 715
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5031
  }
5032
  ],
5033
  "logging_steps": 1,
@@ -5047,7 +5082,7 @@
5047
  "attributes": {}
5048
  }
5049
  },
5050
- "total_flos": 7.993250777609011e+17,
5051
  "train_batch_size": 4,
5052
  "trial_name": null,
5053
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9317373018440634,
5
  "eval_steps": 386,
6
+ "global_step": 720,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5028
  "learning_rate": 9.266966179767538e-05,
5029
  "loss": 0.7856,
5030
  "step": 715
5031
+ },
5032
+ {
5033
+ "epoch": 0.9265609835004853,
5034
+ "grad_norm": 0.8092474937438965,
5035
+ "learning_rate": 9.264815634051982e-05,
5036
+ "loss": 1.0298,
5037
+ "step": 716
5038
+ },
5039
+ {
5040
+ "epoch": 0.9278550630863798,
5041
+ "grad_norm": 0.8919221758842468,
5042
+ "learning_rate": 9.262662188656705e-05,
5043
+ "loss": 0.7962,
5044
+ "step": 717
5045
+ },
5046
+ {
5047
+ "epoch": 0.9291491426722743,
5048
+ "grad_norm": 0.771659791469574,
5049
+ "learning_rate": 9.260505845045854e-05,
5050
+ "loss": 1.0239,
5051
+ "step": 718
5052
+ },
5053
+ {
5054
+ "epoch": 0.9304432222581689,
5055
+ "grad_norm": 0.7577182054519653,
5056
+ "learning_rate": 9.258346604685542e-05,
5057
+ "loss": 0.9672,
5058
+ "step": 719
5059
+ },
5060
+ {
5061
+ "epoch": 0.9317373018440634,
5062
+ "grad_norm": 0.7373968362808228,
5063
+ "learning_rate": 9.256184469043851e-05,
5064
+ "loss": 0.7484,
5065
+ "step": 720
5066
  }
5067
  ],
5068
  "logging_steps": 1,
 
5082
  "attributes": {}
5083
  }
5084
  },
5085
+ "total_flos": 8.04914763619369e+17,
5086
  "train_batch_size": 4,
5087
  "trial_name": null,
5088
  "trial_params": null