ncbateman commited on
Commit
863c93a
·
verified ·
1 Parent(s): 7484319

Training in progress, step 465, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a8e766c93c4cb51d235429ab576d2269c0fe74ccc12cbec07722e592fc31d83
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb22d9108d46568eed2a25c6378eb936291db1fd5def7bc554afe2f3f354388f
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9f249a9f18d595322f53870ff656ff9f0fb190feac83ed8e8e07c86b79d402d
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feddcd4823e3bf21b23adc8b4128b78879305ba02f9d65f76af450bf7e0ad182
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4d5ea361bd8f109ccf9deae94ad5b06097316390b345e2c5b8dfcae47e6460a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79792a0c4a549329639ba69896508be1c58dde196d323715b7d4f344f0e143f2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:702e6ac2a5684998fe08dbec2461764b61e07652058ef3b71a2777c5464d9e27
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b2a9c436b3bae0ae5d93979cf58505c2ebbb5587127ec39bd71f602d8b990f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.595276609511485,
5
  "eval_steps": 386,
6
- "global_step": 460,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -3243,6 +3243,41 @@
3243
  "learning_rate": 9.716979960019173e-05,
3244
  "loss": 0.8261,
3245
  "step": 460
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3246
  }
3247
  ],
3248
  "logging_steps": 1,
@@ -3262,7 +3297,7 @@
3262
  "attributes": {}
3263
  }
3264
  },
3265
- "total_flos": 5.142510989790413e+17,
3266
  "train_batch_size": 4,
3267
  "trial_name": null,
3268
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.6017470074409577,
5
  "eval_steps": 386,
6
+ "global_step": 465,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
3243
  "learning_rate": 9.716979960019173e-05,
3244
  "loss": 0.8261,
3245
  "step": 460
3246
+ },
3247
+ {
3248
+ "epoch": 0.5965706890973795,
3249
+ "grad_norm": 0.766036331653595,
3250
+ "learning_rate": 9.715610945382177e-05,
3251
+ "loss": 0.9601,
3252
+ "step": 461
3253
+ },
3254
+ {
3255
+ "epoch": 0.597864768683274,
3256
+ "grad_norm": 0.9155464172363281,
3257
+ "learning_rate": 9.714238724566393e-05,
3258
+ "loss": 0.8716,
3259
+ "step": 462
3260
+ },
3261
+ {
3262
+ "epoch": 0.5991588482691685,
3263
+ "grad_norm": 0.8961794972419739,
3264
+ "learning_rate": 9.712863298504807e-05,
3265
+ "loss": 0.9595,
3266
+ "step": 463
3267
+ },
3268
+ {
3269
+ "epoch": 0.6004529278550631,
3270
+ "grad_norm": 0.8102921843528748,
3271
+ "learning_rate": 9.711484668132575e-05,
3272
+ "loss": 0.7174,
3273
+ "step": 464
3274
+ },
3275
+ {
3276
+ "epoch": 0.6017470074409577,
3277
+ "grad_norm": 0.7466800808906555,
3278
+ "learning_rate": 9.710102834387043e-05,
3279
+ "loss": 0.8707,
3280
+ "step": 465
3281
  }
3282
  ],
3283
  "logging_steps": 1,
 
3297
  "attributes": {}
3298
  }
3299
  },
3300
+ "total_flos": 5.198407848375091e+17,
3301
  "train_batch_size": 4,
3302
  "trial_name": null,
3303
  "trial_params": null