ncbateman commited on
Commit
4079918
·
verified ·
1 Parent(s): ecb0ce9

Training in progress, step 695, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a3b487bcd9f0f8a52ebb009ad90b8ecda6c53af66c9e15949f86cd4ee4c5493
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2818821d2bd85c742350df6f93ddc6ceaa5a28fbd9c64e00f2455a5ea94572d
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:963768aacc28d56da4770e8791826eb46d62fef62323535d71a32db43b751e99
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3c3d6d6a41f72e4e2daea557637ea5b684d9fb7a2db23f4008a8c201310880c
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:679bf09455ce8b50952b872f5ea495d76ca0e5689b5a5b2ac13810d836dad521
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c791046602634dc7125db7c8a6fa9643238ca36be61916506dd41a5029b29c2a
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb6690e503326fa9d439d70768c7431f28556349fb205663edc4009a63fe4c77
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:743b3e06741f3e617852c286974506bffbbfec118a8156be26ba7327d67612e1
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.8929149142672275,
5
  "eval_steps": 386,
6
- "global_step": 690,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4853,6 +4853,41 @@
4853
  "learning_rate": 9.319783184592142e-05,
4854
  "loss": 0.9691,
4855
  "step": 690
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4856
  }
4857
  ],
4858
  "logging_steps": 1,
@@ -4872,7 +4907,7 @@
4872
  "attributes": {}
4873
  }
4874
  },
4875
- "total_flos": 7.713766484685619e+17,
4876
  "train_batch_size": 4,
4877
  "trial_name": null,
4878
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8993853121967001,
5
  "eval_steps": 386,
6
+ "global_step": 695,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4853
  "learning_rate": 9.319783184592142e-05,
4854
  "loss": 0.9691,
4855
  "step": 690
4856
+ },
4857
+ {
4858
+ "epoch": 0.8942089938531219,
4859
+ "grad_norm": 0.6824143528938293,
4860
+ "learning_rate": 9.317705600932164e-05,
4861
+ "loss": 0.7027,
4862
+ "step": 691
4863
+ },
4864
+ {
4865
+ "epoch": 0.8955030734390165,
4866
+ "grad_norm": 0.8860282301902771,
4867
+ "learning_rate": 9.315625081632191e-05,
4868
+ "loss": 0.9419,
4869
+ "step": 692
4870
+ },
4871
+ {
4872
+ "epoch": 0.896797153024911,
4873
+ "grad_norm": 0.9011827707290649,
4874
+ "learning_rate": 9.313541628106777e-05,
4875
+ "loss": 0.8468,
4876
+ "step": 693
4877
+ },
4878
+ {
4879
+ "epoch": 0.8980912326108056,
4880
+ "grad_norm": 0.836565375328064,
4881
+ "learning_rate": 9.311455241772482e-05,
4882
+ "loss": 1.0456,
4883
+ "step": 694
4884
+ },
4885
+ {
4886
+ "epoch": 0.8993853121967001,
4887
+ "grad_norm": 0.819817841053009,
4888
+ "learning_rate": 9.309365924047853e-05,
4889
+ "loss": 0.9606,
4890
+ "step": 695
4891
  }
4892
  ],
4893
  "logging_steps": 1,
 
4907
  "attributes": {}
4908
  }
4909
  },
4910
+ "total_flos": 7.769663343270298e+17,
4911
  "train_batch_size": 4,
4912
  "trial_name": null,
4913
  "trial_params": null