ncbateman committed on
Commit
c88d44e
·
verified ·
1 Parent(s): 3e01cd9

Training in progress, step 685, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa4cdb306bf7294222f7b3f970f532c7b4cdc22e6cc372d92a68a5832ae3ac9
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a662f46feddbe2497f49933107c98ff00f401806533aaf98017b0ee6565b00be
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3eb132123db17680d8840722840709fbc913fe87e08366059ecb3b185ef779ee
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d00e266f5b1f45df60e8c44f7e3943273cb57caebf20915b93c9a2bb87831d7
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:477ac7793a58a9aee87e63f0ed0db383646c754c91fbf8cf6726681a3e1bf55c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad79945a21a826c0f45869cc500d5d990f1fd3dd860f10e0654ca0015c8252fb
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59c557a3a19fcbe03c6517f32635519665f582ddfe4481e7465a155c1f572f8b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6df9925b4c7f085a8aa1642bfcd531b37d20682fc6e02418e3381af28e29b06
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.8799741184082821,
5
  "eval_steps": 386,
6
- "global_step": 680,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4783,6 +4783,41 @@
4783
  "learning_rate": 9.340397251217009e-05,
4784
  "loss": 0.8103,
4785
  "step": 680
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4786
  }
4787
  ],
4788
  "logging_steps": 1,
@@ -4802,7 +4837,7 @@
4802
  "attributes": {}
4803
  }
4804
  },
4805
- "total_flos": 7.601972767516262e+17,
4806
  "train_batch_size": 4,
4807
  "trial_name": null,
4808
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8864445163377548,
5
  "eval_steps": 386,
6
+ "global_step": 685,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4783
  "learning_rate": 9.340397251217009e-05,
4784
  "loss": 0.8103,
4785
  "step": 680
4786
+ },
4787
+ {
4788
+ "epoch": 0.8812681979941767,
4789
+ "grad_norm": 0.8201668858528137,
4790
+ "learning_rate": 9.338349101318261e-05,
4791
+ "loss": 0.7959,
4792
+ "step": 681
4793
+ },
4794
+ {
4795
+ "epoch": 0.8825622775800712,
4796
+ "grad_norm": 0.814172625541687,
4797
+ "learning_rate": 9.336298001743846e-05,
4798
+ "loss": 0.8074,
4799
+ "step": 682
4800
+ },
4801
+ {
4802
+ "epoch": 0.8838563571659657,
4803
+ "grad_norm": 0.7825469374656677,
4804
+ "learning_rate": 9.33424395388832e-05,
4805
+ "loss": 0.91,
4806
+ "step": 683
4807
+ },
4808
+ {
4809
+ "epoch": 0.8851504367518602,
4810
+ "grad_norm": 0.7842270135879517,
4811
+ "learning_rate": 9.332186959148248e-05,
4812
+ "loss": 0.9331,
4813
+ "step": 684
4814
+ },
4815
+ {
4816
+ "epoch": 0.8864445163377548,
4817
+ "grad_norm": 0.8008681535720825,
4818
+ "learning_rate": 9.330127018922194e-05,
4819
+ "loss": 0.7166,
4820
+ "step": 685
4821
  }
4822
  ],
4823
  "logging_steps": 1,
 
4837
  "attributes": {}
4838
  }
4839
  },
4840
+ "total_flos": 7.657869626100941e+17,
4841
  "train_batch_size": 4,
4842
  "trial_name": null,
4843
  "trial_params": null