AmberYifan commited on
Commit
2b2ca8a
1 Parent(s): f112cc5

Training in progress, step 936, checkpoint

Browse files
last-checkpoint/global_step936/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e77a0d44241097b329310fb937831b42336816347dcbff5933c4dcd9260c02c
3
+ size 14483467880
last-checkpoint/global_step936/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a69f404f68683abbbca660d382b195ee997d5dbb69450863a00743a030a04d65
3
+ size 14483467880
last-checkpoint/global_step936/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef693a22aa13fb0a4efc9309a73331a0dc3b75ea7e79e6f385061dae5f8cadb
3
+ size 14483467880
last-checkpoint/global_step936/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be84f2c1f72c8a09c08f41cc770a56f12d7b210f22f67653a0d9a4d3122ff4d5
3
+ size 14483467880
last-checkpoint/global_step936/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb8e8226e612c7eb7aef00de840accd9ede88949eb3a3907655b10647a9bb15d
3
+ size 150629
last-checkpoint/global_step936/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f364f198b089e3e013034b0b6f5c46f056c69dde549de868d5280a87dc035d1
3
+ size 150629
last-checkpoint/global_step936/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:907c007ea3bd3d7dc8f1b747b87f5d7bd7de84fcf7963f773f54773bd2d8282c
3
+ size 150629
last-checkpoint/global_step936/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64f8f1488c715e1e2371f045bc7a763d0cab1572e5337ac22395684df0514088
3
+ size 150629
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step930
 
1
+ global_step936
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b8f60f47366913845f02edcefe3c9ebe0b02b6f0638f6b36cbda31ee6a29620
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f53da177259bd2a2db86a7e77851a46396762aee159ff39a95c0449b94bbacbb
3
  size 4943162336
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d947dc0d2ccdc25f3df4e7bae9c9f62f9ee94717b9e6adf29816f206cb9c1bd6
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56aa7cb229c570175cf312e0ea44ab87abca69083d6d08e1a2a29a788c23412
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93920835041bd996f9e062b2f0825850c39ead3febffe838b89b7a0967059b66
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:574acf3c0744e875058dce1701853c6e6156c36e9366abf58304ded4e177abff
3
  size 4540516344
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98ace375a7a3e380a16715316d6e5e36d9cb62649995c07cc349fb85673d36ff
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7bdce5778934f6c9002d4767cdecb9bb6877049f525666aece67f4eed039ef3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.976,
5
  "eval_steps": 62,
6
- "global_step": 930,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1671,7 +1671,7 @@
1671
  "should_evaluate": false,
1672
  "should_log": false,
1673
  "should_save": true,
1674
- "should_training_stop": false
1675
  },
1676
  "attributes": {}
1677
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.9952,
5
  "eval_steps": 62,
6
+ "global_step": 936,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1671
  "should_evaluate": false,
1672
  "should_log": false,
1673
  "should_save": true,
1674
+ "should_training_stop": true
1675
  },
1676
  "attributes": {}
1677
  }