AmberYifan commited on
Commit
7895987
·
verified ·
1 Parent(s): 4398369

Training in progress, step 124, checkpoint

Browse files
last-checkpoint/global_step124/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8232dc29225a0415e93846f907f121d4883923a2454ac5f24439b1ddaec48ed6
3
+ size 14483467880
last-checkpoint/global_step124/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb12c0ff2edb4f0e32ab5b430273aac19e4f909138fcbd89050eaf4325785680
3
+ size 14483467880
last-checkpoint/global_step124/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed8017e9fc3ce74c24dab1205b495fefc3f0cc3a8ec990382dd6a9944b9d1ae
3
+ size 14483467880
last-checkpoint/global_step124/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09aca282ac37c9412a45b2216a419897f820e1673f8ed512018453639b823f45
3
+ size 14483467880
last-checkpoint/global_step124/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66045da7ecfe0e7cb3640c641a4309cae5379c4f301e3c72c1c4a8efe9529782
3
+ size 150629
last-checkpoint/global_step124/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16584df5949a6bb6166bd5286273f4e9b5d86cb9d794005e8298925747917133
3
+ size 150629
last-checkpoint/global_step124/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f92af64c22beb18e2a8e224a2437108f2d2d47e27436c3f19c6da4a5c9f96186
3
+ size 150629
last-checkpoint/global_step124/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32bb4a2c24916b82c832b2cebf4eb467a11ffa7c9e5514cfa4a382e45b22fe20
3
+ size 150629
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step62
 
1
+ global_step124
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1313c056599e2844cb7a30e3753cb3fcc1f3fe95c952235ad20b9801ba0f3cfa
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5ef837fbded3b18cd0a4c60904eea5a7736290649d3272b2d4d747062f78dca
3
  size 4943162336
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebdb8fc2bc7fe59280c4c3f36cc96d0c80b52f8a18ec1e3bbeb0c24ebd84bfca
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94825f39a3c46a97f26e600562154fe1141d122c3aed77b1c8207909e2d39dd3
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7538f12ff8c566bca31f4b0fdf4ac9e9afef563611a613f69cb433a4aeed2596
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccc54b0a6d0a78d822a62f65c8269ae1cd3e47b5d8ee2bbc91a50cad768ab180
3
  size 4540516344
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4a1dc8b9f546123ce9b44c28828ae71d9d0ecd6f59c6b7b8337c73cb2e24c49
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a82e580e4e92d21ee2fca0348b8c83585fc265a3bdec704f0dbfaf6f2f800587
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a8b225b0323772b66570a16b5c7e6446dc3c9ee076597906a2c90e3c0a383bf
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2f5b0e26d51388f8180f8023bedbf0f066c7e40bd40eba6f2df3d9d9be582f4
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c036a8d528905f7018266618c8bebe4add10c2778ef432fd0116369fa622d815
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14c4a2665fddc1defbf2e5e1c0f3875ebfe701d33e843d7bd93ecde03037e001
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b93d88429d97654e76d10b1ba4c36f29a47e210c65a03efdc136f04af8282797
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02a7d95f6cb55234c18abb2f3a67c0a306f262d68ef9b79e11b501a08555b93
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7a6860338b2857ca387402b84af60aa023d3c6c998b782fb5dcd5a6ae91d2d2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537ea638b6cb2eeeba0fa5565c11e75e59cd64d0fdb026e5c722db4638703a11
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.1984,
5
  "eval_steps": 62,
6
- "global_step": 62,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -128,6 +128,112 @@
128
  "eval_samples_per_second": 7.273,
129
  "eval_steps_per_second": 0.473,
130
  "step": 62
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
131
  }
132
  ],
133
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.3968,
5
  "eval_steps": 62,
6
+ "global_step": 124,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
128
  "eval_samples_per_second": 7.273,
129
  "eval_steps_per_second": 0.473,
130
  "step": 62
131
+ },
132
+ {
133
+ "epoch": 0.224,
134
+ "grad_norm": 111.31786558317472,
135
+ "learning_rate": 3.7234042553191484e-07,
136
+ "logits/generated": -2.4125685691833496,
137
+ "logits/real": -2.412478446960449,
138
+ "logps/generated": -122.41896057128906,
139
+ "logps/real": -142.01275634765625,
140
+ "loss": 0.7703,
141
+ "rewards/accuracies": 0.6499999761581421,
142
+ "rewards/generated": 1.1598608493804932,
143
+ "rewards/margins": 0.22506161034107208,
144
+ "rewards/real": 1.3849226236343384,
145
+ "step": 70
146
+ },
147
+ {
148
+ "epoch": 0.256,
149
+ "grad_norm": 108.77845029282479,
150
+ "learning_rate": 4.25531914893617e-07,
151
+ "logits/generated": -2.425182819366455,
152
+ "logits/real": -2.4704861640930176,
153
+ "logps/generated": -111.57796478271484,
154
+ "logps/real": -133.41946411132812,
155
+ "loss": 0.7575,
156
+ "rewards/accuracies": 0.637499988079071,
157
+ "rewards/generated": 1.273758888244629,
158
+ "rewards/margins": 0.2473028153181076,
159
+ "rewards/real": 1.521061658859253,
160
+ "step": 80
161
+ },
162
+ {
163
+ "epoch": 0.288,
164
+ "grad_norm": 87.55111605760202,
165
+ "learning_rate": 4.787234042553192e-07,
166
+ "logits/generated": -2.457540988922119,
167
+ "logits/real": -2.5106961727142334,
168
+ "logps/generated": -118.1611099243164,
169
+ "logps/real": -128.29928588867188,
170
+ "loss": 0.6781,
171
+ "rewards/accuracies": 0.7124999761581421,
172
+ "rewards/generated": 0.9840036630630493,
173
+ "rewards/margins": 0.5047105550765991,
174
+ "rewards/real": 1.4887142181396484,
175
+ "step": 90
176
+ },
177
+ {
178
+ "epoch": 0.32,
179
+ "grad_norm": 86.71987338916492,
180
+ "learning_rate": 4.96437054631829e-07,
181
+ "logits/generated": -2.4262959957122803,
182
+ "logits/real": -2.446533679962158,
183
+ "logps/generated": -118.33076477050781,
184
+ "logps/real": -132.8785400390625,
185
+ "loss": 0.7601,
186
+ "rewards/accuracies": 0.637499988079071,
187
+ "rewards/generated": 1.1130377054214478,
188
+ "rewards/margins": 0.3733757734298706,
189
+ "rewards/real": 1.4864133596420288,
190
+ "step": 100
191
+ },
192
+ {
193
+ "epoch": 0.352,
194
+ "grad_norm": 85.8458816841653,
195
+ "learning_rate": 4.904988123515439e-07,
196
+ "logits/generated": -2.3812742233276367,
197
+ "logits/real": -2.4494009017944336,
198
+ "logps/generated": -113.8266372680664,
199
+ "logps/real": -131.19769287109375,
200
+ "loss": 0.7051,
201
+ "rewards/accuracies": 0.762499988079071,
202
+ "rewards/generated": 0.42378121614456177,
203
+ "rewards/margins": 0.6939576268196106,
204
+ "rewards/real": 1.1177388429641724,
205
+ "step": 110
206
+ },
207
+ {
208
+ "epoch": 0.384,
209
+ "grad_norm": 71.18315494374211,
210
+ "learning_rate": 4.845605700712589e-07,
211
+ "logits/generated": -2.4884400367736816,
212
+ "logits/real": -2.6123955249786377,
213
+ "logps/generated": -122.7501220703125,
214
+ "logps/real": -125.4404067993164,
215
+ "loss": 0.7524,
216
+ "rewards/accuracies": 0.5625,
217
+ "rewards/generated": 1.1129395961761475,
218
+ "rewards/margins": 0.42210373282432556,
219
+ "rewards/real": 1.5350432395935059,
220
+ "step": 120
221
+ },
222
+ {
223
+ "epoch": 0.3968,
224
+ "eval_logits/generated": -2.5561394691467285,
225
+ "eval_logits/real": -2.586364269256592,
226
+ "eval_logps/generated": -108.77558898925781,
227
+ "eval_logps/real": -121.60958099365234,
228
+ "eval_loss": 0.7001773715019226,
229
+ "eval_rewards/accuracies": 0.692307710647583,
230
+ "eval_rewards/generated": 1.2539945840835571,
231
+ "eval_rewards/margins": 0.47646236419677734,
232
+ "eval_rewards/real": 1.7304571866989136,
233
+ "eval_runtime": 36.5599,
234
+ "eval_samples_per_second": 5.47,
235
+ "eval_steps_per_second": 0.356,
236
+ "step": 124
237
  }
238
  ],
239
  "logging_steps": 10,