Training in progress, step 124, checkpoint
Browse files- last-checkpoint/global_step124/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step124/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step124/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step124/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step124/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step124/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step124/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step124/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +108 -2
last-checkpoint/global_step124/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8232dc29225a0415e93846f907f121d4883923a2454ac5f24439b1ddaec48ed6
|
3 |
+
size 14483467880
|
last-checkpoint/global_step124/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb12c0ff2edb4f0e32ab5b430273aac19e4f909138fcbd89050eaf4325785680
|
3 |
+
size 14483467880
|
last-checkpoint/global_step124/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ed8017e9fc3ce74c24dab1205b495fefc3f0cc3a8ec990382dd6a9944b9d1ae
|
3 |
+
size 14483467880
|
last-checkpoint/global_step124/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09aca282ac37c9412a45b2216a419897f820e1673f8ed512018453639b823f45
|
3 |
+
size 14483467880
|
last-checkpoint/global_step124/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66045da7ecfe0e7cb3640c641a4309cae5379c4f301e3c72c1c4a8efe9529782
|
3 |
+
size 150629
|
last-checkpoint/global_step124/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16584df5949a6bb6166bd5286273f4e9b5d86cb9d794005e8298925747917133
|
3 |
+
size 150629
|
last-checkpoint/global_step124/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f92af64c22beb18e2a8e224a2437108f2d2d47e27436c3f19c6da4a5c9f96186
|
3 |
+
size 150629
|
last-checkpoint/global_step124/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32bb4a2c24916b82c832b2cebf4eb467a11ffa7c9e5514cfa4a382e45b22fe20
|
3 |
+
size 150629
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step124
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943162336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5ef837fbded3b18cd0a4c60904eea5a7736290649d3272b2d4d747062f78dca
|
3 |
size 4943162336
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94825f39a3c46a97f26e600562154fe1141d122c3aed77b1c8207909e2d39dd3
|
3 |
size 4999819336
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540516344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccc54b0a6d0a78d822a62f65c8269ae1cd3e47b5d8ee2bbc91a50cad768ab180
|
3 |
size 4540516344
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a82e580e4e92d21ee2fca0348b8c83585fc265a3bdec704f0dbfaf6f2f800587
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2f5b0e26d51388f8180f8023bedbf0f066c7e40bd40eba6f2df3d9d9be582f4
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14c4a2665fddc1defbf2e5e1c0f3875ebfe701d33e843d7bd93ecde03037e001
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f02a7d95f6cb55234c18abb2f3a67c0a306f262d68ef9b79e11b501a08555b93
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:537ea638b6cb2eeeba0fa5565c11e75e59cd64d0fdb026e5c722db4638703a11
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -128,6 +128,112 @@
|
|
128 |
"eval_samples_per_second": 7.273,
|
129 |
"eval_steps_per_second": 0.473,
|
130 |
"step": 62
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
131 |
}
|
132 |
],
|
133 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.3968,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 124,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
128 |
"eval_samples_per_second": 7.273,
|
129 |
"eval_steps_per_second": 0.473,
|
130 |
"step": 62
|
131 |
+
},
|
132 |
+
{
|
133 |
+
"epoch": 0.224,
|
134 |
+
"grad_norm": 111.31786558317472,
|
135 |
+
"learning_rate": 3.7234042553191484e-07,
|
136 |
+
"logits/generated": -2.4125685691833496,
|
137 |
+
"logits/real": -2.412478446960449,
|
138 |
+
"logps/generated": -122.41896057128906,
|
139 |
+
"logps/real": -142.01275634765625,
|
140 |
+
"loss": 0.7703,
|
141 |
+
"rewards/accuracies": 0.6499999761581421,
|
142 |
+
"rewards/generated": 1.1598608493804932,
|
143 |
+
"rewards/margins": 0.22506161034107208,
|
144 |
+
"rewards/real": 1.3849226236343384,
|
145 |
+
"step": 70
|
146 |
+
},
|
147 |
+
{
|
148 |
+
"epoch": 0.256,
|
149 |
+
"grad_norm": 108.77845029282479,
|
150 |
+
"learning_rate": 4.25531914893617e-07,
|
151 |
+
"logits/generated": -2.425182819366455,
|
152 |
+
"logits/real": -2.4704861640930176,
|
153 |
+
"logps/generated": -111.57796478271484,
|
154 |
+
"logps/real": -133.41946411132812,
|
155 |
+
"loss": 0.7575,
|
156 |
+
"rewards/accuracies": 0.637499988079071,
|
157 |
+
"rewards/generated": 1.273758888244629,
|
158 |
+
"rewards/margins": 0.2473028153181076,
|
159 |
+
"rewards/real": 1.521061658859253,
|
160 |
+
"step": 80
|
161 |
+
},
|
162 |
+
{
|
163 |
+
"epoch": 0.288,
|
164 |
+
"grad_norm": 87.55111605760202,
|
165 |
+
"learning_rate": 4.787234042553192e-07,
|
166 |
+
"logits/generated": -2.457540988922119,
|
167 |
+
"logits/real": -2.5106961727142334,
|
168 |
+
"logps/generated": -118.1611099243164,
|
169 |
+
"logps/real": -128.29928588867188,
|
170 |
+
"loss": 0.6781,
|
171 |
+
"rewards/accuracies": 0.7124999761581421,
|
172 |
+
"rewards/generated": 0.9840036630630493,
|
173 |
+
"rewards/margins": 0.5047105550765991,
|
174 |
+
"rewards/real": 1.4887142181396484,
|
175 |
+
"step": 90
|
176 |
+
},
|
177 |
+
{
|
178 |
+
"epoch": 0.32,
|
179 |
+
"grad_norm": 86.71987338916492,
|
180 |
+
"learning_rate": 4.96437054631829e-07,
|
181 |
+
"logits/generated": -2.4262959957122803,
|
182 |
+
"logits/real": -2.446533679962158,
|
183 |
+
"logps/generated": -118.33076477050781,
|
184 |
+
"logps/real": -132.8785400390625,
|
185 |
+
"loss": 0.7601,
|
186 |
+
"rewards/accuracies": 0.637499988079071,
|
187 |
+
"rewards/generated": 1.1130377054214478,
|
188 |
+
"rewards/margins": 0.3733757734298706,
|
189 |
+
"rewards/real": 1.4864133596420288,
|
190 |
+
"step": 100
|
191 |
+
},
|
192 |
+
{
|
193 |
+
"epoch": 0.352,
|
194 |
+
"grad_norm": 85.8458816841653,
|
195 |
+
"learning_rate": 4.904988123515439e-07,
|
196 |
+
"logits/generated": -2.3812742233276367,
|
197 |
+
"logits/real": -2.4494009017944336,
|
198 |
+
"logps/generated": -113.8266372680664,
|
199 |
+
"logps/real": -131.19769287109375,
|
200 |
+
"loss": 0.7051,
|
201 |
+
"rewards/accuracies": 0.762499988079071,
|
202 |
+
"rewards/generated": 0.42378121614456177,
|
203 |
+
"rewards/margins": 0.6939576268196106,
|
204 |
+
"rewards/real": 1.1177388429641724,
|
205 |
+
"step": 110
|
206 |
+
},
|
207 |
+
{
|
208 |
+
"epoch": 0.384,
|
209 |
+
"grad_norm": 71.18315494374211,
|
210 |
+
"learning_rate": 4.845605700712589e-07,
|
211 |
+
"logits/generated": -2.4884400367736816,
|
212 |
+
"logits/real": -2.6123955249786377,
|
213 |
+
"logps/generated": -122.7501220703125,
|
214 |
+
"logps/real": -125.4404067993164,
|
215 |
+
"loss": 0.7524,
|
216 |
+
"rewards/accuracies": 0.5625,
|
217 |
+
"rewards/generated": 1.1129395961761475,
|
218 |
+
"rewards/margins": 0.42210373282432556,
|
219 |
+
"rewards/real": 1.5350432395935059,
|
220 |
+
"step": 120
|
221 |
+
},
|
222 |
+
{
|
223 |
+
"epoch": 0.3968,
|
224 |
+
"eval_logits/generated": -2.5561394691467285,
|
225 |
+
"eval_logits/real": -2.586364269256592,
|
226 |
+
"eval_logps/generated": -108.77558898925781,
|
227 |
+
"eval_logps/real": -121.60958099365234,
|
228 |
+
"eval_loss": 0.7001773715019226,
|
229 |
+
"eval_rewards/accuracies": 0.692307710647583,
|
230 |
+
"eval_rewards/generated": 1.2539945840835571,
|
231 |
+
"eval_rewards/margins": 0.47646236419677734,
|
232 |
+
"eval_rewards/real": 1.7304571866989136,
|
233 |
+
"eval_runtime": 36.5599,
|
234 |
+
"eval_samples_per_second": 5.47,
|
235 |
+
"eval_steps_per_second": 0.356,
|
236 |
+
"step": 124
|
237 |
}
|
238 |
],
|
239 |
"logging_steps": 10,
|