AmberYifan
committed on
Commit
•
003766d
1
Parent(s):
75a0fa8
Training in progress, step 806, checkpoint
Browse files
- last-checkpoint/global_step806/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step806/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step806/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step806/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step806/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step806/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step806/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step806/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +214 -2
last-checkpoint/global_step806/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4655b1b3999db772d77f146a4f7f14ee1e3d50fd58911f740c36b4d70c5bf76
|
3 |
+
size 13476835648
|
last-checkpoint/global_step806/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96dcc27ffe6bebd92bf61a45bdc95681d0b5d883b204853945880b81b274398b
|
3 |
+
size 13476835648
|
last-checkpoint/global_step806/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f9bb7e5bb9ca422cb0d1dc04d2671971df137a3f09d07042cad506b9a2d71f9
|
3 |
+
size 13476835648
|
last-checkpoint/global_step806/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba7f1a348180a0d364072685057323ea6b36164ec89aaa3b178eded6e40ff885
|
3 |
+
size 13476835648
|
last-checkpoint/global_step806/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8d40541af74b88448ba760a8978e722801bd2f9f599321fbb51f3dc9b7aa48d
|
3 |
+
size 150693
|
last-checkpoint/global_step806/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:157d3836b0324e6cee2dd66a33217d6e37ed5ed7b3b9b43d035418d1760303bb
|
3 |
+
size 150693
|
last-checkpoint/global_step806/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f58aefc7e17b7c63dbeb24bef6fbbd4df65f9011bd0a645acb9ead93913de3e
|
3 |
+
size 150693
|
last-checkpoint/global_step806/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e7011657dbb583fe08aa94c28ca514c23f5adadb33ff22d042174c99859c360
|
3 |
+
size 150693
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step806
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4938985352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6b19051be7334b0ec1c05289f0ba87187f1d4d8ad4c691e9ccba473137a5c0c
|
3 |
size 4938985352
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4947390880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70b23e112ecb38d9c61e0a318a310cbe0da90c31bcf2bc8cbd996ea1dc8ba03b
|
3 |
size 4947390880
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3590488816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c1e6f6df51c8519ad30f4a5eac897f58101f14df58a659a6a23b1c9d757dd53
|
3 |
size 3590488816
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43ea574d07a576c8cd612773a5015f4f8303ef6ce35f964bd81b8b489ceed9bd
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:231c40114b2d8985fa7545edd47494bc1e9d1e0a8db77f30a4d192048f265712
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d4d2cd69e482e80eb9dbe4006558389d72a76a801f542398022187d536edd47
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08d86ba141f647d4a747b93c9fe2e7871e4a119de2b70afdde8f5f8f330a1740
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b56640485d548dbcc67b1963f981239312b10af622fb02275932812ae1326861
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1218,6 +1218,218 @@
|
|
1218 |
"eval_samples_per_second": 7.845,
|
1219 |
"eval_steps_per_second": 0.51,
|
1220 |
"step": 682
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1221 |
}
|
1222 |
],
|
1223 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.5792,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 806,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1218 |
"eval_samples_per_second": 7.845,
|
1219 |
"eval_steps_per_second": 0.51,
|
1220 |
"step": 682
|
1221 |
+
},
|
1222 |
+
{
|
1223 |
+
"epoch": 2.208,
|
1224 |
+
"grad_norm": 0.3658391972106121,
|
1225 |
+
"learning_rate": 1.4608076009501184e-07,
|
1226 |
+
"logits/generated": -0.7777714133262634,
|
1227 |
+
"logits/real": -1.4327569007873535,
|
1228 |
+
"logps/generated": -349.45123291015625,
|
1229 |
+
"logps/real": -91.0394287109375,
|
1230 |
+
"loss": 0.1006,
|
1231 |
+
"rewards/accuracies": 1.0,
|
1232 |
+
"rewards/generated": -6.516034126281738,
|
1233 |
+
"rewards/margins": 16.061874389648438,
|
1234 |
+
"rewards/real": 9.5458402633667,
|
1235 |
+
"step": 690
|
1236 |
+
},
|
1237 |
+
{
|
1238 |
+
"epoch": 2.24,
|
1239 |
+
"grad_norm": 0.37751724197745956,
|
1240 |
+
"learning_rate": 1.4014251781472683e-07,
|
1241 |
+
"logits/generated": -0.8562400937080383,
|
1242 |
+
"logits/real": -1.4605350494384766,
|
1243 |
+
"logps/generated": -349.2660827636719,
|
1244 |
+
"logps/real": -110.1448745727539,
|
1245 |
+
"loss": 0.0985,
|
1246 |
+
"rewards/accuracies": 1.0,
|
1247 |
+
"rewards/generated": -6.469089508056641,
|
1248 |
+
"rewards/margins": 17.073518753051758,
|
1249 |
+
"rewards/real": 10.604430198669434,
|
1250 |
+
"step": 700
|
1251 |
+
},
|
1252 |
+
{
|
1253 |
+
"epoch": 2.2720000000000002,
|
1254 |
+
"grad_norm": 0.3099039440839268,
|
1255 |
+
"learning_rate": 1.342042755344418e-07,
|
1256 |
+
"logits/generated": -0.9007622003555298,
|
1257 |
+
"logits/real": -1.437908411026001,
|
1258 |
+
"logps/generated": -345.6163330078125,
|
1259 |
+
"logps/real": -93.06938171386719,
|
1260 |
+
"loss": 0.0978,
|
1261 |
+
"rewards/accuracies": 1.0,
|
1262 |
+
"rewards/generated": -6.0835700035095215,
|
1263 |
+
"rewards/margins": 15.84107780456543,
|
1264 |
+
"rewards/real": 9.757506370544434,
|
1265 |
+
"step": 710
|
1266 |
+
},
|
1267 |
+
{
|
1268 |
+
"epoch": 2.304,
|
1269 |
+
"grad_norm": 0.3864668793151262,
|
1270 |
+
"learning_rate": 1.2826603325415677e-07,
|
1271 |
+
"logits/generated": -0.8885849714279175,
|
1272 |
+
"logits/real": -1.5355165004730225,
|
1273 |
+
"logps/generated": -342.10443115234375,
|
1274 |
+
"logps/real": -104.58480072021484,
|
1275 |
+
"loss": 0.1019,
|
1276 |
+
"rewards/accuracies": 1.0,
|
1277 |
+
"rewards/generated": -6.677704811096191,
|
1278 |
+
"rewards/margins": 16.409557342529297,
|
1279 |
+
"rewards/real": 9.731854438781738,
|
1280 |
+
"step": 720
|
1281 |
+
},
|
1282 |
+
{
|
1283 |
+
"epoch": 2.336,
|
1284 |
+
"grad_norm": 0.3445053668290169,
|
1285 |
+
"learning_rate": 1.2232779097387173e-07,
|
1286 |
+
"logits/generated": -0.8385915756225586,
|
1287 |
+
"logits/real": -1.397671103477478,
|
1288 |
+
"logps/generated": -354.0185241699219,
|
1289 |
+
"logps/real": -112.39442443847656,
|
1290 |
+
"loss": 0.1017,
|
1291 |
+
"rewards/accuracies": 1.0,
|
1292 |
+
"rewards/generated": -7.097531795501709,
|
1293 |
+
"rewards/margins": 18.07855987548828,
|
1294 |
+
"rewards/real": 10.981030464172363,
|
1295 |
+
"step": 730
|
1296 |
+
},
|
1297 |
+
{
|
1298 |
+
"epoch": 2.368,
|
1299 |
+
"grad_norm": 0.3341439577424557,
|
1300 |
+
"learning_rate": 1.163895486935867e-07,
|
1301 |
+
"logits/generated": -0.8578903079032898,
|
1302 |
+
"logits/real": -1.383490800857544,
|
1303 |
+
"logps/generated": -347.2725524902344,
|
1304 |
+
"logps/real": -103.35150146484375,
|
1305 |
+
"loss": 0.1017,
|
1306 |
+
"rewards/accuracies": 1.0,
|
1307 |
+
"rewards/generated": -6.981736183166504,
|
1308 |
+
"rewards/margins": 17.021286010742188,
|
1309 |
+
"rewards/real": 10.039549827575684,
|
1310 |
+
"step": 740
|
1311 |
+
},
|
1312 |
+
{
|
1313 |
+
"epoch": 2.3808,
|
1314 |
+
"eval_logits/generated": -0.880645751953125,
|
1315 |
+
"eval_logits/real": -1.4227505922317505,
|
1316 |
+
"eval_logps/generated": -358.9116516113281,
|
1317 |
+
"eval_logps/real": -105.00930786132812,
|
1318 |
+
"eval_loss": 0.10732075572013855,
|
1319 |
+
"eval_rewards/accuracies": 1.0,
|
1320 |
+
"eval_rewards/generated": -7.624257564544678,
|
1321 |
+
"eval_rewards/margins": 17.80915641784668,
|
1322 |
+
"eval_rewards/real": 10.184901237487793,
|
1323 |
+
"eval_runtime": 36.3751,
|
1324 |
+
"eval_samples_per_second": 5.498,
|
1325 |
+
"eval_steps_per_second": 0.357,
|
1326 |
+
"step": 744
|
1327 |
+
},
|
1328 |
+
{
|
1329 |
+
"epoch": 2.4,
|
1330 |
+
"grad_norm": 0.37872196207505543,
|
1331 |
+
"learning_rate": 1.1045130641330165e-07,
|
1332 |
+
"logits/generated": -0.9046470522880554,
|
1333 |
+
"logits/real": -1.3609508275985718,
|
1334 |
+
"logps/generated": -347.01611328125,
|
1335 |
+
"logps/real": -113.12504577636719,
|
1336 |
+
"loss": 0.1048,
|
1337 |
+
"rewards/accuracies": 1.0,
|
1338 |
+
"rewards/generated": -6.732972621917725,
|
1339 |
+
"rewards/margins": 17.482839584350586,
|
1340 |
+
"rewards/real": 10.74986457824707,
|
1341 |
+
"step": 750
|
1342 |
+
},
|
1343 |
+
{
|
1344 |
+
"epoch": 2.432,
|
1345 |
+
"grad_norm": 0.3456217830065947,
|
1346 |
+
"learning_rate": 1.0451306413301662e-07,
|
1347 |
+
"logits/generated": -0.9419130086898804,
|
1348 |
+
"logits/real": -1.448075294494629,
|
1349 |
+
"logps/generated": -350.6387023925781,
|
1350 |
+
"logps/real": -104.91294860839844,
|
1351 |
+
"loss": 0.1024,
|
1352 |
+
"rewards/accuracies": 1.0,
|
1353 |
+
"rewards/generated": -6.793516635894775,
|
1354 |
+
"rewards/margins": 17.103900909423828,
|
1355 |
+
"rewards/real": 10.310384750366211,
|
1356 |
+
"step": 760
|
1357 |
+
},
|
1358 |
+
{
|
1359 |
+
"epoch": 2.464,
|
1360 |
+
"grad_norm": 0.3510621706063929,
|
1361 |
+
"learning_rate": 9.857482185273158e-08,
|
1362 |
+
"logits/generated": -0.8172124028205872,
|
1363 |
+
"logits/real": -1.428694486618042,
|
1364 |
+
"logps/generated": -363.5953674316406,
|
1365 |
+
"logps/real": -88.23005676269531,
|
1366 |
+
"loss": 0.1012,
|
1367 |
+
"rewards/accuracies": 1.0,
|
1368 |
+
"rewards/generated": -7.76650857925415,
|
1369 |
+
"rewards/margins": 17.137920379638672,
|
1370 |
+
"rewards/real": 9.371413230895996,
|
1371 |
+
"step": 770
|
1372 |
+
},
|
1373 |
+
{
|
1374 |
+
"epoch": 2.496,
|
1375 |
+
"grad_norm": 0.29361560856209884,
|
1376 |
+
"learning_rate": 9.263657957244655e-08,
|
1377 |
+
"logits/generated": -0.8288412094116211,
|
1378 |
+
"logits/real": -1.4823163747787476,
|
1379 |
+
"logps/generated": -359.7073974609375,
|
1380 |
+
"logps/real": -97.23246002197266,
|
1381 |
+
"loss": 0.1021,
|
1382 |
+
"rewards/accuracies": 1.0,
|
1383 |
+
"rewards/generated": -7.1570844650268555,
|
1384 |
+
"rewards/margins": 17.029443740844727,
|
1385 |
+
"rewards/real": 9.872357368469238,
|
1386 |
+
"step": 780
|
1387 |
+
},
|
1388 |
+
{
|
1389 |
+
"epoch": 2.528,
|
1390 |
+
"grad_norm": 0.3698992846301525,
|
1391 |
+
"learning_rate": 8.669833729216151e-08,
|
1392 |
+
"logits/generated": -0.834811806678772,
|
1393 |
+
"logits/real": -1.4748550653457642,
|
1394 |
+
"logps/generated": -355.08685302734375,
|
1395 |
+
"logps/real": -91.9556884765625,
|
1396 |
+
"loss": 0.1018,
|
1397 |
+
"rewards/accuracies": 1.0,
|
1398 |
+
"rewards/generated": -7.218266487121582,
|
1399 |
+
"rewards/margins": 17.2064208984375,
|
1400 |
+
"rewards/real": 9.988153457641602,
|
1401 |
+
"step": 790
|
1402 |
+
},
|
1403 |
+
{
|
1404 |
+
"epoch": 2.56,
|
1405 |
+
"grad_norm": 0.3614102743036081,
|
1406 |
+
"learning_rate": 8.076009501187649e-08,
|
1407 |
+
"logits/generated": -0.8415037989616394,
|
1408 |
+
"logits/real": -1.4521253108978271,
|
1409 |
+
"logps/generated": -342.2822265625,
|
1410 |
+
"logps/real": -102.14026641845703,
|
1411 |
+
"loss": 0.1031,
|
1412 |
+
"rewards/accuracies": 1.0,
|
1413 |
+
"rewards/generated": -7.008787631988525,
|
1414 |
+
"rewards/margins": 16.703975677490234,
|
1415 |
+
"rewards/real": 9.695188522338867,
|
1416 |
+
"step": 800
|
1417 |
+
},
|
1418 |
+
{
|
1419 |
+
"epoch": 2.5792,
|
1420 |
+
"eval_logits/generated": -0.878677248954773,
|
1421 |
+
"eval_logits/real": -1.4391472339630127,
|
1422 |
+
"eval_logps/generated": -359.2500305175781,
|
1423 |
+
"eval_logps/real": -104.75186920166016,
|
1424 |
+
"eval_loss": 0.1071779727935791,
|
1425 |
+
"eval_rewards/accuracies": 1.0,
|
1426 |
+
"eval_rewards/generated": -7.65809440612793,
|
1427 |
+
"eval_rewards/margins": 17.868741989135742,
|
1428 |
+
"eval_rewards/real": 10.210646629333496,
|
1429 |
+
"eval_runtime": 29.5912,
|
1430 |
+
"eval_samples_per_second": 6.759,
|
1431 |
+
"eval_steps_per_second": 0.439,
|
1432 |
+
"step": 806
|
1433 |
}
|
1434 |
],
|
1435 |
"logging_steps": 10,
|