AmberYifan committed on
Commit
003766d
1 Parent(s): 75a0fa8

Training in progress, step 806, checkpoint

Browse files
last-checkpoint/global_step806/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4655b1b3999db772d77f146a4f7f14ee1e3d50fd58911f740c36b4d70c5bf76
3
+ size 13476835648
last-checkpoint/global_step806/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96dcc27ffe6bebd92bf61a45bdc95681d0b5d883b204853945880b81b274398b
3
+ size 13476835648
last-checkpoint/global_step806/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9bb7e5bb9ca422cb0d1dc04d2671971df137a3f09d07042cad506b9a2d71f9
3
+ size 13476835648
last-checkpoint/global_step806/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba7f1a348180a0d364072685057323ea6b36164ec89aaa3b178eded6e40ff885
3
+ size 13476835648
last-checkpoint/global_step806/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8d40541af74b88448ba760a8978e722801bd2f9f599321fbb51f3dc9b7aa48d
3
+ size 150693
last-checkpoint/global_step806/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:157d3836b0324e6cee2dd66a33217d6e37ed5ed7b3b9b43d035418d1760303bb
3
+ size 150693
last-checkpoint/global_step806/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f58aefc7e17b7c63dbeb24bef6fbbd4df65f9011bd0a645acb9ead93913de3e
3
+ size 150693
last-checkpoint/global_step806/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e7011657dbb583fe08aa94c28ca514c23f5adadb33ff22d042174c99859c360
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step682
 
1
+ global_step806
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b540a3bdebafca7694656f77d0e558804e111c4c3b9b258038b1eaccbe984eec
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b19051be7334b0ec1c05289f0ba87187f1d4d8ad4c691e9ccba473137a5c0c
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23f9ad07280adb2d4b75e2e7438927d267ba0ae53691cf890abe923d1bb78778
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b23e112ecb38d9c61e0a318a310cbe0da90c31bcf2bc8cbd996ea1dc8ba03b
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bebbcf1f86afcb2a4c347004a55e474b02a6c86a2ffd1b17318f2c0f863e1cad
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c1e6f6df51c8519ad30f4a5eac897f58101f14df58a659a6a23b1c9d757dd53
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4cf818939bfcb1de93c78e79be7390fcae46bb5c39166bd571b1f3a8b2cdeb3
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ea574d07a576c8cd612773a5015f4f8303ef6ce35f964bd81b8b489ceed9bd
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:408ca302fdad670605f637bd7faeea541858831c4f2318e3fca2d0d709c7b218
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:231c40114b2d8985fa7545edd47494bc1e9d1e0a8db77f30a4d192048f265712
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df380dcd2c8305fefe9f4ba88e7536beb3b5e94d863ac6f29eae326ddfef0f32
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d4d2cd69e482e80eb9dbe4006558389d72a76a801f542398022187d536edd47
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51f78c929d775d81c8dd9feb87fd329a39e895b5f8b1d2cdbede2cbd8b45f49e
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08d86ba141f647d4a747b93c9fe2e7871e4a119de2b70afdde8f5f8f330a1740
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ec08ea6383804e8c05c7ff772c4aed53351dc10413de8f46c3a1998585e65c7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56640485d548dbcc67b1963f981239312b10af622fb02275932812ae1326861
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.1824,
5
  "eval_steps": 62,
6
- "global_step": 682,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1218,6 +1218,218 @@
1218
  "eval_samples_per_second": 7.845,
1219
  "eval_steps_per_second": 0.51,
1220
  "step": 682
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1221
  }
1222
  ],
1223
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.5792,
5
  "eval_steps": 62,
6
+ "global_step": 806,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1218
  "eval_samples_per_second": 7.845,
1219
  "eval_steps_per_second": 0.51,
1220
  "step": 682
1221
+ },
1222
+ {
1223
+ "epoch": 2.208,
1224
+ "grad_norm": 0.3658391972106121,
1225
+ "learning_rate": 1.4608076009501184e-07,
1226
+ "logits/generated": -0.7777714133262634,
1227
+ "logits/real": -1.4327569007873535,
1228
+ "logps/generated": -349.45123291015625,
1229
+ "logps/real": -91.0394287109375,
1230
+ "loss": 0.1006,
1231
+ "rewards/accuracies": 1.0,
1232
+ "rewards/generated": -6.516034126281738,
1233
+ "rewards/margins": 16.061874389648438,
1234
+ "rewards/real": 9.5458402633667,
1235
+ "step": 690
1236
+ },
1237
+ {
1238
+ "epoch": 2.24,
1239
+ "grad_norm": 0.37751724197745956,
1240
+ "learning_rate": 1.4014251781472683e-07,
1241
+ "logits/generated": -0.8562400937080383,
1242
+ "logits/real": -1.4605350494384766,
1243
+ "logps/generated": -349.2660827636719,
1244
+ "logps/real": -110.1448745727539,
1245
+ "loss": 0.0985,
1246
+ "rewards/accuracies": 1.0,
1247
+ "rewards/generated": -6.469089508056641,
1248
+ "rewards/margins": 17.073518753051758,
1249
+ "rewards/real": 10.604430198669434,
1250
+ "step": 700
1251
+ },
1252
+ {
1253
+ "epoch": 2.2720000000000002,
1254
+ "grad_norm": 0.3099039440839268,
1255
+ "learning_rate": 1.342042755344418e-07,
1256
+ "logits/generated": -0.9007622003555298,
1257
+ "logits/real": -1.437908411026001,
1258
+ "logps/generated": -345.6163330078125,
1259
+ "logps/real": -93.06938171386719,
1260
+ "loss": 0.0978,
1261
+ "rewards/accuracies": 1.0,
1262
+ "rewards/generated": -6.0835700035095215,
1263
+ "rewards/margins": 15.84107780456543,
1264
+ "rewards/real": 9.757506370544434,
1265
+ "step": 710
1266
+ },
1267
+ {
1268
+ "epoch": 2.304,
1269
+ "grad_norm": 0.3864668793151262,
1270
+ "learning_rate": 1.2826603325415677e-07,
1271
+ "logits/generated": -0.8885849714279175,
1272
+ "logits/real": -1.5355165004730225,
1273
+ "logps/generated": -342.10443115234375,
1274
+ "logps/real": -104.58480072021484,
1275
+ "loss": 0.1019,
1276
+ "rewards/accuracies": 1.0,
1277
+ "rewards/generated": -6.677704811096191,
1278
+ "rewards/margins": 16.409557342529297,
1279
+ "rewards/real": 9.731854438781738,
1280
+ "step": 720
1281
+ },
1282
+ {
1283
+ "epoch": 2.336,
1284
+ "grad_norm": 0.3445053668290169,
1285
+ "learning_rate": 1.2232779097387173e-07,
1286
+ "logits/generated": -0.8385915756225586,
1287
+ "logits/real": -1.397671103477478,
1288
+ "logps/generated": -354.0185241699219,
1289
+ "logps/real": -112.39442443847656,
1290
+ "loss": 0.1017,
1291
+ "rewards/accuracies": 1.0,
1292
+ "rewards/generated": -7.097531795501709,
1293
+ "rewards/margins": 18.07855987548828,
1294
+ "rewards/real": 10.981030464172363,
1295
+ "step": 730
1296
+ },
1297
+ {
1298
+ "epoch": 2.368,
1299
+ "grad_norm": 0.3341439577424557,
1300
+ "learning_rate": 1.163895486935867e-07,
1301
+ "logits/generated": -0.8578903079032898,
1302
+ "logits/real": -1.383490800857544,
1303
+ "logps/generated": -347.2725524902344,
1304
+ "logps/real": -103.35150146484375,
1305
+ "loss": 0.1017,
1306
+ "rewards/accuracies": 1.0,
1307
+ "rewards/generated": -6.981736183166504,
1308
+ "rewards/margins": 17.021286010742188,
1309
+ "rewards/real": 10.039549827575684,
1310
+ "step": 740
1311
+ },
1312
+ {
1313
+ "epoch": 2.3808,
1314
+ "eval_logits/generated": -0.880645751953125,
1315
+ "eval_logits/real": -1.4227505922317505,
1316
+ "eval_logps/generated": -358.9116516113281,
1317
+ "eval_logps/real": -105.00930786132812,
1318
+ "eval_loss": 0.10732075572013855,
1319
+ "eval_rewards/accuracies": 1.0,
1320
+ "eval_rewards/generated": -7.624257564544678,
1321
+ "eval_rewards/margins": 17.80915641784668,
1322
+ "eval_rewards/real": 10.184901237487793,
1323
+ "eval_runtime": 36.3751,
1324
+ "eval_samples_per_second": 5.498,
1325
+ "eval_steps_per_second": 0.357,
1326
+ "step": 744
1327
+ },
1328
+ {
1329
+ "epoch": 2.4,
1330
+ "grad_norm": 0.37872196207505543,
1331
+ "learning_rate": 1.1045130641330165e-07,
1332
+ "logits/generated": -0.9046470522880554,
1333
+ "logits/real": -1.3609508275985718,
1334
+ "logps/generated": -347.01611328125,
1335
+ "logps/real": -113.12504577636719,
1336
+ "loss": 0.1048,
1337
+ "rewards/accuracies": 1.0,
1338
+ "rewards/generated": -6.732972621917725,
1339
+ "rewards/margins": 17.482839584350586,
1340
+ "rewards/real": 10.74986457824707,
1341
+ "step": 750
1342
+ },
1343
+ {
1344
+ "epoch": 2.432,
1345
+ "grad_norm": 0.3456217830065947,
1346
+ "learning_rate": 1.0451306413301662e-07,
1347
+ "logits/generated": -0.9419130086898804,
1348
+ "logits/real": -1.448075294494629,
1349
+ "logps/generated": -350.6387023925781,
1350
+ "logps/real": -104.91294860839844,
1351
+ "loss": 0.1024,
1352
+ "rewards/accuracies": 1.0,
1353
+ "rewards/generated": -6.793516635894775,
1354
+ "rewards/margins": 17.103900909423828,
1355
+ "rewards/real": 10.310384750366211,
1356
+ "step": 760
1357
+ },
1358
+ {
1359
+ "epoch": 2.464,
1360
+ "grad_norm": 0.3510621706063929,
1361
+ "learning_rate": 9.857482185273158e-08,
1362
+ "logits/generated": -0.8172124028205872,
1363
+ "logits/real": -1.428694486618042,
1364
+ "logps/generated": -363.5953674316406,
1365
+ "logps/real": -88.23005676269531,
1366
+ "loss": 0.1012,
1367
+ "rewards/accuracies": 1.0,
1368
+ "rewards/generated": -7.76650857925415,
1369
+ "rewards/margins": 17.137920379638672,
1370
+ "rewards/real": 9.371413230895996,
1371
+ "step": 770
1372
+ },
1373
+ {
1374
+ "epoch": 2.496,
1375
+ "grad_norm": 0.29361560856209884,
1376
+ "learning_rate": 9.263657957244655e-08,
1377
+ "logits/generated": -0.8288412094116211,
1378
+ "logits/real": -1.4823163747787476,
1379
+ "logps/generated": -359.7073974609375,
1380
+ "logps/real": -97.23246002197266,
1381
+ "loss": 0.1021,
1382
+ "rewards/accuracies": 1.0,
1383
+ "rewards/generated": -7.1570844650268555,
1384
+ "rewards/margins": 17.029443740844727,
1385
+ "rewards/real": 9.872357368469238,
1386
+ "step": 780
1387
+ },
1388
+ {
1389
+ "epoch": 2.528,
1390
+ "grad_norm": 0.3698992846301525,
1391
+ "learning_rate": 8.669833729216151e-08,
1392
+ "logits/generated": -0.834811806678772,
1393
+ "logits/real": -1.4748550653457642,
1394
+ "logps/generated": -355.08685302734375,
1395
+ "logps/real": -91.9556884765625,
1396
+ "loss": 0.1018,
1397
+ "rewards/accuracies": 1.0,
1398
+ "rewards/generated": -7.218266487121582,
1399
+ "rewards/margins": 17.2064208984375,
1400
+ "rewards/real": 9.988153457641602,
1401
+ "step": 790
1402
+ },
1403
+ {
1404
+ "epoch": 2.56,
1405
+ "grad_norm": 0.3614102743036081,
1406
+ "learning_rate": 8.076009501187649e-08,
1407
+ "logits/generated": -0.8415037989616394,
1408
+ "logits/real": -1.4521253108978271,
1409
+ "logps/generated": -342.2822265625,
1410
+ "logps/real": -102.14026641845703,
1411
+ "loss": 0.1031,
1412
+ "rewards/accuracies": 1.0,
1413
+ "rewards/generated": -7.008787631988525,
1414
+ "rewards/margins": 16.703975677490234,
1415
+ "rewards/real": 9.695188522338867,
1416
+ "step": 800
1417
+ },
1418
+ {
1419
+ "epoch": 2.5792,
1420
+ "eval_logits/generated": -0.878677248954773,
1421
+ "eval_logits/real": -1.4391472339630127,
1422
+ "eval_logps/generated": -359.2500305175781,
1423
+ "eval_logps/real": -104.75186920166016,
1424
+ "eval_loss": 0.1071779727935791,
1425
+ "eval_rewards/accuracies": 1.0,
1426
+ "eval_rewards/generated": -7.65809440612793,
1427
+ "eval_rewards/margins": 17.868741989135742,
1428
+ "eval_rewards/real": 10.210646629333496,
1429
+ "eval_runtime": 29.5912,
1430
+ "eval_samples_per_second": 6.759,
1431
+ "eval_steps_per_second": 0.439,
1432
+ "step": 806
1433
  }
1434
  ],
1435
  "logging_steps": 10,