AmberYifan commited on
Commit
595b99f
1 Parent(s): da0d5d8

Training in progress, step 930, checkpoint

Browse files
last-checkpoint/global_step930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa08966d8dc9427ed0e7f7f3eb8bf1cefb83008b10e5650f1b7c8a015a0de7d
3
+ size 14483467880
last-checkpoint/global_step930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4f83c84e72c5c3b8824eac0171131d4329604ef8b4d0a45227dd3b341167f6
3
+ size 14483467880
last-checkpoint/global_step930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93613ce7b583d30d3d45a000aa57bf80d18f49aaaf1b0160f73e928c30aa305
3
+ size 14483467880
last-checkpoint/global_step930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcfc3330efb4caf704d765f9f6a54b55802d457dcca98b2249a21f1308300cc3
3
+ size 14483467880
last-checkpoint/global_step930/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8235ea59a76df970fdd89d217227959a0e0a18cafb57843ddba09fc46890ba3d
3
+ size 150629
last-checkpoint/global_step930/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fc24f1425ef33b883cbf0586835f648175e6ddd007079dacbbfdbcaf553ab2f
3
+ size 150629
last-checkpoint/global_step930/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60a2755526c30550de59ba9ee2290d7a539afaf4085a71abf57ddae6603971dd
3
+ size 150629
last-checkpoint/global_step930/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:862ace45acbeb0cbd76349c80aff0d460a525b3d142d9e5b729f11f573c28cc3
3
+ size 150629
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step868
 
1
+ global_step930
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49ed8f0847a6d218a8d1eccb47868dcceb5eca54475b6157db67d660a1803d1d
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94bfb89fd02254d0d7d2cdb822bf9e53d6192c903b5c2ead0592f671b52bcf7a
3
  size 4943162336
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:637ae61efed0ceac33b21a213b84b61d20e3cb817770b79a2eda25413cbb5a3c
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc9727b3a71f7c7369f878f68474786432cbe6fa1dea710d3ff96fa9d70e4e0
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d0d7a867e4f5af4d520757d6e400338df292c54d603ec0f25b0254c5ee9e6f5
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b410ea095f6d34f670a5401486f9ca473f3f3ad7131eac5a39a6e40e73a6d18
3
  size 4540516344
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8639c02c997d5ec74743bd87a283daff10faa317419bf379edd99c706559f2ce
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5b5b0934b8613429f71d38c4aaf1cf68b50eb415214b938124e65c4e50faae1
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:211a79d80fe07a9690b74e693f719eafa8303e6798af58a53dd105eb19c8ccc5
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f63bfbf9ef9efae26be62fb115c8fa6adfa6333f3074d8511b5eeab88f0f1e
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:319730d0d11be8a12d1633e218e39729160d397a56a34d9ebd2e63d2c81fd68f
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2a5ec9c47d3c544c4e610213c6d14c67721b556bd12896b90b14fd54cf1901
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e7c1d2c0fa7220ac8b520afb2fc0958467f149187d655695c73de033474c910
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e5fd0b1afc88ca5e581b87462a6a56c9a82154f0d69fe336f7b445bad77242b
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0a127df5e8aedd711ac814e5c853ecd07390a0c8ef0dc12756e27ebaa732ecd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98ace375a7a3e380a16715316d6e5e36d9cb62649995c07cc349fb85673d36ff
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.7776,
5
  "eval_steps": 62,
6
- "global_step": 868,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1536,6 +1536,127 @@
1536
  "eval_samples_per_second": 5.356,
1537
  "eval_steps_per_second": 0.348,
1538
  "step": 868
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1539
  }
1540
  ],
1541
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.976,
5
  "eval_steps": 62,
6
+ "global_step": 930,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1536
  "eval_samples_per_second": 5.356,
1537
  "eval_steps_per_second": 0.348,
1538
  "step": 868
1539
+ },
1540
+ {
1541
+ "epoch": 2.784,
1542
+ "grad_norm": 39.33798985134705,
1543
+ "learning_rate": 3.919239904988123e-08,
1544
+ "logits/generated": -2.3367316722869873,
1545
+ "logits/real": -2.405890941619873,
1546
+ "logps/generated": -134.0688018798828,
1547
+ "logps/real": -103.1637191772461,
1548
+ "loss": 0.2581,
1549
+ "rewards/accuracies": 0.949999988079071,
1550
+ "rewards/generated": -0.24620242416858673,
1551
+ "rewards/margins": 4.148200035095215,
1552
+ "rewards/real": 3.9019978046417236,
1553
+ "step": 870
1554
+ },
1555
+ {
1556
+ "epoch": 2.816,
1557
+ "grad_norm": 19.24691526629623,
1558
+ "learning_rate": 3.32541567695962e-08,
1559
+ "logits/generated": -2.3322081565856934,
1560
+ "logits/real": -2.3643596172332764,
1561
+ "logps/generated": -131.92562866210938,
1562
+ "logps/real": -100.34136199951172,
1563
+ "loss": 0.2497,
1564
+ "rewards/accuracies": 0.949999988079071,
1565
+ "rewards/generated": -0.7228564620018005,
1566
+ "rewards/margins": 4.272365093231201,
1567
+ "rewards/real": 3.549508571624756,
1568
+ "step": 880
1569
+ },
1570
+ {
1571
+ "epoch": 2.848,
1572
+ "grad_norm": 74.32934828209018,
1573
+ "learning_rate": 2.7315914489311164e-08,
1574
+ "logits/generated": -2.411259174346924,
1575
+ "logits/real": -2.4403157234191895,
1576
+ "logps/generated": -153.52029418945312,
1577
+ "logps/real": -101.80616760253906,
1578
+ "loss": 0.2214,
1579
+ "rewards/accuracies": 0.9624999761581421,
1580
+ "rewards/generated": -0.7813536524772644,
1581
+ "rewards/margins": 4.41187047958374,
1582
+ "rewards/real": 3.630516767501831,
1583
+ "step": 890
1584
+ },
1585
+ {
1586
+ "epoch": 2.88,
1587
+ "grad_norm": 17.231794888700385,
1588
+ "learning_rate": 2.1377672209026125e-08,
1589
+ "logits/generated": -2.440458297729492,
1590
+ "logits/real": -2.4329943656921387,
1591
+ "logps/generated": -131.6967010498047,
1592
+ "logps/real": -100.85757446289062,
1593
+ "loss": 0.1728,
1594
+ "rewards/accuracies": 0.987500011920929,
1595
+ "rewards/generated": -1.0743391513824463,
1596
+ "rewards/margins": 4.5941972732543945,
1597
+ "rewards/real": 3.5198585987091064,
1598
+ "step": 900
1599
+ },
1600
+ {
1601
+ "epoch": 2.912,
1602
+ "grad_norm": 31.31269522304366,
1603
+ "learning_rate": 1.5439429928741092e-08,
1604
+ "logits/generated": -2.288120985031128,
1605
+ "logits/real": -2.4024569988250732,
1606
+ "logps/generated": -126.20759582519531,
1607
+ "logps/real": -93.2852554321289,
1608
+ "loss": 0.2286,
1609
+ "rewards/accuracies": 0.9750000238418579,
1610
+ "rewards/generated": -0.7462027072906494,
1611
+ "rewards/margins": 4.080456256866455,
1612
+ "rewards/real": 3.3342537879943848,
1613
+ "step": 910
1614
+ },
1615
+ {
1616
+ "epoch": 2.944,
1617
+ "grad_norm": 39.94010884942353,
1618
+ "learning_rate": 9.501187648456057e-09,
1619
+ "logits/generated": -2.390730381011963,
1620
+ "logits/real": -2.414212226867676,
1621
+ "logps/generated": -127.1091537475586,
1622
+ "logps/real": -113.78387451171875,
1623
+ "loss": 0.2001,
1624
+ "rewards/accuracies": 0.949999988079071,
1625
+ "rewards/generated": -0.6455323696136475,
1626
+ "rewards/margins": 4.345826148986816,
1627
+ "rewards/real": 3.700294017791748,
1628
+ "step": 920
1629
+ },
1630
+ {
1631
+ "epoch": 2.976,
1632
+ "grad_norm": 24.96632528956892,
1633
+ "learning_rate": 3.562945368171021e-09,
1634
+ "logits/generated": -2.4350810050964355,
1635
+ "logits/real": -2.3702778816223145,
1636
+ "logps/generated": -130.21060180664062,
1637
+ "logps/real": -103.36898040771484,
1638
+ "loss": 0.2881,
1639
+ "rewards/accuracies": 0.9624999761581421,
1640
+ "rewards/generated": -0.7739312648773193,
1641
+ "rewards/margins": 4.571539878845215,
1642
+ "rewards/real": 3.7976088523864746,
1643
+ "step": 930
1644
+ },
1645
+ {
1646
+ "epoch": 2.976,
1647
+ "eval_logits/generated": -2.3562779426574707,
1648
+ "eval_logits/real": -2.3975794315338135,
1649
+ "eval_logps/generated": -106.50991821289062,
1650
+ "eval_logps/real": -116.46751403808594,
1651
+ "eval_loss": 0.7523060441017151,
1652
+ "eval_rewards/accuracies": 0.6153846383094788,
1653
+ "eval_rewards/generated": 1.4805629253387451,
1654
+ "eval_rewards/margins": 0.7641012668609619,
1655
+ "eval_rewards/real": 2.244664430618286,
1656
+ "eval_runtime": 37.8351,
1657
+ "eval_samples_per_second": 5.286,
1658
+ "eval_steps_per_second": 0.344,
1659
+ "step": 930
1660
  }
1661
  ],
1662
  "logging_steps": 10,