AmberYifan
commited on
Commit
•
595b99f
1
Parent(s):
da0d5d8
Training in progress, step 930, checkpoint
Browse files- last-checkpoint/global_step930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +123 -2
last-checkpoint/global_step930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fa08966d8dc9427ed0e7f7f3eb8bf1cefb83008b10e5650f1b7c8a015a0de7d
|
3 |
+
size 14483467880
|
last-checkpoint/global_step930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be4f83c84e72c5c3b8824eac0171131d4329604ef8b4d0a45227dd3b341167f6
|
3 |
+
size 14483467880
|
last-checkpoint/global_step930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93613ce7b583d30d3d45a000aa57bf80d18f49aaaf1b0160f73e928c30aa305
|
3 |
+
size 14483467880
|
last-checkpoint/global_step930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcfc3330efb4caf704d765f9f6a54b55802d457dcca98b2249a21f1308300cc3
|
3 |
+
size 14483467880
|
last-checkpoint/global_step930/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8235ea59a76df970fdd89d217227959a0e0a18cafb57843ddba09fc46890ba3d
|
3 |
+
size 150629
|
last-checkpoint/global_step930/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fc24f1425ef33b883cbf0586835f648175e6ddd007079dacbbfdbcaf553ab2f
|
3 |
+
size 150629
|
last-checkpoint/global_step930/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a2755526c30550de59ba9ee2290d7a539afaf4085a71abf57ddae6603971dd
|
3 |
+
size 150629
|
last-checkpoint/global_step930/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:862ace45acbeb0cbd76349c80aff0d460a525b3d142d9e5b729f11f573c28cc3
|
3 |
+
size 150629
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step930
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943162336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94bfb89fd02254d0d7d2cdb822bf9e53d6192c903b5c2ead0592f671b52bcf7a
|
3 |
size 4943162336
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fc9727b3a71f7c7369f878f68474786432cbe6fa1dea710d3ff96fa9d70e4e0
|
3 |
size 4999819336
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540516344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b410ea095f6d34f670a5401486f9ca473f3f3ad7131eac5a39a6e40e73a6d18
|
3 |
size 4540516344
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5b5b0934b8613429f71d38c4aaf1cf68b50eb415214b938124e65c4e50faae1
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19f63bfbf9ef9efae26be62fb115c8fa6adfa6333f3074d8511b5eeab88f0f1e
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba2a5ec9c47d3c544c4e610213c6d14c67721b556bd12896b90b14fd54cf1901
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e5fd0b1afc88ca5e581b87462a6a56c9a82154f0d69fe336f7b445bad77242b
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98ace375a7a3e380a16715316d6e5e36d9cb62649995c07cc349fb85673d36ff
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1536,6 +1536,127 @@
|
|
1536 |
"eval_samples_per_second": 5.356,
|
1537 |
"eval_steps_per_second": 0.348,
|
1538 |
"step": 868
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1539 |
}
|
1540 |
],
|
1541 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.976,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 930,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1536 |
"eval_samples_per_second": 5.356,
|
1537 |
"eval_steps_per_second": 0.348,
|
1538 |
"step": 868
|
1539 |
+
},
|
1540 |
+
{
|
1541 |
+
"epoch": 2.784,
|
1542 |
+
"grad_norm": 39.33798985134705,
|
1543 |
+
"learning_rate": 3.919239904988123e-08,
|
1544 |
+
"logits/generated": -2.3367316722869873,
|
1545 |
+
"logits/real": -2.405890941619873,
|
1546 |
+
"logps/generated": -134.0688018798828,
|
1547 |
+
"logps/real": -103.1637191772461,
|
1548 |
+
"loss": 0.2581,
|
1549 |
+
"rewards/accuracies": 0.949999988079071,
|
1550 |
+
"rewards/generated": -0.24620242416858673,
|
1551 |
+
"rewards/margins": 4.148200035095215,
|
1552 |
+
"rewards/real": 3.9019978046417236,
|
1553 |
+
"step": 870
|
1554 |
+
},
|
1555 |
+
{
|
1556 |
+
"epoch": 2.816,
|
1557 |
+
"grad_norm": 19.24691526629623,
|
1558 |
+
"learning_rate": 3.32541567695962e-08,
|
1559 |
+
"logits/generated": -2.3322081565856934,
|
1560 |
+
"logits/real": -2.3643596172332764,
|
1561 |
+
"logps/generated": -131.92562866210938,
|
1562 |
+
"logps/real": -100.34136199951172,
|
1563 |
+
"loss": 0.2497,
|
1564 |
+
"rewards/accuracies": 0.949999988079071,
|
1565 |
+
"rewards/generated": -0.7228564620018005,
|
1566 |
+
"rewards/margins": 4.272365093231201,
|
1567 |
+
"rewards/real": 3.549508571624756,
|
1568 |
+
"step": 880
|
1569 |
+
},
|
1570 |
+
{
|
1571 |
+
"epoch": 2.848,
|
1572 |
+
"grad_norm": 74.32934828209018,
|
1573 |
+
"learning_rate": 2.7315914489311164e-08,
|
1574 |
+
"logits/generated": -2.411259174346924,
|
1575 |
+
"logits/real": -2.4403157234191895,
|
1576 |
+
"logps/generated": -153.52029418945312,
|
1577 |
+
"logps/real": -101.80616760253906,
|
1578 |
+
"loss": 0.2214,
|
1579 |
+
"rewards/accuracies": 0.9624999761581421,
|
1580 |
+
"rewards/generated": -0.7813536524772644,
|
1581 |
+
"rewards/margins": 4.41187047958374,
|
1582 |
+
"rewards/real": 3.630516767501831,
|
1583 |
+
"step": 890
|
1584 |
+
},
|
1585 |
+
{
|
1586 |
+
"epoch": 2.88,
|
1587 |
+
"grad_norm": 17.231794888700385,
|
1588 |
+
"learning_rate": 2.1377672209026125e-08,
|
1589 |
+
"logits/generated": -2.440458297729492,
|
1590 |
+
"logits/real": -2.4329943656921387,
|
1591 |
+
"logps/generated": -131.6967010498047,
|
1592 |
+
"logps/real": -100.85757446289062,
|
1593 |
+
"loss": 0.1728,
|
1594 |
+
"rewards/accuracies": 0.987500011920929,
|
1595 |
+
"rewards/generated": -1.0743391513824463,
|
1596 |
+
"rewards/margins": 4.5941972732543945,
|
1597 |
+
"rewards/real": 3.5198585987091064,
|
1598 |
+
"step": 900
|
1599 |
+
},
|
1600 |
+
{
|
1601 |
+
"epoch": 2.912,
|
1602 |
+
"grad_norm": 31.31269522304366,
|
1603 |
+
"learning_rate": 1.5439429928741092e-08,
|
1604 |
+
"logits/generated": -2.288120985031128,
|
1605 |
+
"logits/real": -2.4024569988250732,
|
1606 |
+
"logps/generated": -126.20759582519531,
|
1607 |
+
"logps/real": -93.2852554321289,
|
1608 |
+
"loss": 0.2286,
|
1609 |
+
"rewards/accuracies": 0.9750000238418579,
|
1610 |
+
"rewards/generated": -0.7462027072906494,
|
1611 |
+
"rewards/margins": 4.080456256866455,
|
1612 |
+
"rewards/real": 3.3342537879943848,
|
1613 |
+
"step": 910
|
1614 |
+
},
|
1615 |
+
{
|
1616 |
+
"epoch": 2.944,
|
1617 |
+
"grad_norm": 39.94010884942353,
|
1618 |
+
"learning_rate": 9.501187648456057e-09,
|
1619 |
+
"logits/generated": -2.390730381011963,
|
1620 |
+
"logits/real": -2.414212226867676,
|
1621 |
+
"logps/generated": -127.1091537475586,
|
1622 |
+
"logps/real": -113.78387451171875,
|
1623 |
+
"loss": 0.2001,
|
1624 |
+
"rewards/accuracies": 0.949999988079071,
|
1625 |
+
"rewards/generated": -0.6455323696136475,
|
1626 |
+
"rewards/margins": 4.345826148986816,
|
1627 |
+
"rewards/real": 3.700294017791748,
|
1628 |
+
"step": 920
|
1629 |
+
},
|
1630 |
+
{
|
1631 |
+
"epoch": 2.976,
|
1632 |
+
"grad_norm": 24.96632528956892,
|
1633 |
+
"learning_rate": 3.562945368171021e-09,
|
1634 |
+
"logits/generated": -2.4350810050964355,
|
1635 |
+
"logits/real": -2.3702778816223145,
|
1636 |
+
"logps/generated": -130.21060180664062,
|
1637 |
+
"logps/real": -103.36898040771484,
|
1638 |
+
"loss": 0.2881,
|
1639 |
+
"rewards/accuracies": 0.9624999761581421,
|
1640 |
+
"rewards/generated": -0.7739312648773193,
|
1641 |
+
"rewards/margins": 4.571539878845215,
|
1642 |
+
"rewards/real": 3.7976088523864746,
|
1643 |
+
"step": 930
|
1644 |
+
},
|
1645 |
+
{
|
1646 |
+
"epoch": 2.976,
|
1647 |
+
"eval_logits/generated": -2.3562779426574707,
|
1648 |
+
"eval_logits/real": -2.3975794315338135,
|
1649 |
+
"eval_logps/generated": -106.50991821289062,
|
1650 |
+
"eval_logps/real": -116.46751403808594,
|
1651 |
+
"eval_loss": 0.7523060441017151,
|
1652 |
+
"eval_rewards/accuracies": 0.6153846383094788,
|
1653 |
+
"eval_rewards/generated": 1.4805629253387451,
|
1654 |
+
"eval_rewards/margins": 0.7641012668609619,
|
1655 |
+
"eval_rewards/real": 2.244664430618286,
|
1656 |
+
"eval_runtime": 37.8351,
|
1657 |
+
"eval_samples_per_second": 5.286,
|
1658 |
+
"eval_steps_per_second": 0.344,
|
1659 |
+
"step": 930
|
1660 |
}
|
1661 |
],
|
1662 |
"logging_steps": 10,
|