AmberYifan
committed on
Commit
•
cd17d6e
1
Parent(s):
a369e1b
Training in progress, step 930, checkpoint
Browse files
- last-checkpoint/global_step930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step930/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +123 -2
last-checkpoint/global_step930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b123a2cb22969eb9ccdfb292bc88c166ef1e867193095e50dbfbb01c4cca2951
|
3 |
+
size 13476835648
|
last-checkpoint/global_step930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75d6ced840634693a094a3edc203312b6532e27dd589c03696dd60e7bce660a5
|
3 |
+
size 13476835648
|
last-checkpoint/global_step930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74ed7591c60b03da0d1dc6cc3d9bfe28c9349fd72909ee0f7770ebf71cf5f300
|
3 |
+
size 13476835648
|
last-checkpoint/global_step930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec1a3899e3e0db79c3497e9367c84bcaa34ec1e76d90811c546d0eaeae30451b
|
3 |
+
size 13476835648
|
last-checkpoint/global_step930/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a98a917211259358e0aa315ceda5d9c8adfaf7a77dfb884a74aedb59c4bd78f
|
3 |
+
size 150693
|
last-checkpoint/global_step930/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85392d249fe1774166e899bdacd4ddbaeeb18826e8ac208a06a13d57095ef4c1
|
3 |
+
size 150693
|
last-checkpoint/global_step930/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62deb2157fa7caf68b01c013a50a8a320c3d100a989932ea59653e9809b1d906
|
3 |
+
size 150693
|
last-checkpoint/global_step930/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2266da4e0281fec19e433f5d7ad9197820be41db576884e86fe11aafcbc31b1
|
3 |
+
size 150693
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step930
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4938985352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef0f4df2c2dd63dd83e130b116d935a681a8ee1ce46d3cb72eadaf7aca4d3879
|
3 |
size 4938985352
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4947390880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdb87e29425f917524e9cf4fb01bc4e694598be78980bb38df50ed6dd399a71f
|
3 |
size 4947390880
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3590488816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbf925b489dde5633219973a1f7552c30e5d3d96df88e0f751b425f56891190c
|
3 |
size 3590488816
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5b5b0934b8613429f71d38c4aaf1cf68b50eb415214b938124e65c4e50faae1
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19f63bfbf9ef9efae26be62fb115c8fa6adfa6333f3074d8511b5eeab88f0f1e
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba2a5ec9c47d3c544c4e610213c6d14c67721b556bd12896b90b14fd54cf1901
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e5fd0b1afc88ca5e581b87462a6a56c9a82154f0d69fe336f7b445bad77242b
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3037f93266047f9be66a7aa9272e870b0bbd8228f26f8217758f94a734d71a2f
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1536,6 +1536,127 @@
|
|
1536 |
"eval_samples_per_second": 5.923,
|
1537 |
"eval_steps_per_second": 0.385,
|
1538 |
"step": 868
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1539 |
}
|
1540 |
],
|
1541 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.976,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 930,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1536 |
"eval_samples_per_second": 5.923,
|
1537 |
"eval_steps_per_second": 0.385,
|
1538 |
"step": 868
|
1539 |
+
},
|
1540 |
+
{
|
1541 |
+
"epoch": 2.784,
|
1542 |
+
"grad_norm": 23.996876211666585,
|
1543 |
+
"learning_rate": 3.919239904988123e-08,
|
1544 |
+
"logits/generated": -0.9030688405036926,
|
1545 |
+
"logits/real": -0.8869367837905884,
|
1546 |
+
"logps/generated": -263.31884765625,
|
1547 |
+
"logps/real": -231.1215057373047,
|
1548 |
+
"loss": 0.3838,
|
1549 |
+
"rewards/accuracies": 0.987500011920929,
|
1550 |
+
"rewards/generated": 2.1591622829437256,
|
1551 |
+
"rewards/margins": 2.8290388584136963,
|
1552 |
+
"rewards/real": 4.988200664520264,
|
1553 |
+
"step": 870
|
1554 |
+
},
|
1555 |
+
{
|
1556 |
+
"epoch": 2.816,
|
1557 |
+
"grad_norm": 15.933355481968098,
|
1558 |
+
"learning_rate": 3.32541567695962e-08,
|
1559 |
+
"logits/generated": -0.9254922866821289,
|
1560 |
+
"logits/real": -0.9375091791152954,
|
1561 |
+
"logps/generated": -257.25921630859375,
|
1562 |
+
"logps/real": -218.4817352294922,
|
1563 |
+
"loss": 0.3943,
|
1564 |
+
"rewards/accuracies": 0.9624999761581421,
|
1565 |
+
"rewards/generated": 2.433042049407959,
|
1566 |
+
"rewards/margins": 2.4680287837982178,
|
1567 |
+
"rewards/real": 4.901071071624756,
|
1568 |
+
"step": 880
|
1569 |
+
},
|
1570 |
+
{
|
1571 |
+
"epoch": 2.848,
|
1572 |
+
"grad_norm": 15.729400330653592,
|
1573 |
+
"learning_rate": 2.7315914489311164e-08,
|
1574 |
+
"logits/generated": -0.8918999433517456,
|
1575 |
+
"logits/real": -0.9543954730033875,
|
1576 |
+
"logps/generated": -251.86434936523438,
|
1577 |
+
"logps/real": -217.92153930664062,
|
1578 |
+
"loss": 0.3792,
|
1579 |
+
"rewards/accuracies": 0.9375,
|
1580 |
+
"rewards/generated": 2.4217216968536377,
|
1581 |
+
"rewards/margins": 2.721459150314331,
|
1582 |
+
"rewards/real": 5.143180847167969,
|
1583 |
+
"step": 890
|
1584 |
+
},
|
1585 |
+
{
|
1586 |
+
"epoch": 2.88,
|
1587 |
+
"grad_norm": 14.591897761657874,
|
1588 |
+
"learning_rate": 2.1377672209026125e-08,
|
1589 |
+
"logits/generated": -0.9395130276679993,
|
1590 |
+
"logits/real": -0.9594659805297852,
|
1591 |
+
"logps/generated": -265.73876953125,
|
1592 |
+
"logps/real": -222.98593139648438,
|
1593 |
+
"loss": 0.3686,
|
1594 |
+
"rewards/accuracies": 0.987500011920929,
|
1595 |
+
"rewards/generated": 2.46151065826416,
|
1596 |
+
"rewards/margins": 2.638683795928955,
|
1597 |
+
"rewards/real": 5.100194931030273,
|
1598 |
+
"step": 900
|
1599 |
+
},
|
1600 |
+
{
|
1601 |
+
"epoch": 2.912,
|
1602 |
+
"grad_norm": 20.099085379716534,
|
1603 |
+
"learning_rate": 1.5439429928741092e-08,
|
1604 |
+
"logits/generated": -0.950794517993927,
|
1605 |
+
"logits/real": -0.8883028030395508,
|
1606 |
+
"logps/generated": -254.50732421875,
|
1607 |
+
"logps/real": -226.67514038085938,
|
1608 |
+
"loss": 0.3771,
|
1609 |
+
"rewards/accuracies": 0.925000011920929,
|
1610 |
+
"rewards/generated": 2.2818403244018555,
|
1611 |
+
"rewards/margins": 2.8682749271392822,
|
1612 |
+
"rewards/real": 5.150115013122559,
|
1613 |
+
"step": 910
|
1614 |
+
},
|
1615 |
+
{
|
1616 |
+
"epoch": 2.944,
|
1617 |
+
"grad_norm": 27.113250586107085,
|
1618 |
+
"learning_rate": 9.501187648456057e-09,
|
1619 |
+
"logits/generated": -0.9123473167419434,
|
1620 |
+
"logits/real": -0.8874839544296265,
|
1621 |
+
"logps/generated": -254.9096221923828,
|
1622 |
+
"logps/real": -226.13595581054688,
|
1623 |
+
"loss": 0.3878,
|
1624 |
+
"rewards/accuracies": 0.9750000238418579,
|
1625 |
+
"rewards/generated": 2.072730302810669,
|
1626 |
+
"rewards/margins": 2.4795820713043213,
|
1627 |
+
"rewards/real": 4.55231237411499,
|
1628 |
+
"step": 920
|
1629 |
+
},
|
1630 |
+
{
|
1631 |
+
"epoch": 2.976,
|
1632 |
+
"grad_norm": 18.727290911205092,
|
1633 |
+
"learning_rate": 3.562945368171021e-09,
|
1634 |
+
"logits/generated": -0.9185419082641602,
|
1635 |
+
"logits/real": -0.9089628458023071,
|
1636 |
+
"logps/generated": -247.39254760742188,
|
1637 |
+
"logps/real": -213.3396453857422,
|
1638 |
+
"loss": 0.4001,
|
1639 |
+
"rewards/accuracies": 0.925000011920929,
|
1640 |
+
"rewards/generated": 2.629145860671997,
|
1641 |
+
"rewards/margins": 2.3609352111816406,
|
1642 |
+
"rewards/real": 4.990080833435059,
|
1643 |
+
"step": 930
|
1644 |
+
},
|
1645 |
+
{
|
1646 |
+
"epoch": 2.976,
|
1647 |
+
"eval_logits/generated": -0.874191164970398,
|
1648 |
+
"eval_logits/real": -0.8781108260154724,
|
1649 |
+
"eval_logps/generated": -253.27622985839844,
|
1650 |
+
"eval_logps/real": -213.75250244140625,
|
1651 |
+
"eval_loss": 0.552344799041748,
|
1652 |
+
"eval_rewards/accuracies": 0.8461538553237915,
|
1653 |
+
"eval_rewards/generated": 2.939284324645996,
|
1654 |
+
"eval_rewards/margins": 2.054386854171753,
|
1655 |
+
"eval_rewards/real": 4.993671894073486,
|
1656 |
+
"eval_runtime": 34.0216,
|
1657 |
+
"eval_samples_per_second": 5.879,
|
1658 |
+
"eval_steps_per_second": 0.382,
|
1659 |
+
"step": 930
|
1660 |
}
|
1661 |
],
|
1662 |
"logging_steps": 10,
|