ZeroUniqueness
committed on
Commit
•
7b65909
1
Parent(s):
e6f4e44
Training in progress, step 7300
Browse files
- adapter_model.bin +1 -1
- {checkpoint-6900 → checkpoint-7200/adapter_model}/README.md +0 -0
- {checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_config.json +0 -0
- {checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-6900/adapter_model → checkpoint-7300}/README.md +0 -0
- {checkpoint-6900/adapter_model → checkpoint-7300}/adapter_config.json +0 -0
- {checkpoint-6900/adapter_model → checkpoint-7300}/adapter_model.bin +1 -1
- {checkpoint-6900 → checkpoint-7300}/optimizer.pt +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_0.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_1.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_10.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_11.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_12.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_13.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_2.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_3.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_4.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_5.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_6.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_7.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_8.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/rng_state_9.pth +1 -1
- {checkpoint-6900 → checkpoint-7300}/scheduler.pt +1 -1
- {checkpoint-6900 → checkpoint-7300}/trainer_state.json +107 -3
- {checkpoint-6900 → checkpoint-7300}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
|
3 |
size 500897101
|
{checkpoint-6900 → checkpoint-7200/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4ed435f77b8aaa468d0a026e8247b6e75dcc7152deb57502bce336e2ea4128e
|
3 |
size 500897101
|
{checkpoint-6900/adapter_model → checkpoint-7300}/README.md
RENAMED
File without changes
|
{checkpoint-6900/adapter_model → checkpoint-7300}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6900/adapter_model → checkpoint-7300}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
|
3 |
size 500897101
|
{checkpoint-6900 → checkpoint-7300}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01309cc50248a7ee8aa0943e05f78f45996da25a30bca6c7edfa2ce6d0a4c468
|
3 |
size 1001752701
|
{checkpoint-6900 → checkpoint-7300}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44bf845e28723f2b5d06a252c217649c369f5a412e746c6a11a5766c3cc80b5e
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e22c3abfb08277a3455800cbf62f599d1fe3557f00ea08203d0be94c4d225d4
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16491d9b84450524221e0f17b2f0f5d4a7227f93b877a553c45c150bba768473
|
3 |
size 27789
|
{checkpoint-6900 → checkpoint-7300}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71481d903c6fa6e1f00f003f755a79f5d2ca1cadae1a66a569b9407c13075f2a
|
3 |
size 27789
|
{checkpoint-6900 → checkpoint-7300}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a5d6e0a5a00d6198aee4a1b139049dfce02c1037c1eb6f70bda5f9ddd91443b
|
3 |
size 27789
|
{checkpoint-6900 → checkpoint-7300}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9dc354d1f1d4681afeb867b8be0cde07c70b7eeef5460c9f709ab7d88ebb815
|
3 |
size 27789
|
{checkpoint-6900 → checkpoint-7300}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a8282ce3cee62a6d68bc928ab48b04011fe533a03a47b9a255d11d5cb5ebe4a
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de2be89dd7c5d96346af9b92d8b38d6e391cb480702a46ded7e0734baffd1f7
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f41d54704cd0a89fb3b5e04ff0bc6606a439f0d0fac2786a95f27ce9861763b
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52490042f81e8334c22ac8fdf36cb1d11dff94eccb6eb672211c661ae447a0c6
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb02b274f95c75d386f4b6937d7c47c650dab44e83c2c964735cb0d6db243843
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e919b96ff9ef7ae0a19a5876d608542799d877c721866d11eceba04fb94f731
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa2e5213b2c17cb726c6144a6195b40ed2ee1f47db76e08204f824274dd4141f
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d32a236dfc5a71f5abbfaf52ec05bbecdee8d6d8401fa330bafb1126c6198db
|
3 |
size 27772
|
{checkpoint-6900 → checkpoint-7300}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3236dda3895d025575cdd5d0cacbdf3a24ed0df5efb8e36e20822ffe5102420
|
3 |
size 627
|
{checkpoint-6900 → checkpoint-7300}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1686,11 +1686,115 @@
|
|
1686 |
"learning_rate": 5.734606883846338e-06,
|
1687 |
"loss": 0.7717,
|
1688 |
"step": 6900
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1689 |
}
|
1690 |
],
|
1691 |
"max_steps": 7737,
|
1692 |
"num_train_epochs": 3,
|
1693 |
-
"total_flos":
|
1694 |
"trial_name": null,
|
1695 |
"trial_params": null
|
1696 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.830554478480031,
|
5 |
+
"global_step": 7300,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1686 |
"learning_rate": 5.734606883846338e-06,
|
1687 |
"loss": 0.7717,
|
1688 |
"step": 6900
|
1689 |
+
},
|
1690 |
+
{
|
1691 |
+
"epoch": 2.69,
|
1692 |
+
"learning_rate": 5.40022537278978e-06,
|
1693 |
+
"loss": 0.7701,
|
1694 |
+
"step": 6925
|
1695 |
+
},
|
1696 |
+
{
|
1697 |
+
"epoch": 2.69,
|
1698 |
+
"learning_rate": 5.07561723084089e-06,
|
1699 |
+
"loss": 0.7694,
|
1700 |
+
"step": 6950
|
1701 |
+
},
|
1702 |
+
{
|
1703 |
+
"epoch": 2.7,
|
1704 |
+
"learning_rate": 4.7608159941809e-06,
|
1705 |
+
"loss": 0.7659,
|
1706 |
+
"step": 6975
|
1707 |
+
},
|
1708 |
+
{
|
1709 |
+
"epoch": 2.71,
|
1710 |
+
"learning_rate": 4.455854185812047e-06,
|
1711 |
+
"loss": 0.7639,
|
1712 |
+
"step": 7000
|
1713 |
+
},
|
1714 |
+
{
|
1715 |
+
"epoch": 2.71,
|
1716 |
+
"eval_loss": 0.8055068850517273,
|
1717 |
+
"eval_runtime": 58.7443,
|
1718 |
+
"eval_samples_per_second": 12.427,
|
1719 |
+
"eval_steps_per_second": 0.902,
|
1720 |
+
"step": 7000
|
1721 |
+
},
|
1722 |
+
{
|
1723 |
+
"epoch": 2.72,
|
1724 |
+
"learning_rate": 4.160763312197513e-06,
|
1725 |
+
"loss": 0.7724,
|
1726 |
+
"step": 7025
|
1727 |
+
},
|
1728 |
+
{
|
1729 |
+
"epoch": 2.73,
|
1730 |
+
"learning_rate": 3.875573860006421e-06,
|
1731 |
+
"loss": 0.7696,
|
1732 |
+
"step": 7050
|
1733 |
+
},
|
1734 |
+
{
|
1735 |
+
"epoch": 2.74,
|
1736 |
+
"learning_rate": 3.6003152929641624e-06,
|
1737 |
+
"loss": 0.7625,
|
1738 |
+
"step": 7075
|
1739 |
+
},
|
1740 |
+
{
|
1741 |
+
"epoch": 2.75,
|
1742 |
+
"learning_rate": 3.335016048808437e-06,
|
1743 |
+
"loss": 0.7733,
|
1744 |
+
"step": 7100
|
1745 |
+
},
|
1746 |
+
{
|
1747 |
+
"epoch": 2.76,
|
1748 |
+
"learning_rate": 3.0797035363512193e-06,
|
1749 |
+
"loss": 0.7685,
|
1750 |
+
"step": 7125
|
1751 |
+
},
|
1752 |
+
{
|
1753 |
+
"epoch": 2.77,
|
1754 |
+
"learning_rate": 2.834404132647128e-06,
|
1755 |
+
"loss": 0.769,
|
1756 |
+
"step": 7150
|
1757 |
+
},
|
1758 |
+
{
|
1759 |
+
"epoch": 2.78,
|
1760 |
+
"learning_rate": 2.5991431802683262e-06,
|
1761 |
+
"loss": 0.7647,
|
1762 |
+
"step": 7175
|
1763 |
+
},
|
1764 |
+
{
|
1765 |
+
"epoch": 2.79,
|
1766 |
+
"learning_rate": 2.3739449846862826e-06,
|
1767 |
+
"loss": 0.7634,
|
1768 |
+
"step": 7200
|
1769 |
+
},
|
1770 |
+
{
|
1771 |
+
"epoch": 2.8,
|
1772 |
+
"learning_rate": 2.158832811760736e-06,
|
1773 |
+
"loss": 0.7617,
|
1774 |
+
"step": 7225
|
1775 |
+
},
|
1776 |
+
{
|
1777 |
+
"epoch": 2.81,
|
1778 |
+
"learning_rate": 1.95382888533604e-06,
|
1779 |
+
"loss": 0.768,
|
1780 |
+
"step": 7250
|
1781 |
+
},
|
1782 |
+
{
|
1783 |
+
"epoch": 2.82,
|
1784 |
+
"learning_rate": 1.7589543849450996e-06,
|
1785 |
+
"loss": 0.7712,
|
1786 |
+
"step": 7275
|
1787 |
+
},
|
1788 |
+
{
|
1789 |
+
"epoch": 2.83,
|
1790 |
+
"learning_rate": 1.5742294436213223e-06,
|
1791 |
+
"loss": 0.7703,
|
1792 |
+
"step": 7300
|
1793 |
}
|
1794 |
],
|
1795 |
"max_steps": 7737,
|
1796 |
"num_train_epochs": 3,
|
1797 |
+
"total_flos": 3.143766232455866e+19,
|
1798 |
"trial_name": null,
|
1799 |
"trial_params": null
|
1800 |
}
|
{checkpoint-6900 → checkpoint-7300}/training_args.bin
RENAMED
File without changes
|