ZeroUniqueness committed on
Commit
7b65909
‒
1 Parent(s): e6f4e44

Training in progress, step 7300

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-6900 → checkpoint-7200/adapter_model}/README.md +0 -0
  3. {checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-6900/adapter_model → checkpoint-7300}/README.md +0 -0
  6. {checkpoint-6900/adapter_model → checkpoint-7300}/adapter_config.json +0 -0
  7. {checkpoint-6900/adapter_model → checkpoint-7300}/adapter_model.bin +1 -1
  8. {checkpoint-6900 → checkpoint-7300}/optimizer.pt +1 -1
  9. {checkpoint-6900 → checkpoint-7300}/rng_state_0.pth +1 -1
  10. {checkpoint-6900 → checkpoint-7300}/rng_state_1.pth +1 -1
  11. {checkpoint-6900 → checkpoint-7300}/rng_state_10.pth +1 -1
  12. {checkpoint-6900 → checkpoint-7300}/rng_state_11.pth +1 -1
  13. {checkpoint-6900 → checkpoint-7300}/rng_state_12.pth +1 -1
  14. {checkpoint-6900 → checkpoint-7300}/rng_state_13.pth +1 -1
  15. {checkpoint-6900 → checkpoint-7300}/rng_state_2.pth +1 -1
  16. {checkpoint-6900 → checkpoint-7300}/rng_state_3.pth +1 -1
  17. {checkpoint-6900 → checkpoint-7300}/rng_state_4.pth +1 -1
  18. {checkpoint-6900 → checkpoint-7300}/rng_state_5.pth +1 -1
  19. {checkpoint-6900 → checkpoint-7300}/rng_state_6.pth +1 -1
  20. {checkpoint-6900 → checkpoint-7300}/rng_state_7.pth +1 -1
  21. {checkpoint-6900 → checkpoint-7300}/rng_state_8.pth +1 -1
  22. {checkpoint-6900 → checkpoint-7300}/rng_state_9.pth +1 -1
  23. {checkpoint-6900 → checkpoint-7300}/scheduler.pt +1 -1
  24. {checkpoint-6900 → checkpoint-7300}/trainer_state.json +107 -3
  25. {checkpoint-6900 → checkpoint-7300}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4ed435f77b8aaa468d0a026e8247b6e75dcc7152deb57502bce336e2ea4128e
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
3
  size 500897101
{checkpoint-6900 → checkpoint-7200/adapter_model}/README.md RENAMED
File without changes
{checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-6900 → checkpoint-7200/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dce28954f69ce7f466b50fc774c94fb6da869b76f94baf208c3e276b1365db2
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ed435f77b8aaa468d0a026e8247b6e75dcc7152deb57502bce336e2ea4128e
3
  size 500897101
{checkpoint-6900/adapter_model → checkpoint-7300}/README.md RENAMED
File without changes
{checkpoint-6900/adapter_model → checkpoint-7300}/adapter_config.json RENAMED
File without changes
{checkpoint-6900/adapter_model → checkpoint-7300}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dce28954f69ce7f466b50fc774c94fb6da869b76f94baf208c3e276b1365db2
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
3
  size 500897101
{checkpoint-6900 → checkpoint-7300}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e51694cb0a1cd9603ece0232dabcd7a370a6f8e378f0b01213ceaaf413c4d0c
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01309cc50248a7ee8aa0943e05f78f45996da25a30bca6c7edfa2ce6d0a4c468
3
  size 1001752701
{checkpoint-6900 → checkpoint-7300}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:361a0cbcd4b75d795f0109f290c642aca880cc06772f00227ba1e0217fc939ef
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44bf845e28723f2b5d06a252c217649c369f5a412e746c6a11a5766c3cc80b5e
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f5123ae610aa26457a3fa34fd70ab7e4ab44cb21dc09fd095aad55a2d15294a
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e22c3abfb08277a3455800cbf62f599d1fe3557f00ea08203d0be94c4d225d4
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a213c64ebe2689a3f02bbe5b0ee2c66feb57c0f5f4f8621c0ec2f63c6c590892
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16491d9b84450524221e0f17b2f0f5d4a7227f93b877a553c45c150bba768473
3
  size 27789
{checkpoint-6900 → checkpoint-7300}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:531d6f0912536de9c8ce68b83c17fc005458796d7921c1fe083548fda04d57a7
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71481d903c6fa6e1f00f003f755a79f5d2ca1cadae1a66a569b9407c13075f2a
3
  size 27789
{checkpoint-6900 → checkpoint-7300}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dad9e94de76a75ad267b7650de4df602944013ed9b553b148fa94de6ea86bb52
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a5d6e0a5a00d6198aee4a1b139049dfce02c1037c1eb6f70bda5f9ddd91443b
3
  size 27789
{checkpoint-6900 → checkpoint-7300}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f9e0a77144d5a662958f707fc8b494554054fd279f5a3dc74159dc97e6d1e78
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9dc354d1f1d4681afeb867b8be0cde07c70b7eeef5460c9f709ab7d88ebb815
3
  size 27789
{checkpoint-6900 → checkpoint-7300}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5b931b3c81ed25f1fcd0971b6da08a3869bfd28a0489528ed3c96c3619fa557
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a8282ce3cee62a6d68bc928ab48b04011fe533a03a47b9a255d11d5cb5ebe4a
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e121c889141260915892ddfe435284a35a9f246ef67720bdc33081a846ab328
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0de2be89dd7c5d96346af9b92d8b38d6e391cb480702a46ded7e0734baffd1f7
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f912038cfe5be27104676eb3640c3beb52c1c4c80bafea1732f0443a67ad4b4
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f41d54704cd0a89fb3b5e04ff0bc6606a439f0d0fac2786a95f27ce9861763b
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e7e05a90589de96c2e2748fa928890eb3ae0f6585d2b9768316f612aa8cf908
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52490042f81e8334c22ac8fdf36cb1d11dff94eccb6eb672211c661ae447a0c6
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfaec3c28cf52d29cdacae2acf43363d9aea5a881877b06a0055a14c1b7aed6a
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb02b274f95c75d386f4b6937d7c47c650dab44e83c2c964735cb0d6db243843
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c35c98f247077b0ff5a006aeba6561c7e6bf2e9fd8969c9bc35d64aaf01cf14a
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e919b96ff9ef7ae0a19a5876d608542799d877c721866d11eceba04fb94f731
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86a908ac53361e9d5c34680f8e1789e69824f75a3e0b100140c8133e52f8fbed
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa2e5213b2c17cb726c6144a6195b40ed2ee1f47db76e08204f824274dd4141f
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5597a151c26d0f9f0ba329a3cf67af7f95b7fed3d58ea4461f586948ea11f890
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d32a236dfc5a71f5abbfaf52ec05bbecdee8d6d8401fa330bafb1126c6198db
3
  size 27772
{checkpoint-6900 → checkpoint-7300}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed903a2193f395f38212602a53ab2a5c251266f0ae7d7dc0557e3b565ed8e240
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3236dda3895d025575cdd5d0cacbdf3a24ed0df5efb8e36e20822ffe5102420
3
  size 627
{checkpoint-6900 → checkpoint-7300}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.6754556029468786,
5
- "global_step": 6900,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1686,11 +1686,115 @@
1686
  "learning_rate": 5.734606883846338e-06,
1687
  "loss": 0.7717,
1688
  "step": 6900
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1689
  }
1690
  ],
1691
  "max_steps": 7737,
1692
  "num_train_epochs": 3,
1693
- "total_flos": 2.9715299616168083e+19,
1694
  "trial_name": null,
1695
  "trial_params": null
1696
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.830554478480031,
5
+ "global_step": 7300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1686
  "learning_rate": 5.734606883846338e-06,
1687
  "loss": 0.7717,
1688
  "step": 6900
1689
+ },
1690
+ {
1691
+ "epoch": 2.69,
1692
+ "learning_rate": 5.40022537278978e-06,
1693
+ "loss": 0.7701,
1694
+ "step": 6925
1695
+ },
1696
+ {
1697
+ "epoch": 2.69,
1698
+ "learning_rate": 5.07561723084089e-06,
1699
+ "loss": 0.7694,
1700
+ "step": 6950
1701
+ },
1702
+ {
1703
+ "epoch": 2.7,
1704
+ "learning_rate": 4.7608159941809e-06,
1705
+ "loss": 0.7659,
1706
+ "step": 6975
1707
+ },
1708
+ {
1709
+ "epoch": 2.71,
1710
+ "learning_rate": 4.455854185812047e-06,
1711
+ "loss": 0.7639,
1712
+ "step": 7000
1713
+ },
1714
+ {
1715
+ "epoch": 2.71,
1716
+ "eval_loss": 0.8055068850517273,
1717
+ "eval_runtime": 58.7443,
1718
+ "eval_samples_per_second": 12.427,
1719
+ "eval_steps_per_second": 0.902,
1720
+ "step": 7000
1721
+ },
1722
+ {
1723
+ "epoch": 2.72,
1724
+ "learning_rate": 4.160763312197513e-06,
1725
+ "loss": 0.7724,
1726
+ "step": 7025
1727
+ },
1728
+ {
1729
+ "epoch": 2.73,
1730
+ "learning_rate": 3.875573860006421e-06,
1731
+ "loss": 0.7696,
1732
+ "step": 7050
1733
+ },
1734
+ {
1735
+ "epoch": 2.74,
1736
+ "learning_rate": 3.6003152929641624e-06,
1737
+ "loss": 0.7625,
1738
+ "step": 7075
1739
+ },
1740
+ {
1741
+ "epoch": 2.75,
1742
+ "learning_rate": 3.335016048808437e-06,
1743
+ "loss": 0.7733,
1744
+ "step": 7100
1745
+ },
1746
+ {
1747
+ "epoch": 2.76,
1748
+ "learning_rate": 3.0797035363512193e-06,
1749
+ "loss": 0.7685,
1750
+ "step": 7125
1751
+ },
1752
+ {
1753
+ "epoch": 2.77,
1754
+ "learning_rate": 2.834404132647128e-06,
1755
+ "loss": 0.769,
1756
+ "step": 7150
1757
+ },
1758
+ {
1759
+ "epoch": 2.78,
1760
+ "learning_rate": 2.5991431802683262e-06,
1761
+ "loss": 0.7647,
1762
+ "step": 7175
1763
+ },
1764
+ {
1765
+ "epoch": 2.79,
1766
+ "learning_rate": 2.3739449846862826e-06,
1767
+ "loss": 0.7634,
1768
+ "step": 7200
1769
+ },
1770
+ {
1771
+ "epoch": 2.8,
1772
+ "learning_rate": 2.158832811760736e-06,
1773
+ "loss": 0.7617,
1774
+ "step": 7225
1775
+ },
1776
+ {
1777
+ "epoch": 2.81,
1778
+ "learning_rate": 1.95382888533604e-06,
1779
+ "loss": 0.768,
1780
+ "step": 7250
1781
+ },
1782
+ {
1783
+ "epoch": 2.82,
1784
+ "learning_rate": 1.7589543849450996e-06,
1785
+ "loss": 0.7712,
1786
+ "step": 7275
1787
+ },
1788
+ {
1789
+ "epoch": 2.83,
1790
+ "learning_rate": 1.5742294436213223e-06,
1791
+ "loss": 0.7703,
1792
+ "step": 7300
1793
  }
1794
  ],
1795
  "max_steps": 7737,
1796
  "num_train_epochs": 3,
1797
+ "total_flos": 3.143766232455866e+19,
1798
  "trial_name": null,
1799
  "trial_params": null
1800
  }
{checkpoint-6900 → checkpoint-7300}/training_args.bin RENAMED
File without changes