marinone94 commited on
Commit
05cee88
β€’
1 Parent(s): d379668

Model save

Browse files
{checkpoint-4200 β†’ checkpoint-4400}/config.json RENAMED
File without changes
{checkpoint-4200 β†’ checkpoint-4400}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ddef0f5049947aa8210403bee49ef1fd880b41459272b4c05c3eb32308f2f44
3
  size 2490337809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ed693bd3b91cdbbe1430c3f7f43d32b0b9b099aa5180fb31ece0f93c73b26ee
3
  size 2490337809
{checkpoint-4200 β†’ checkpoint-4400}/preprocessor_config.json RENAMED
File without changes
{checkpoint-4300 β†’ checkpoint-4400}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca11c993941e9cd903a98a8d6a851a925b5bc173fcb10c435092a4ff2bbe4c56
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c90a3d0a519652bea358ec5bc82e2a0b669425ce58bf0947c048a13d83b74d
3
  size 1262063089
{checkpoint-4200 β†’ checkpoint-4400}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e03d76f10a67412455e92aefe077a6da7230abf78e55d42dec22dfbaea90dbd
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bb367ac83047020ca661382c5402cfaed86ec3e8ea3ce8b448d44d9e43e2965
3
  size 14567
{checkpoint-4300 β†’ checkpoint-4400}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6924042b31741a307a9c2d3e5d4148105227679127f306862679a760336ca11c
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb287cb35474e15fb80cdda16160c24d664008c453ecb31933c1042ff81dd3e9
3
  size 559
{checkpoint-4200 β†’ checkpoint-4400}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fb4edd93c6eef5711ff572cfd2e93da18eb0ae8a7738f853f88ca1ecfb5e8b9
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:379bb05b55352db422771e61095d894e4be45df2c25710a995432fffb6cdd028
3
  size 623
{checkpoint-4300 β†’ checkpoint-4400}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 47.25136612021858,
5
- "global_step": 4300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1683,11 +1683,50 @@
1683
  "eval_steps_per_second": 0.802,
1684
  "eval_wer": 0.12693726937269373,
1685
  "step": 4300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1686
  }
1687
  ],
1688
  "max_steps": 4550,
1689
  "num_train_epochs": 50,
1690
- "total_flos": 6.648181588185401e+19,
1691
  "trial_name": null,
1692
  "trial_params": null
1693
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 48.349726775956285,
5
+ "global_step": 4400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1683
  "eval_steps_per_second": 0.802,
1684
  "eval_wer": 0.12693726937269373,
1685
  "step": 4300
1686
+ },
1687
+ {
1688
+ "epoch": 47.47,
1689
+ "learning_rate": 2.284313725490196e-05,
1690
+ "loss": 0.7326,
1691
+ "step": 4320
1692
+ },
1693
+ {
1694
+ "epoch": 47.69,
1695
+ "learning_rate": 2.088235294117647e-05,
1696
+ "loss": 0.724,
1697
+ "step": 4340
1698
+ },
1699
+ {
1700
+ "epoch": 47.91,
1701
+ "learning_rate": 1.892156862745098e-05,
1702
+ "loss": 0.7316,
1703
+ "step": 4360
1704
+ },
1705
+ {
1706
+ "epoch": 48.13,
1707
+ "learning_rate": 1.696078431372549e-05,
1708
+ "loss": 0.7566,
1709
+ "step": 4380
1710
+ },
1711
+ {
1712
+ "epoch": 48.35,
1713
+ "learning_rate": 1.5e-05,
1714
+ "loss": 0.7479,
1715
+ "step": 4400
1716
+ },
1717
+ {
1718
+ "epoch": 48.35,
1719
+ "eval_loss": 0.1490115076303482,
1720
+ "eval_runtime": 188.3681,
1721
+ "eval_samples_per_second": 25.71,
1722
+ "eval_steps_per_second": 0.807,
1723
+ "eval_wer": 0.12761850695430033,
1724
+ "step": 4400
1725
  }
1726
  ],
1727
  "max_steps": 4550,
1728
  "num_train_epochs": 50,
1729
+ "total_flos": 6.805564586486029e+19,
1730
  "trial_name": null,
1731
  "trial_params": null
1732
  }
{checkpoint-4200 β†’ checkpoint-4400}/training_args.bin RENAMED
File without changes
{checkpoint-4300 β†’ checkpoint-4500}/config.json RENAMED
File without changes
{checkpoint-4300 β†’ checkpoint-4500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58cce60fe69424e2a89d307caa661955fd8777a8855b339f2af2ad4573bb989c
3
  size 2490337809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ddcef79ae9c9cbc49da385ba75dde3728f6718eeb4a1ea9f6af1e9bb92ea574
3
  size 2490337809
{checkpoint-4300 β†’ checkpoint-4500}/preprocessor_config.json RENAMED
File without changes
{checkpoint-4200 β†’ checkpoint-4500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:588e62e516d26a20bbfce337c36c9f1a83451a67d19e583d1cdceb96aff5859f
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eae58c0bb9c908100e64bb4cfc44af074bab8941dffb754f675e676ebd7972b
3
  size 1262063089
{checkpoint-4300 β†’ checkpoint-4500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:412f958acca27a8108970c9e2ebea1c88954db1eb284dd8fe51687e899621b23
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ae13169f4754f47cf02dcd08d7a9d3852557179a00533dd7f00f4265d8a8fba
3
+ size 14567
{checkpoint-4200 β†’ checkpoint-4500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7018904ee53324745014ee00f0192d0f3344069918f4c8dd54467134a03ae355
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4c027f185a945dda35351dc282299cb9a8d301ee07589b42eb812ad50ff4977
3
  size 559
{checkpoint-4300 β†’ checkpoint-4500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9bfd4ddf4228b39539babfcc9c868a929c00cb0946eb4b8ecfaa5fa12431293
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c583f6b4d18dff47ed1b5d6c7fe67a5bf74f8906e7b32b87ae71e701db2a021c
3
  size 623
{checkpoint-4200 β†’ checkpoint-4500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 46.15300546448088,
5
- "global_step": 4200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1644,11 +1644,128 @@
1644
  "eval_steps_per_second": 0.798,
1645
  "eval_wer": 0.1271927334657962,
1646
  "step": 4200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1647
  }
1648
  ],
1649
  "max_steps": 4550,
1650
  "num_train_epochs": 50,
1651
- "total_flos": 6.496086001622114e+19,
1652
  "trial_name": null,
1653
  "trial_params": null
1654
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 49.44808743169399,
5
+ "global_step": 4500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1644
  "eval_steps_per_second": 0.798,
1645
  "eval_wer": 0.1271927334657962,
1646
  "step": 4200
1647
+ },
1648
+ {
1649
+ "epoch": 46.37,
1650
+ "learning_rate": 3.264705882352941e-05,
1651
+ "loss": 0.7283,
1652
+ "step": 4220
1653
+ },
1654
+ {
1655
+ "epoch": 46.59,
1656
+ "learning_rate": 3.0686274509803923e-05,
1657
+ "loss": 0.7218,
1658
+ "step": 4240
1659
+ },
1660
+ {
1661
+ "epoch": 46.81,
1662
+ "learning_rate": 2.872549019607843e-05,
1663
+ "loss": 0.7341,
1664
+ "step": 4260
1665
+ },
1666
+ {
1667
+ "epoch": 47.03,
1668
+ "learning_rate": 2.6764705882352942e-05,
1669
+ "loss": 0.7293,
1670
+ "step": 4280
1671
+ },
1672
+ {
1673
+ "epoch": 47.25,
1674
+ "learning_rate": 2.480392156862745e-05,
1675
+ "loss": 0.7194,
1676
+ "step": 4300
1677
+ },
1678
+ {
1679
+ "epoch": 47.25,
1680
+ "eval_loss": 0.14928147196769714,
1681
+ "eval_runtime": 189.625,
1682
+ "eval_samples_per_second": 25.54,
1683
+ "eval_steps_per_second": 0.802,
1684
+ "eval_wer": 0.12693726937269373,
1685
+ "step": 4300
1686
+ },
1687
+ {
1688
+ "epoch": 47.47,
1689
+ "learning_rate": 2.284313725490196e-05,
1690
+ "loss": 0.7326,
1691
+ "step": 4320
1692
+ },
1693
+ {
1694
+ "epoch": 47.69,
1695
+ "learning_rate": 2.088235294117647e-05,
1696
+ "loss": 0.724,
1697
+ "step": 4340
1698
+ },
1699
+ {
1700
+ "epoch": 47.91,
1701
+ "learning_rate": 1.892156862745098e-05,
1702
+ "loss": 0.7316,
1703
+ "step": 4360
1704
+ },
1705
+ {
1706
+ "epoch": 48.13,
1707
+ "learning_rate": 1.696078431372549e-05,
1708
+ "loss": 0.7566,
1709
+ "step": 4380
1710
+ },
1711
+ {
1712
+ "epoch": 48.35,
1713
+ "learning_rate": 1.5e-05,
1714
+ "loss": 0.7479,
1715
+ "step": 4400
1716
+ },
1717
+ {
1718
+ "epoch": 48.35,
1719
+ "eval_loss": 0.1490115076303482,
1720
+ "eval_runtime": 188.3681,
1721
+ "eval_samples_per_second": 25.71,
1722
+ "eval_steps_per_second": 0.807,
1723
+ "eval_wer": 0.12761850695430033,
1724
+ "step": 4400
1725
+ },
1726
+ {
1727
+ "epoch": 48.57,
1728
+ "learning_rate": 1.303921568627451e-05,
1729
+ "loss": 0.7139,
1730
+ "step": 4420
1731
+ },
1732
+ {
1733
+ "epoch": 48.79,
1734
+ "learning_rate": 1.107843137254902e-05,
1735
+ "loss": 0.7345,
1736
+ "step": 4440
1737
+ },
1738
+ {
1739
+ "epoch": 49.01,
1740
+ "learning_rate": 9.117647058823529e-06,
1741
+ "loss": 0.756,
1742
+ "step": 4460
1743
+ },
1744
+ {
1745
+ "epoch": 49.23,
1746
+ "learning_rate": 7.15686274509804e-06,
1747
+ "loss": 0.7196,
1748
+ "step": 4480
1749
+ },
1750
+ {
1751
+ "epoch": 49.45,
1752
+ "learning_rate": 5.196078431372549e-06,
1753
+ "loss": 0.7132,
1754
+ "step": 4500
1755
+ },
1756
+ {
1757
+ "epoch": 49.45,
1758
+ "eval_loss": 0.1501067876815796,
1759
+ "eval_runtime": 190.1989,
1760
+ "eval_samples_per_second": 25.463,
1761
+ "eval_steps_per_second": 0.799,
1762
+ "eval_wer": 0.1265398807834232,
1763
+ "step": 4500
1764
  }
1765
  ],
1766
  "max_steps": 4550,
1767
  "num_train_epochs": 50,
1768
+ "total_flos": 6.9574010203448205e+19,
1769
  "trial_name": null,
1770
  "trial_params": null
1771
  }
{checkpoint-4300 β†’ checkpoint-4500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a459f72ab853af3d30be6993d7c2796ebd50d28c9cae60928258ccc702d6e46
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c284a4869295d3f95db2001f0fef26d374358f6f33b31cf64b9994c12e4cfd91
3
  size 1262063089