Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip committed on
Commit
5ae005f
1 Parent(s): 68cc6d4

Training in progress, step 240000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc34397f53638aed3e1f7a8fec48fd945fe9d9a65862e2d30b0c18c847384362
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21c21b20fb8c80d8819d148082ca4735a2ddcf51c6d5bd15312d293ac83a63c8
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a6f4b993c3e5de4e91e3f11164ead7579089c5cd884e3548feacf51898e103a
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:398ac2faeaf62d164de8b0d15d7dce648669506924aad7a65bb21212c9dd95dd
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44d51ee7e5bc13fe73a3bcf57ad347fa22b3599a7d682e2e8a541926fd4330c8
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:675c1da6a29e5de200fb272be2a868637018c999addc56c161958a25c0a5349b
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d56ac9935105b68f299f8fa21719a2673f088d35488fddd5fa62d8866469f5f5
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3612d2c4e947f05578cbcbc2e6074dbe6180f6b3ff976664366be3670d8b1d56
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2738bd73d910d7af8da2f55f99c628d098f5213ea57df8ec541f1d8d067bf6de
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d433144714402feaf6a20e1bebd60563ad86ca2c8b3c2397a63d836b6b3aee95
3
+ size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2c56ac3ff977fd6146b9151ff886620564565fb7b6256b4c917e31e654c4ed6
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24627e975d8a309c60a5796ee3829db81bd4fe576d49e1ab91aa7f4b4645e7d4
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77be04c57a43b741a7c74fdd71f54e13c7f455ba94a43817c822b41fc4e2570c
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a59cfcefded7a2b207187159c019180f873df3dbebd125628eee7537065bae35
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.5121474491120375,
5
- "global_step": 230000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1708,11 +1708,85 @@
1708
  "eval_samples_per_second": 978.715,
1709
  "eval_steps_per_second": 15.659,
1710
  "step": 230000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1711
  }
1712
  ],
1713
  "max_steps": 1000000,
1714
  "num_train_epochs": 16,
1715
- "total_flos": 1.612304032493538e+22,
1716
  "trial_name": null,
1717
  "trial_params": null
1718
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.6648495121169087,
5
+ "global_step": 240000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1708
  "eval_samples_per_second": 978.715,
1709
  "eval_steps_per_second": 15.659,
1710
  "step": 230000
1711
+ },
1712
+ {
1713
+ "epoch": 3.53,
1714
+ "learning_rate": 0.00013783050393360768,
1715
+ "loss": 0.3048,
1716
+ "step": 231000
1717
+ },
1718
+ {
1719
+ "epoch": 3.54,
1720
+ "learning_rate": 0.0001376997572617282,
1721
+ "loss": 0.305,
1722
+ "step": 232000
1723
+ },
1724
+ {
1725
+ "epoch": 3.56,
1726
+ "learning_rate": 0.00013756837959454766,
1727
+ "loss": 0.3042,
1728
+ "step": 233000
1729
+ },
1730
+ {
1731
+ "epoch": 3.57,
1732
+ "learning_rate": 0.0001374363723687911,
1733
+ "loss": 0.3042,
1734
+ "step": 234000
1735
+ },
1736
+ {
1737
+ "epoch": 3.59,
1738
+ "learning_rate": 0.00013730373702806846,
1739
+ "loss": 0.304,
1740
+ "step": 235000
1741
+ },
1742
+ {
1743
+ "epoch": 3.59,
1744
+ "eval_runtime": 1.0392,
1745
+ "eval_samples_per_second": 962.319,
1746
+ "eval_steps_per_second": 15.397,
1747
+ "step": 235000
1748
+ },
1749
+ {
1750
+ "epoch": 3.6,
1751
+ "learning_rate": 0.00013717047502285855,
1752
+ "loss": 0.3036,
1753
+ "step": 236000
1754
+ },
1755
+ {
1756
+ "epoch": 3.62,
1757
+ "learning_rate": 0.0001370365878104933,
1758
+ "loss": 0.3036,
1759
+ "step": 237000
1760
+ },
1761
+ {
1762
+ "epoch": 3.63,
1763
+ "learning_rate": 0.00013690207685514185,
1764
+ "loss": 0.3031,
1765
+ "step": 238000
1766
+ },
1767
+ {
1768
+ "epoch": 3.65,
1769
+ "learning_rate": 0.0001367669436277944,
1770
+ "loss": 0.3032,
1771
+ "step": 239000
1772
+ },
1773
+ {
1774
+ "epoch": 3.66,
1775
+ "learning_rate": 0.0001366311896062463,
1776
+ "loss": 0.3036,
1777
+ "step": 240000
1778
+ },
1779
+ {
1780
+ "epoch": 3.66,
1781
+ "eval_runtime": 1.0097,
1782
+ "eval_samples_per_second": 990.396,
1783
+ "eval_steps_per_second": 15.846,
1784
+ "step": 240000
1785
  }
1786
  ],
1787
  "max_steps": 1000000,
1788
  "num_train_epochs": 16,
1789
+ "total_flos": 1.6824042935238852e+22,
1790
  "trial_name": null,
1791
  "trial_params": null
1792
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a6f4b993c3e5de4e91e3f11164ead7579089c5cd884e3548feacf51898e103a
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:398ac2faeaf62d164de8b0d15d7dce648669506924aad7a65bb21212c9dd95dd
3
  size 449471589