Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
0e9502c
1 Parent(s): f00bb8c

Training in progress, step 220000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6726cc29ffbd179a11fbc16d86e9b622977d56af7affe8432ce17ac7f0c3324c
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a40ae38fb36d58e51d1115a0ffe2456ed04e074ef34058cb0e87aed44c8749c
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25943354903cd35afbe5a9d2bfdd9b41bedaf40773891780d5be2bd5e21bdecd
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10097219a660b41bb145e7706c7d6f55222a5f2edc7e876d75c0a98689203eb2
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f03fb7438c7a7d082a41521ad34b09e54c24c6f0ce434446a8cee447a9825e2b
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e24fad87df726ddb772c9cb0d65a2287f26959859abcdfd31a878c712083b0ad
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc9d9f513ad52cd61a225040b44572cf8ad6a7b8c109e5c0f358d82b01eeccf1
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92de4a3d2058b3ce7b32a9cce1c0af01d1561a150ed18aab859e87d677cd3e5
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a9d3b6fefa1771a4c0591688a8a75e14c07fabc888c3cb2da62c9a866f74518
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f65d3255696500543d0622932269f1d53ce3922d103b14f2f2c1083844f3a484
3
+ size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81ca6dfbee96ec9e54db682b05df0c1c63341958079572fddfe5a0fdd3446e54
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fa2d72d91bc1245eb1895f8dc7e0d0a135c4c74e82bc0564ae764117f596160
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:300ca51e5088cb48f99d1cdf1919949938caf62a53f95795867484c1a5c8ec3a
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90281c7a304663a504e1f9c6a24dafa78aa1aa7b7e1d73398e43919f9e0a3e35
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.206743323102295,
5
- "global_step": 210000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1560,11 +1560,85 @@
1560
  "eval_samples_per_second": 977.233,
1561
  "eval_steps_per_second": 15.636,
1562
  "step": 210000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1563
  }
1564
  ],
1565
  "max_steps": 1000000,
1566
  "num_train_epochs": 16,
1567
- "total_flos": 1.4721035104328438e+22,
1568
  "trial_name": null,
1569
  "trial_params": null
1570
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.3594453861071663,
5
+ "global_step": 220000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1560
  "eval_samples_per_second": 977.233,
1561
  "eval_steps_per_second": 15.636,
1562
  "step": 210000
1563
+ },
1564
+ {
1565
+ "epoch": 3.22,
1566
+ "learning_rate": 0.0001403107774233577,
1567
+ "loss": 0.3098,
1568
+ "step": 211000
1569
+ },
1570
+ {
1571
+ "epoch": 3.24,
1572
+ "learning_rate": 0.00014019294163068597,
1573
+ "loss": 0.3093,
1574
+ "step": 212000
1575
+ },
1576
+ {
1577
+ "epoch": 3.25,
1578
+ "learning_rate": 0.00014007444757764835,
1579
+ "loss": 0.3093,
1580
+ "step": 213000
1581
+ },
1582
+ {
1583
+ "epoch": 3.27,
1584
+ "learning_rate": 0.0001399552965600768,
1585
+ "loss": 0.3088,
1586
+ "step": 214000
1587
+ },
1588
+ {
1589
+ "epoch": 3.28,
1590
+ "learning_rate": 0.0001398354898809877,
1591
+ "loss": 0.3089,
1592
+ "step": 215000
1593
+ },
1594
+ {
1595
+ "epoch": 3.28,
1596
+ "eval_runtime": 1.0098,
1597
+ "eval_samples_per_second": 990.287,
1598
+ "eval_steps_per_second": 15.845,
1599
+ "step": 215000
1600
+ },
1601
+ {
1602
+ "epoch": 3.3,
1603
+ "learning_rate": 0.0001397150288505678,
1604
+ "loss": 0.3315,
1605
+ "step": 216000
1606
+ },
1607
+ {
1608
+ "epoch": 3.31,
1609
+ "learning_rate": 0.00013959391478615959,
1610
+ "loss": 0.628,
1611
+ "step": 217000
1612
+ },
1613
+ {
1614
+ "epoch": 3.33,
1615
+ "learning_rate": 0.00013947214901224706,
1616
+ "loss": 0.3112,
1617
+ "step": 218000
1618
+ },
1619
+ {
1620
+ "epoch": 3.34,
1621
+ "learning_rate": 0.0001393497328604412,
1622
+ "loss": 0.3094,
1623
+ "step": 219000
1624
+ },
1625
+ {
1626
+ "epoch": 3.36,
1627
+ "learning_rate": 0.00013922666766946545,
1628
+ "loss": 0.3082,
1629
+ "step": 220000
1630
+ },
1631
+ {
1632
+ "epoch": 3.36,
1633
+ "eval_runtime": 1.0751,
1634
+ "eval_samples_per_second": 930.139,
1635
+ "eval_steps_per_second": 14.882,
1636
+ "step": 220000
1637
  }
1638
  ],
1639
  "max_steps": 1000000,
1640
  "num_train_epochs": 16,
1641
+ "total_flos": 1.542203771463191e+22,
1642
  "trial_name": null,
1643
  "trial_params": null
1644
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25943354903cd35afbe5a9d2bfdd9b41bedaf40773891780d5be2bd5e21bdecd
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10097219a660b41bb145e7706c7d6f55222a5f2edc7e876d75c0a98689203eb2
3
  size 449471589