Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
d57244a
1 Parent(s): dfe1583

Training in progress, step 280000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c02aa896c2ee6ca7e7195a5ec6659df9dfbcf711b2a086585d06699889d2a77
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a09f2253c2da714db2381b4b6c94afe74f0c5bcca5dfab2a4d09f3bc77a1a830
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a8d446dc34b2bbf6e36c989da495609d6f957caff490ddd65c84402cd84a1a7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f568156f561dbbcf7503a348dffb485dffe24e58ccf5c28c9e6be3fa82361daf
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:726a297059cefb8d3acf77f8c6eb72aad5247d33b79ba9f00d002be1f6ad5127
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59a9fce20181e682cc72fca21c2c1d9ae33919a24109d9c3b0015bbe48914330
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9deb037f8188638d71fed3178b79cf150c9aa2692b1c0ab4a2586496ec3fa41c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f3a816674b62f2ebc9df81821d70aa6368f98c31e4a2d5592af6a40fe48198f
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92c69465d2a6dab3d96db9a2b18d912729d3e1e1b1af7c09352e2b892ef04628
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:913db27023ff5c862ac68d8593e062aa9da19c0798da56d43a2896de4cc6dca5
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eec7d7dce919d39a021b1844dce51ccb12ffead3d1363108b5bdbc846b3db389
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a839f0e74d399ee3f4539eaee8bff7b1db922601d5d69fcbfe490fd00b94d2
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7030c55d7b4ceacafe5134891d17b9fbbdf3b9a0eab868717813c67134ec0794
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9756e1f2ce28cffe3ad2413091d8de7b6aa9409f983eeb48589ea2a1911fb547
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.122955701131522,
5
- "global_step": 270000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2004,11 +2004,85 @@
2004
  "eval_samples_per_second": 902.192,
2005
  "eval_steps_per_second": 14.435,
2006
  "step": 270000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2007
  }
2008
  ],
2009
  "max_steps": 1000000,
2010
  "num_train_epochs": 16,
2011
- "total_flos": 1.892704419546778e+22,
2012
  "trial_name": null,
2013
  "trial_params": null
2014
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.275657764136393,
5
+ "global_step": 280000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2004
  "eval_samples_per_second": 902.192,
2005
  "eval_steps_per_second": 14.435,
2006
  "step": 270000
2007
+ },
2008
+ {
2009
+ "epoch": 4.14,
2010
+ "learning_rate": 0.00013212327409215343,
2011
+ "loss": 0.296,
2012
+ "step": 271000
2013
+ },
2014
+ {
2015
+ "epoch": 4.15,
2016
+ "learning_rate": 0.0001319684747836415,
2017
+ "loss": 0.2958,
2018
+ "step": 272000
2019
+ },
2020
+ {
2021
+ "epoch": 4.17,
2022
+ "learning_rate": 0.0001318131071562154,
2023
+ "loss": 0.2961,
2024
+ "step": 273000
2025
+ },
2026
+ {
2027
+ "epoch": 4.18,
2028
+ "learning_rate": 0.00013165717290895067,
2029
+ "loss": 0.2957,
2030
+ "step": 274000
2031
+ },
2032
+ {
2033
+ "epoch": 4.2,
2034
+ "learning_rate": 0.0001315006737471192,
2035
+ "loss": 0.2955,
2036
+ "step": 275000
2037
+ },
2038
+ {
2039
+ "epoch": 4.2,
2040
+ "eval_runtime": 1.0552,
2041
+ "eval_samples_per_second": 947.654,
2042
+ "eval_steps_per_second": 15.162,
2043
+ "step": 275000
2044
+ },
2045
+ {
2046
+ "epoch": 4.21,
2047
+ "learning_rate": 0.0001313436113821708,
2048
+ "loss": 0.2952,
2049
+ "step": 276000
2050
+ },
2051
+ {
2052
+ "epoch": 4.23,
2053
+ "learning_rate": 0.00013118598753171425,
2054
+ "loss": 0.2951,
2055
+ "step": 277000
2056
+ },
2057
+ {
2058
+ "epoch": 4.25,
2059
+ "learning_rate": 0.0001310278039194988,
2060
+ "loss": 0.2951,
2061
+ "step": 278000
2062
+ },
2063
+ {
2064
+ "epoch": 4.26,
2065
+ "learning_rate": 0.00013086906227539506,
2066
+ "loss": 0.2952,
2067
+ "step": 279000
2068
+ },
2069
+ {
2070
+ "epoch": 4.28,
2071
+ "learning_rate": 0.00013070976433537623,
2072
+ "loss": 0.2946,
2073
+ "step": 280000
2074
+ },
2075
+ {
2076
+ "epoch": 4.28,
2077
+ "eval_runtime": 1.0293,
2078
+ "eval_samples_per_second": 971.532,
2079
+ "eval_steps_per_second": 15.545,
2080
+ "step": 280000
2081
  }
2082
  ],
2083
  "max_steps": 1000000,
2084
  "num_train_epochs": 16,
2085
+ "total_flos": 1.962804680577125e+22,
2086
  "trial_name": null,
2087
  "trial_params": null
2088
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a8d446dc34b2bbf6e36c989da495609d6f957caff490ddd65c84402cd84a1a7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f568156f561dbbcf7503a348dffb485dffe24e58ccf5c28c9e6be3fa82361daf
3
  size 449471589