Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
e596262
1 Parent(s): a12398e

Training in progress, step 370000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44471d6e6546be5ac1a0d86dea95ba4d44ec44baa5148bbd72a7ea895ad69cfc
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e6e5d6289bafd465e0f93748ab1bb630e682cf3fe16da7f34107958c699159
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d3b9e249ae21e66394d1e5adda08ca3c78e35cfc386e28fe333440be7a14450
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0f65f9d24c194387d73c6d6206aa2a527cc855b09f2bbd98f42e2d70ffdd0e6
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cd407f01a45e91c6a9d73f9ffcc5948c50f62ac1349333301934ceecd28bde2
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a14c2ca87be8d848b5b7a5987a7e41580ee4714e56c6a11b74724ade62186fac
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10ca9bf76c7cf63afb390947106325fd549859bdbd17156e672be09fdd4b8f4d
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14c65884de0d108ce0c8462f58d63c86fe3c03bc71ad62ad4517385a4a06be4d
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:458dbb378f2ef2f1049b9621261d1e352171f603268c570c20cc0831e3c801af
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d71883cda87e2e2a13d7e90ee7788adac16f770d7d78f7236989f184f7851175
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed71a40157ab7c8a370261156f0220243926bfa7450a89c6374ca93f070e4120
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebafa49c46a1fb807fcc2cd7ad8adabd30b87b658f944a88ac912fe32d5b60d0
3
+ size 14567
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a42c32ab3c49e09d799093ca137ee6e22777a2749e499367cd831d70ce83fb58
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:540b632982ca1e514de58c2d575a52863f5386c323edbc210ecc94c61bdc1b4b
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.497274268175363,
5
- "global_step": 360000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2670,11 +2670,85 @@
2670
  "eval_samples_per_second": 908.433,
2671
  "eval_steps_per_second": 14.535,
2672
  "step": 360000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2673
  }
2674
  ],
2675
  "max_steps": 1000000,
2676
  "num_train_epochs": 16,
2677
- "total_flos": 2.5236061117517534e+22,
2678
  "trial_name": null,
2679
  "trial_params": null
2680
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.649976331180234,
5
+ "global_step": 370000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2670
  "eval_samples_per_second": 908.433,
2671
  "eval_steps_per_second": 14.535,
2672
  "step": 360000
2673
+ },
2674
+ {
2675
+ "epoch": 5.51,
2676
+ "learning_rate": 0.0001161297995343628,
2677
+ "loss": 0.2815,
2678
+ "step": 361000
2679
+ },
2680
+ {
2681
+ "epoch": 5.53,
2682
+ "learning_rate": 0.00011593133379434138,
2683
+ "loss": 0.2815,
2684
+ "step": 362000
2685
+ },
2686
+ {
2687
+ "epoch": 5.54,
2688
+ "learning_rate": 0.00011573247511501028,
2689
+ "loss": 0.2811,
2690
+ "step": 363000
2691
+ },
2692
+ {
2693
+ "epoch": 5.56,
2694
+ "learning_rate": 0.00011553322567105619,
2695
+ "loss": 0.2807,
2696
+ "step": 364000
2697
+ },
2698
+ {
2699
+ "epoch": 5.57,
2700
+ "learning_rate": 0.00011533358764143905,
2701
+ "loss": 0.2808,
2702
+ "step": 365000
2703
+ },
2704
+ {
2705
+ "epoch": 5.57,
2706
+ "eval_runtime": 1.1301,
2707
+ "eval_samples_per_second": 884.842,
2708
+ "eval_steps_per_second": 14.157,
2709
+ "step": 365000
2710
+ },
2711
+ {
2712
+ "epoch": 5.59,
2713
+ "learning_rate": 0.00011513356320936841,
2714
+ "loss": 0.2808,
2715
+ "step": 366000
2716
+ },
2717
+ {
2718
+ "epoch": 5.6,
2719
+ "learning_rate": 0.00011493315456227943,
2720
+ "loss": 0.2817,
2721
+ "step": 367000
2722
+ },
2723
+ {
2724
+ "epoch": 5.62,
2725
+ "learning_rate": 0.00011473236389180894,
2726
+ "loss": 0.2803,
2727
+ "step": 368000
2728
+ },
2729
+ {
2730
+ "epoch": 5.63,
2731
+ "learning_rate": 0.00011453119339377154,
2732
+ "loss": 0.2803,
2733
+ "step": 369000
2734
+ },
2735
+ {
2736
+ "epoch": 5.65,
2737
+ "learning_rate": 0.00011432964526813558,
2738
+ "loss": 0.2817,
2739
+ "step": 370000
2740
+ },
2741
+ {
2742
+ "epoch": 5.65,
2743
+ "eval_runtime": 1.2187,
2744
+ "eval_samples_per_second": 820.56,
2745
+ "eval_steps_per_second": 13.129,
2746
+ "step": 370000
2747
  }
2748
  ],
2749
  "max_steps": 1000000,
2750
  "num_train_epochs": 16,
2751
+ "total_flos": 2.5937063727821006e+22,
2752
  "trial_name": null,
2753
  "trial_params": null
2754
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d3b9e249ae21e66394d1e5adda08ca3c78e35cfc386e28fe333440be7a14450
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0f65f9d24c194387d73c6d6206aa2a527cc855b09f2bbd98f42e2d70ffdd0e6
3
  size 449471589