Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
cdd8c30
1 Parent(s): e596262

Training in progress, step 380000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8e6e5d6289bafd465e0f93748ab1bb630e682cf3fe16da7f34107958c699159
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c700adab32c9c77d19e150bd97404af77c8ea4f249d7d8819f10ecd29a7599aa
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0f65f9d24c194387d73c6d6206aa2a527cc855b09f2bbd98f42e2d70ffdd0e6
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b70ffcb599d0cbcc5aa0449b31396d7f0aecaf32d47481cf0cbeb78e7394dcdc
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a14c2ca87be8d848b5b7a5987a7e41580ee4714e56c6a11b74724ade62186fac
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:074f082b7918427797301b29e7c6af54e31efb39ae44b35e4533a95f5b0a9f49
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14c65884de0d108ce0c8462f58d63c86fe3c03bc71ad62ad4517385a4a06be4d
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65f237a078b5c1beb61259bf8b7bce0aab72bc1a5221890351cf7a2047a3cdcc
3
+ size 14439
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d71883cda87e2e2a13d7e90ee7788adac16f770d7d78f7236989f184f7851175
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3427e04a13ecc5863d163d8b4c944bb2837f27676722003cb6abda2606ce2015
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebafa49c46a1fb807fcc2cd7ad8adabd30b87b658f944a88ac912fe32d5b60d0
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dab2092ac253f5c93a298eee50fba2933b65f4ea17b7fc517f028648f502ea43
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:540b632982ca1e514de58c2d575a52863f5386c323edbc210ecc94c61bdc1b4b
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f21b3afd8d405fcd9461eae3cafa8a4894a77b6f36c354aa188329ab6dfe547a
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.649976331180234,
5
- "global_step": 370000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2744,11 +2744,85 @@
2744
  "eval_samples_per_second": 820.56,
2745
  "eval_steps_per_second": 13.129,
2746
  "step": 370000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2747
  }
2748
  ],
2749
  "max_steps": 1000000,
2750
  "num_train_epochs": 16,
2751
- "total_flos": 2.5937063727821006e+22,
2752
  "trial_name": null,
2753
  "trial_params": null
2754
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.802678394185105,
5
+ "global_step": 380000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2744
  "eval_samples_per_second": 820.56,
2745
  "eval_steps_per_second": 13.129,
2746
  "step": 370000
2747
+ },
2748
+ {
2749
+ "epoch": 5.67,
2750
+ "learning_rate": 0.00011412772171899904,
2751
+ "loss": 0.2819,
2752
+ "step": 371000
2753
+ },
2754
+ {
2755
+ "epoch": 5.68,
2756
+ "learning_rate": 0.00011392542495456556,
2757
+ "loss": 0.28,
2758
+ "step": 372000
2759
+ },
2760
+ {
2761
+ "epoch": 5.7,
2762
+ "learning_rate": 0.00011372275718712006,
2763
+ "loss": 0.2797,
2764
+ "step": 373000
2765
+ },
2766
+ {
2767
+ "epoch": 5.71,
2768
+ "learning_rate": 0.00011351972063300484,
2769
+ "loss": 0.2797,
2770
+ "step": 374000
2771
+ },
2772
+ {
2773
+ "epoch": 5.73,
2774
+ "learning_rate": 0.00011331631751259515,
2775
+ "loss": 0.2801,
2776
+ "step": 375000
2777
+ },
2778
+ {
2779
+ "epoch": 5.73,
2780
+ "eval_runtime": 1.0146,
2781
+ "eval_samples_per_second": 985.631,
2782
+ "eval_steps_per_second": 15.77,
2783
+ "step": 375000
2784
+ },
2785
+ {
2786
+ "epoch": 5.74,
2787
+ "learning_rate": 0.00011311255005027487,
2788
+ "loss": 0.2789,
2789
+ "step": 376000
2790
+ },
2791
+ {
2792
+ "epoch": 5.76,
2793
+ "learning_rate": 0.00011290842047441232,
2794
+ "loss": 0.2791,
2795
+ "step": 377000
2796
+ },
2797
+ {
2798
+ "epoch": 5.77,
2799
+ "learning_rate": 0.00011270393101733585,
2800
+ "loss": 0.279,
2801
+ "step": 378000
2802
+ },
2803
+ {
2804
+ "epoch": 5.79,
2805
+ "learning_rate": 0.00011249908391530946,
2806
+ "loss": 0.279,
2807
+ "step": 379000
2808
+ },
2809
+ {
2810
+ "epoch": 5.8,
2811
+ "learning_rate": 0.00011229388140850814,
2812
+ "loss": 0.279,
2813
+ "step": 380000
2814
+ },
2815
+ {
2816
+ "epoch": 5.8,
2817
+ "eval_runtime": 1.2375,
2818
+ "eval_samples_per_second": 808.112,
2819
+ "eval_steps_per_second": 12.93,
2820
+ "step": 380000
2821
  }
2822
  ],
2823
  "max_steps": 1000000,
2824
  "num_train_epochs": 16,
2825
+ "total_flos": 2.6638066338124477e+22,
2826
  "trial_name": null,
2827
  "trial_params": null
2828
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0f65f9d24c194387d73c6d6206aa2a527cc855b09f2bbd98f42e2d70ffdd0e6
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b70ffcb599d0cbcc5aa0449b31396d7f0aecaf32d47481cf0cbeb78e7394dcdc
3
  size 449471589