Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
3aa0269
1 Parent(s): 684a9a1

Training in progress, step 150000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:541c09487d9370b723d6f46473ad77d95854f9f277155774d36540daed587c20
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af89620dabb8befadb717e149645c7b1a4baa437ae00fe1a45d193867a75747e
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29c9ea605b07acd9d6d6f974a1449b64b38a1f91d2d0376e5cf078cd024be1d7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4473132994381129211918f004185b9788753aef90d5b6db4b7139479af4a5e
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b84e894ef7a6033cd0e73130f2ebea7e9ec1ffbcfd8c8b79709a364acfd0ff22
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ce68a515967919f0a865a5bd2e1e8f70571d798e73f414abfc84271b022caff
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:846e21193961d3c01650602fd61d067e6d15bb106fa27a0a886ebc7bc071a463
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6380926153299d8b0e27207014365338e9fc035d7cd51dfa2b4a3c25b6edbff5
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3963fd41f8e5a2e50a3c7c43d6a3b5ff095e754a9f186db5cd3c2302fcde5d99
3
  size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77f61692f187e649a36856bc80d6adc9da2c6f8eb5a5983beddd87644fb8d73c
3
  size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14ea5cea28ed719f191afec655c9dab07c0fb35f9db9c4929b4e91078fef40d5
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f0c634c62ca05cfd25911633dd33cd6a1a4c0751ac34bfc4f130af2e87b7357
3
+ size 14439
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5024aa92c1c16069c6562483f940b6c61d0a6604a0773cc4bdb5211b70f77f4
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6944aac36fb07ee223c68ca3cff3b6f262ad7e802285928ca04ff038bec935ea
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.1378288820681965,
5
- "global_step": 140000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1042,11 +1042,85 @@
1042
  "eval_samples_per_second": 989.716,
1043
  "eval_steps_per_second": 15.835,
1044
  "step": 140000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1045
  }
1046
  ],
1047
  "max_steps": 1000000,
1048
  "num_train_epochs": 16,
1049
- "total_flos": 9.814023402885625e+21,
1050
  "trial_name": null,
1051
  "trial_params": null
1052
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.2905309450730678,
5
+ "global_step": 150000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1042
  "eval_samples_per_second": 989.716,
1043
  "eval_steps_per_second": 15.835,
1044
  "step": 140000
1045
+ },
1046
+ {
1047
+ "epoch": 2.15,
1048
+ "learning_rate": 0.00014685425569221819,
1049
+ "loss": 0.3353,
1050
+ "step": 141000
1051
+ },
1052
+ {
1053
+ "epoch": 2.17,
1054
+ "learning_rate": 0.00014678527556960207,
1055
+ "loss": 0.3346,
1056
+ "step": 142000
1057
+ },
1058
+ {
1059
+ "epoch": 2.18,
1060
+ "learning_rate": 0.0001467155650939123,
1061
+ "loss": 0.3342,
1062
+ "step": 143000
1063
+ },
1064
+ {
1065
+ "epoch": 2.2,
1066
+ "learning_rate": 0.00014664512502749141,
1067
+ "loss": 0.3338,
1068
+ "step": 144000
1069
+ },
1070
+ {
1071
+ "epoch": 2.21,
1072
+ "learning_rate": 0.00014657395614066075,
1073
+ "loss": 0.3334,
1074
+ "step": 145000
1075
+ },
1076
+ {
1077
+ "epoch": 2.21,
1078
+ "eval_runtime": 1.0369,
1079
+ "eval_samples_per_second": 964.439,
1080
+ "eval_steps_per_second": 15.431,
1081
+ "step": 145000
1082
+ },
1083
+ {
1084
+ "epoch": 2.23,
1085
+ "learning_rate": 0.0001465020592117118,
1086
+ "loss": 0.3327,
1087
+ "step": 146000
1088
+ },
1089
+ {
1090
+ "epoch": 2.24,
1091
+ "learning_rate": 0.0001464294350268979,
1092
+ "loss": 0.3324,
1093
+ "step": 147000
1094
+ },
1095
+ {
1096
+ "epoch": 2.26,
1097
+ "learning_rate": 0.00014635608438042546,
1098
+ "loss": 0.3319,
1099
+ "step": 148000
1100
+ },
1101
+ {
1102
+ "epoch": 2.28,
1103
+ "learning_rate": 0.00014628200807444543,
1104
+ "loss": 0.3313,
1105
+ "step": 149000
1106
+ },
1107
+ {
1108
+ "epoch": 2.29,
1109
+ "learning_rate": 0.0001462072069190444,
1110
+ "loss": 0.3307,
1111
+ "step": 150000
1112
+ },
1113
+ {
1114
+ "epoch": 2.29,
1115
+ "eval_runtime": 1.0431,
1116
+ "eval_samples_per_second": 958.687,
1117
+ "eval_steps_per_second": 15.339,
1118
+ "step": 150000
1119
  }
1120
  ],
1121
  "max_steps": 1000000,
1122
  "num_train_epochs": 16,
1123
+ "total_flos": 1.0515026013189097e+22,
1124
  "trial_name": null,
1125
  "trial_params": null
1126
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29c9ea605b07acd9d6d6f974a1449b64b38a1f91d2d0376e5cf078cd024be1d7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4473132994381129211918f004185b9788753aef90d5b6db4b7139479af4a5e
3
  size 449471589