Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
e76e0b0
1 Parent(s): 3aa0269

Training in progress, step 160000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af89620dabb8befadb717e149645c7b1a4baa437ae00fe1a45d193867a75747e
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51c4479b7100b24acffdfd7fb1cff497645cac828edc9bce49ad39669a19e6f1
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4473132994381129211918f004185b9788753aef90d5b6db4b7139479af4a5e
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f45b8970c2fcdae44788b5d4ade86d7949295115594ab3b0d456c282cadcd002
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ce68a515967919f0a865a5bd2e1e8f70571d798e73f414abfc84271b022caff
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02a1d97b2752462543b92ffd0f23922ddd8ffff9e6ba2aaf2b57366a0cea0714
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6380926153299d8b0e27207014365338e9fc035d7cd51dfa2b4a3c25b6edbff5
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29849d211b595c5ac9c137dcd37e20da1964e185621f9086f1491a26e0f460bc
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77f61692f187e649a36856bc80d6adc9da2c6f8eb5a5983beddd87644fb8d73c
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e99c0c1e436962d7938fd416d17b1f2b444137c2e5f765032e46157e9b60a3ea
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f0c634c62ca05cfd25911633dd33cd6a1a4c0751ac34bfc4f130af2e87b7357
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00c80b4bceef61474bcae1ecae0d1e95d0713b469a0fdc8873f2259acce5bd7e
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6944aac36fb07ee223c68ca3cff3b6f262ad7e802285928ca04ff038bec935ea
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b0f5af299b689f18c326dad86c4c4c3f628480672d22f22ec90ae66ce6a4f1
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.2905309450730678,
5
- "global_step": 150000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1116,11 +1116,85 @@
1116
  "eval_samples_per_second": 958.687,
1117
  "eval_steps_per_second": 15.339,
1118
  "step": 150000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1119
  }
1120
  ],
1121
  "max_steps": 1000000,
1122
  "num_train_epochs": 16,
1123
- "total_flos": 1.0515026013189097e+22,
1124
  "trial_name": null,
1125
  "trial_params": null
1126
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.443233008077939,
5
+ "global_step": 160000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1116
  "eval_samples_per_second": 958.687,
1117
  "eval_steps_per_second": 15.339,
1118
  "step": 150000
1119
+ },
1120
+ {
1121
+ "epoch": 2.31,
1122
+ "learning_rate": 0.00014613168173223585,
1123
+ "loss": 0.3308,
1124
+ "step": 151000
1125
+ },
1126
+ {
1127
+ "epoch": 2.32,
1128
+ "learning_rate": 0.00014605543333995113,
1129
+ "loss": 0.3302,
1130
+ "step": 152000
1131
+ },
1132
+ {
1133
+ "epoch": 2.34,
1134
+ "learning_rate": 0.00014597846257603038,
1135
+ "loss": 0.3294,
1136
+ "step": 153000
1137
+ },
1138
+ {
1139
+ "epoch": 2.35,
1140
+ "learning_rate": 0.0001459007702822136,
1141
+ "loss": 0.329,
1142
+ "step": 154000
1143
+ },
1144
+ {
1145
+ "epoch": 2.37,
1146
+ "learning_rate": 0.00014582235730813128,
1147
+ "loss": 0.3283,
1148
+ "step": 155000
1149
+ },
1150
+ {
1151
+ "epoch": 2.37,
1152
+ "eval_runtime": 1.0629,
1153
+ "eval_samples_per_second": 940.817,
1154
+ "eval_steps_per_second": 15.053,
1155
+ "step": 155000
1156
+ },
1157
+ {
1158
+ "epoch": 2.38,
1159
+ "learning_rate": 0.00014574322451129507,
1160
+ "loss": 0.3281,
1161
+ "step": 156000
1162
+ },
1163
+ {
1164
+ "epoch": 2.4,
1165
+ "learning_rate": 0.00014566337275708863,
1166
+ "loss": 0.328,
1167
+ "step": 157000
1168
+ },
1169
+ {
1170
+ "epoch": 2.41,
1171
+ "learning_rate": 0.0001455828029187579,
1172
+ "loss": 0.3272,
1173
+ "step": 158000
1174
+ },
1175
+ {
1176
+ "epoch": 2.43,
1177
+ "learning_rate": 0.00014550151587740178,
1178
+ "loss": 0.3269,
1179
+ "step": 159000
1180
+ },
1181
+ {
1182
+ "epoch": 2.44,
1183
+ "learning_rate": 0.00014541951252196225,
1184
+ "loss": 0.3265,
1185
+ "step": 160000
1186
+ },
1187
+ {
1188
+ "epoch": 2.44,
1189
+ "eval_runtime": 1.0199,
1190
+ "eval_samples_per_second": 980.452,
1191
+ "eval_steps_per_second": 15.687,
1192
+ "step": 160000
1193
  }
1194
  ],
1195
  "max_steps": 1000000,
1196
  "num_train_epochs": 16,
1197
+ "total_flos": 1.1216028623492568e+22,
1198
  "trial_name": null,
1199
  "trial_params": null
1200
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4473132994381129211918f004185b9788753aef90d5b6db4b7139479af4a5e
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f45b8970c2fcdae44788b5d4ade86d7949295115594ab3b0d456c282cadcd002
3
  size 449471589