pierreguillou
committed on
Commit
•
dbd4532
1
Parent(s):
a00a34d
Training in progress, step 6500
Browse files
- {checkpoint-4500 → checkpoint-6000}/config.json +0 -0
- {checkpoint-4500 → checkpoint-6000}/optimizer.pt +1 -1
- {checkpoint-5000 → checkpoint-6000}/pytorch_model.bin +1 -1
- {checkpoint-5000 → checkpoint-6000}/rng_state.pth +1 -1
- {checkpoint-5000 → checkpoint-6000}/scaler.pt +1 -1
- {checkpoint-4500 → checkpoint-6000}/scheduler.pt +1 -1
- {checkpoint-4500 → checkpoint-6000}/special_tokens_map.json +0 -0
- {checkpoint-4500 → checkpoint-6000}/tokenizer.json +0 -0
- {checkpoint-4500 → checkpoint-6000}/tokenizer_config.json +0 -0
- {checkpoint-5000 → checkpoint-6000}/trainer_state.json +41 -5
- {checkpoint-4500 → checkpoint-6000}/training_args.bin +0 -0
- {checkpoint-5000 → checkpoint-6500}/config.json +0 -0
- {checkpoint-5000 → checkpoint-6500}/optimizer.pt +1 -1
- {checkpoint-4500 → checkpoint-6500}/pytorch_model.bin +1 -1
- {checkpoint-4500 → checkpoint-6500}/rng_state.pth +1 -1
- {checkpoint-4500 → checkpoint-6500}/scaler.pt +1 -1
- {checkpoint-5000 → checkpoint-6500}/scheduler.pt +1 -1
- {checkpoint-5000 → checkpoint-6500}/special_tokens_map.json +0 -0
- {checkpoint-5000 → checkpoint-6500}/tokenizer.json +0 -0
- {checkpoint-5000 → checkpoint-6500}/tokenizer_config.json +0 -0
- {checkpoint-4500 → checkpoint-6500}/trainer_state.json +77 -5
- {checkpoint-5000 → checkpoint-6500}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-4500 → checkpoint-6000}/config.json
RENAMED
File without changes
|
{checkpoint-4500 → checkpoint-6000}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6ccab808598cafaa3502eaf827acb795d751b863043a68024a8ebc252765dda
|
3 |
size 2265828101
|
{checkpoint-5000 → checkpoint-6000}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9effd102ed93d81722319ca88162190926ca77de0e9c79bcdf05fedc7571c41
|
3 |
size 1134425553
|
{checkpoint-5000 → checkpoint-6000}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33f25f963833bb60f4e565ecbfcbf34d003c383bcd545a16637c61002e2435ad
|
3 |
size 14575
|
{checkpoint-5000 → checkpoint-6000}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06535ee946097fce21c4464212b93d33310a3a654d4286c652849b57cf50a7f8
|
3 |
size 557
|
{checkpoint-4500 → checkpoint-6000}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72f3b66da2277cfe6e060fe737d382a511cc283da3a6c66c08f0ac5f7793cfb9
|
3 |
size 627
|
{checkpoint-4500 → checkpoint-6000}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-4500 → checkpoint-6000}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-4500 → checkpoint-6000}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-5000 → checkpoint-6000}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -186,11 +186,47 @@
|
|
186 |
"eval_samples_per_second": 53.645,
|
187 |
"eval_steps_per_second": 3.372,
|
188 |
"step": 5000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
189 |
}
|
190 |
],
|
191 |
"max_steps": 12035,
|
192 |
"num_train_epochs": 5,
|
193 |
-
"total_flos":
|
194 |
"trial_name": null,
|
195 |
"trial_params": null
|
196 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.8573209374145502,
|
3 |
+
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
4 |
+
"epoch": 2.4927295388450355,
|
5 |
+
"global_step": 6000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
186 |
"eval_samples_per_second": 53.645,
|
187 |
"eval_steps_per_second": 3.372,
|
188 |
"step": 5000
|
189 |
+
},
|
190 |
+
{
|
191 |
+
"epoch": 2.29,
|
192 |
+
"learning_rate": 2.7179061071873702e-05,
|
193 |
+
"loss": 0.1294,
|
194 |
+
"step": 5500
|
195 |
+
},
|
196 |
+
{
|
197 |
+
"epoch": 2.29,
|
198 |
+
"eval_accuracy": 0.8489327821653182,
|
199 |
+
"eval_f1": 0.8489327821653182,
|
200 |
+
"eval_loss": 0.8485749959945679,
|
201 |
+
"eval_precision": 0.8489327821653182,
|
202 |
+
"eval_recall": 0.8489327821653182,
|
203 |
+
"eval_runtime": 33.5765,
|
204 |
+
"eval_samples_per_second": 61.114,
|
205 |
+
"eval_steps_per_second": 3.842,
|
206 |
+
"step": 5500
|
207 |
+
},
|
208 |
+
{
|
209 |
+
"epoch": 2.49,
|
210 |
+
"learning_rate": 2.5101786456169508e-05,
|
211 |
+
"loss": 0.134,
|
212 |
+
"step": 6000
|
213 |
+
},
|
214 |
+
{
|
215 |
+
"epoch": 2.49,
|
216 |
+
"eval_accuracy": 0.8573209374145502,
|
217 |
+
"eval_f1": 0.8573209374145502,
|
218 |
+
"eval_loss": 0.7681939005851746,
|
219 |
+
"eval_precision": 0.8573209374145502,
|
220 |
+
"eval_recall": 0.8573209374145502,
|
221 |
+
"eval_runtime": 39.5768,
|
222 |
+
"eval_samples_per_second": 51.849,
|
223 |
+
"eval_steps_per_second": 3.259,
|
224 |
+
"step": 6000
|
225 |
}
|
226 |
],
|
227 |
"max_steps": 12035,
|
228 |
"num_train_epochs": 5,
|
229 |
+
"total_flos": 1.0011279790020096e+16,
|
230 |
"trial_name": null,
|
231 |
"trial_params": null
|
232 |
}
|
{checkpoint-4500 → checkpoint-6000}/training_args.bin
RENAMED
File without changes
|
{checkpoint-5000 → checkpoint-6500}/config.json
RENAMED
File without changes
|
{checkpoint-5000 → checkpoint-6500}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:363b00981239b12adf86f779858e84efae5e7df9ed3d90c59b318b8b8fd859b0
|
3 |
size 2265828101
|
{checkpoint-4500 → checkpoint-6500}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
|
3 |
size 1134425553
|
{checkpoint-4500 → checkpoint-6500}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2155603d2a90e6f05afc18565c0a7971b5a33e500179dd735d7729ffabd71cf8
|
3 |
size 14575
|
{checkpoint-4500 → checkpoint-6500}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eec39e20dd1d19e75d63c9ea6180a447b93a16fe8c240630ce7a3dddde70b3a
|
3 |
size 557
|
{checkpoint-5000 → checkpoint-6500}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9d8fc4d7b4bac08d88a4d03d2daffd167bc9d42006a1ae8f011989b8eedebcd
|
3 |
size 627
|
{checkpoint-5000 → checkpoint-6500}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-5000 → checkpoint-6500}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-5000 → checkpoint-6500}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-4500 → checkpoint-6500}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -168,11 +168,83 @@
|
|
168 |
"eval_samples_per_second": 58.527,
|
169 |
"eval_steps_per_second": 3.679,
|
170 |
"step": 4500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
171 |
}
|
172 |
],
|
173 |
"max_steps": 12035,
|
174 |
"num_train_epochs": 5,
|
175 |
-
"total_flos":
|
176 |
"trial_name": null,
|
177 |
"trial_params": null
|
178 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.8573209374145502,
|
3 |
+
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
4 |
+
"epoch": 2.700457000415455,
|
5 |
+
"global_step": 6500,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
168 |
"eval_samples_per_second": 58.527,
|
169 |
"eval_steps_per_second": 3.679,
|
170 |
"step": 4500
|
171 |
+
},
|
172 |
+
{
|
173 |
+
"epoch": 2.08,
|
174 |
+
"learning_rate": 2.9256335687577903e-05,
|
175 |
+
"loss": 0.1704,
|
176 |
+
"step": 5000
|
177 |
+
},
|
178 |
+
{
|
179 |
+
"epoch": 2.08,
|
180 |
+
"eval_accuracy": 0.8317543549243216,
|
181 |
+
"eval_f1": 0.8317543549243216,
|
182 |
+
"eval_loss": 0.856721818447113,
|
183 |
+
"eval_precision": 0.8317543549243216,
|
184 |
+
"eval_recall": 0.8317543549243216,
|
185 |
+
"eval_runtime": 38.2513,
|
186 |
+
"eval_samples_per_second": 53.645,
|
187 |
+
"eval_steps_per_second": 3.372,
|
188 |
+
"step": 5000
|
189 |
+
},
|
190 |
+
{
|
191 |
+
"epoch": 2.29,
|
192 |
+
"learning_rate": 2.7179061071873702e-05,
|
193 |
+
"loss": 0.1294,
|
194 |
+
"step": 5500
|
195 |
+
},
|
196 |
+
{
|
197 |
+
"epoch": 2.29,
|
198 |
+
"eval_accuracy": 0.8489327821653182,
|
199 |
+
"eval_f1": 0.8489327821653182,
|
200 |
+
"eval_loss": 0.8485749959945679,
|
201 |
+
"eval_precision": 0.8489327821653182,
|
202 |
+
"eval_recall": 0.8489327821653182,
|
203 |
+
"eval_runtime": 33.5765,
|
204 |
+
"eval_samples_per_second": 61.114,
|
205 |
+
"eval_steps_per_second": 3.842,
|
206 |
+
"step": 5500
|
207 |
+
},
|
208 |
+
{
|
209 |
+
"epoch": 2.49,
|
210 |
+
"learning_rate": 2.5101786456169508e-05,
|
211 |
+
"loss": 0.134,
|
212 |
+
"step": 6000
|
213 |
+
},
|
214 |
+
{
|
215 |
+
"epoch": 2.49,
|
216 |
+
"eval_accuracy": 0.8573209374145502,
|
217 |
+
"eval_f1": 0.8573209374145502,
|
218 |
+
"eval_loss": 0.7681939005851746,
|
219 |
+
"eval_precision": 0.8573209374145502,
|
220 |
+
"eval_recall": 0.8573209374145502,
|
221 |
+
"eval_runtime": 39.5768,
|
222 |
+
"eval_samples_per_second": 51.849,
|
223 |
+
"eval_steps_per_second": 3.259,
|
224 |
+
"step": 6000
|
225 |
+
},
|
226 |
+
{
|
227 |
+
"epoch": 2.7,
|
228 |
+
"learning_rate": 2.302451184046531e-05,
|
229 |
+
"loss": 0.1354,
|
230 |
+
"step": 6500
|
231 |
+
},
|
232 |
+
{
|
233 |
+
"epoch": 2.7,
|
234 |
+
"eval_accuracy": 0.8255697994241689,
|
235 |
+
"eval_f1": 0.8255697994241689,
|
236 |
+
"eval_loss": 0.9870807528495789,
|
237 |
+
"eval_precision": 0.8255697994241689,
|
238 |
+
"eval_recall": 0.8255697994241689,
|
239 |
+
"eval_runtime": 34.6532,
|
240 |
+
"eval_samples_per_second": 59.215,
|
241 |
+
"eval_steps_per_second": 3.723,
|
242 |
+
"step": 6500
|
243 |
}
|
244 |
],
|
245 |
"max_steps": 12035,
|
246 |
"num_train_epochs": 5,
|
247 |
+
"total_flos": 1.0845796506564096e+16,
|
248 |
"trial_name": null,
|
249 |
"trial_params": null
|
250 |
}
|
{checkpoint-5000 → checkpoint-6500}/training_args.bin
RENAMED
File without changes
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
|
3 |
size 1134425553
|
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fe49282ece83f2b951a8a5e3ecb00a72d560e9d3422709897756658604d5989
|
3 |
+
size 12806
|