Commit
·
86104c8
1
Parent(s):
b081990
Training in progress, step 8500
Browse files- {checkpoint-7000 → checkpoint-8000}/config.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/optimizer.pt +1 -1
- {checkpoint-7500 → checkpoint-8000}/pytorch_model.bin +1 -1
- {checkpoint-7500 → checkpoint-8000}/rng_state.pth +1 -1
- {checkpoint-7500 → checkpoint-8000}/scaler.pt +1 -1
- {checkpoint-7000 → checkpoint-8000}/scheduler.pt +1 -1
- {checkpoint-7000 → checkpoint-8000}/special_tokens_map.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/tokenizer.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/tokenizer_config.json +0 -0
- {checkpoint-7500 → checkpoint-8000}/trainer_state.json +21 -3
- {checkpoint-7000 → checkpoint-8000}/training_args.bin +0 -0
- {checkpoint-7500 → checkpoint-8500}/config.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/optimizer.pt +1 -1
- {checkpoint-7000 → checkpoint-8500}/pytorch_model.bin +1 -1
- {checkpoint-7000 → checkpoint-8500}/rng_state.pth +1 -1
- {checkpoint-7000 → checkpoint-8500}/scaler.pt +1 -1
- {checkpoint-7500 → checkpoint-8500}/scheduler.pt +1 -1
- {checkpoint-7500 → checkpoint-8500}/special_tokens_map.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/tokenizer.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/tokenizer_config.json +0 -0
- {checkpoint-7000 → checkpoint-8500}/trainer_state.json +59 -5
- {checkpoint-7500 → checkpoint-8500}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-7000 → checkpoint-8000}/config.json
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-8000}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b39cb815a920edaf287fed25e2a19b016671ea73dd16f75036bf2bcfaf1b767a
|
3 |
size 2265828101
|
{checkpoint-7500 → checkpoint-8000}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27b504e227955abd271e8dfb3a65060b57aab9124c9a51342289b2487370d857
|
3 |
size 1134425553
|
{checkpoint-7500 → checkpoint-8000}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:960a0ff8566f0b77c05a97c9fc1c687f7ca7734da4222daf4902d9e243e0137d
|
3 |
size 14575
|
{checkpoint-7500 → checkpoint-8000}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05c943ac5112ace01757b5472903bea87985b301a9f82c01afb7df322762c49c
|
3 |
size 557
|
{checkpoint-7000 → checkpoint-8000}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c82aba72db92b65d16e163361936c8fce2a4ed55ab1b817ceacaf38e10c5cade
|
3 |
size 627
|
{checkpoint-7000 → checkpoint-8000}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-8000}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-8000}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-7500 → checkpoint-8000}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 0.8573209374145502,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
4 |
-
"epoch": 3.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -276,11 +276,29 @@
|
|
276 |
"eval_samples_per_second": 61.609,
|
277 |
"eval_steps_per_second": 3.873,
|
278 |
"step": 7500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
279 |
}
|
280 |
],
|
281 |
"max_steps": 12035,
|
282 |
"num_train_epochs": 5,
|
283 |
-
"total_flos": 1.
|
284 |
"trial_name": null,
|
285 |
"trial_params": null
|
286 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 0.8573209374145502,
|
3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
4 |
+
"epoch": 3.3236393851267136,
|
5 |
+
"global_step": 8000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
276 |
"eval_samples_per_second": 61.609,
|
277 |
"eval_steps_per_second": 3.873,
|
278 |
"step": 7500
|
279 |
+
},
|
280 |
+
{
|
281 |
+
"epoch": 3.32,
|
282 |
+
"learning_rate": 1.6792687993352722e-05,
|
283 |
+
"loss": 0.0788,
|
284 |
+
"step": 8000
|
285 |
+
},
|
286 |
+
{
|
287 |
+
"epoch": 3.32,
|
288 |
+
"eval_accuracy": 0.8364993324862074,
|
289 |
+
"eval_f1": 0.8364993324862076,
|
290 |
+
"eval_loss": 1.028805136680603,
|
291 |
+
"eval_precision": 0.8364993324862074,
|
292 |
+
"eval_recall": 0.8364993324862074,
|
293 |
+
"eval_runtime": 38.2117,
|
294 |
+
"eval_samples_per_second": 53.701,
|
295 |
+
"eval_steps_per_second": 3.376,
|
296 |
+
"step": 8000
|
297 |
}
|
298 |
],
|
299 |
"max_steps": 12035,
|
300 |
"num_train_epochs": 5,
|
301 |
+
"total_flos": 1.3347886251942144e+16,
|
302 |
"trial_name": null,
|
303 |
"trial_params": null
|
304 |
}
|
{checkpoint-7000 → checkpoint-8000}/training_args.bin
RENAMED
File without changes
|
{checkpoint-7500 → checkpoint-8500}/config.json
RENAMED
File without changes
|
{checkpoint-7500 → checkpoint-8500}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2265828101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea130ecc564ac6fe490d67f54147e9dc00bf72e39d0688a66ba68802757a9e2b
|
3 |
size 2265828101
|
{checkpoint-7000 → checkpoint-8500}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e39c7d7515bc3fd9710bfa20bd4d1d7c408894096e55b518c4e64c07ac0ff33b
|
3 |
size 1134425553
|
{checkpoint-7000 → checkpoint-8500}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c16ad00f12a6b00ebecd82041529c62f714ed6d5992e9f831161d0979641cda
|
3 |
size 14575
|
{checkpoint-7000 → checkpoint-8500}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4c06e32f681823ca88423b1784605ca44bf8a960abc7518ae6b79b079157ccc
|
3 |
size 557
|
{checkpoint-7500 → checkpoint-8500}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53b7ca82f31c9b2520ad7f958578cfcb752be5bbfebe85216932fd844130a1eb
|
3 |
size 627
|
{checkpoint-7500 → checkpoint-8500}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-7500 → checkpoint-8500}/tokenizer.json
RENAMED
File without changes
|
{checkpoint-7500 → checkpoint-8500}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-8500}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -258,11 +258,65 @@
|
|
258 |
"eval_samples_per_second": 51.982,
|
259 |
"eval_steps_per_second": 3.268,
|
260 |
"step": 7000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
261 |
}
|
262 |
],
|
263 |
"max_steps": 12035,
|
264 |
"num_train_epochs": 5,
|
265 |
-
"total_flos": 1.
|
266 |
"trial_name": null,
|
267 |
"trial_params": null
|
268 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.8849383152916955,
|
3 |
+
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
4 |
+
"epoch": 3.5313668466971335,
|
5 |
+
"global_step": 8500,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
258 |
"eval_samples_per_second": 51.982,
|
259 |
"eval_steps_per_second": 3.268,
|
260 |
"step": 7000
|
261 |
+
},
|
262 |
+
{
|
263 |
+
"epoch": 3.12,
|
264 |
+
"learning_rate": 1.886996260905692e-05,
|
265 |
+
"loss": 0.1012,
|
266 |
+
"step": 7500
|
267 |
+
},
|
268 |
+
{
|
269 |
+
"epoch": 3.12,
|
270 |
+
"eval_accuracy": 0.8385581702079747,
|
271 |
+
"eval_f1": 0.8385581702079747,
|
272 |
+
"eval_loss": 0.8271787166595459,
|
273 |
+
"eval_precision": 0.8385581702079747,
|
274 |
+
"eval_recall": 0.8385581702079747,
|
275 |
+
"eval_runtime": 33.307,
|
276 |
+
"eval_samples_per_second": 61.609,
|
277 |
+
"eval_steps_per_second": 3.873,
|
278 |
+
"step": 7500
|
279 |
+
},
|
280 |
+
{
|
281 |
+
"epoch": 3.32,
|
282 |
+
"learning_rate": 1.6792687993352722e-05,
|
283 |
+
"loss": 0.0788,
|
284 |
+
"step": 8000
|
285 |
+
},
|
286 |
+
{
|
287 |
+
"epoch": 3.32,
|
288 |
+
"eval_accuracy": 0.8364993324862074,
|
289 |
+
"eval_f1": 0.8364993324862076,
|
290 |
+
"eval_loss": 1.028805136680603,
|
291 |
+
"eval_precision": 0.8364993324862074,
|
292 |
+
"eval_recall": 0.8364993324862074,
|
293 |
+
"eval_runtime": 38.2117,
|
294 |
+
"eval_samples_per_second": 53.701,
|
295 |
+
"eval_steps_per_second": 3.376,
|
296 |
+
"step": 8000
|
297 |
+
},
|
298 |
+
{
|
299 |
+
"epoch": 3.53,
|
300 |
+
"learning_rate": 1.4715413377648527e-05,
|
301 |
+
"loss": 0.0802,
|
302 |
+
"step": 8500
|
303 |
+
},
|
304 |
+
{
|
305 |
+
"epoch": 3.53,
|
306 |
+
"eval_accuracy": 0.8849383152916955,
|
307 |
+
"eval_f1": 0.8849383152916955,
|
308 |
+
"eval_loss": 0.719699501991272,
|
309 |
+
"eval_precision": 0.8849383152916955,
|
310 |
+
"eval_recall": 0.8849383152916955,
|
311 |
+
"eval_runtime": 34.4056,
|
312 |
+
"eval_samples_per_second": 59.641,
|
313 |
+
"eval_steps_per_second": 3.749,
|
314 |
+
"step": 8500
|
315 |
}
|
316 |
],
|
317 |
"max_steps": 12035,
|
318 |
"num_train_epochs": 5,
|
319 |
+
"total_flos": 1.4182402968486144e+16,
|
320 |
"trial_name": null,
|
321 |
"trial_params": null
|
322 |
}
|
{checkpoint-7500 → checkpoint-8500}/training_args.bin
RENAMED
File without changes
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1134425553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e39c7d7515bc3fd9710bfa20bd4d1d7c408894096e55b518c4e64c07ac0ff33b
|
3 |
size 1134425553
|
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f7c4c7428bf319a3138119ab5d1663f67efa67393e048e30432a37e3bf8e016
|
3 |
+
size 15322
|