pierreguillou committed on
Commit
91b6951
•
1 Parent(s): 4e02099

Training in progress, step 11500

Browse files
Files changed (24) hide show
  1. {checkpoint-10000 → checkpoint-11000}/config.json +0 -0
  2. {checkpoint-10000 → checkpoint-11000}/optimizer.pt +1 -1
  3. {checkpoint-10500 → checkpoint-11000}/pytorch_model.bin +1 -1
  4. {checkpoint-10500 → checkpoint-11000}/rng_state.pth +1 -1
  5. {checkpoint-10500 → checkpoint-11000}/scaler.pt +1 -1
  6. {checkpoint-10000 → checkpoint-11000}/scheduler.pt +1 -1
  7. {checkpoint-10000 → checkpoint-11000}/special_tokens_map.json +0 -0
  8. {checkpoint-10000 → checkpoint-11000}/tokenizer.json +0 -0
  9. {checkpoint-10000 → checkpoint-11000}/tokenizer_config.json +0 -0
  10. {checkpoint-10500 → checkpoint-11000}/trainer_state.json +21 -3
  11. {checkpoint-10000 → checkpoint-11000}/training_args.bin +0 -0
  12. {checkpoint-10500 → checkpoint-11500}/config.json +0 -0
  13. {checkpoint-10500 → checkpoint-11500}/optimizer.pt +1 -1
  14. {checkpoint-10000 → checkpoint-11500}/pytorch_model.bin +1 -1
  15. {checkpoint-10000 → checkpoint-11500}/rng_state.pth +1 -1
  16. {checkpoint-10000 → checkpoint-11500}/scaler.pt +1 -1
  17. {checkpoint-10500 → checkpoint-11500}/scheduler.pt +1 -1
  18. {checkpoint-10500 → checkpoint-11500}/special_tokens_map.json +0 -0
  19. {checkpoint-10500 → checkpoint-11500}/tokenizer.json +0 -0
  20. {checkpoint-10500 → checkpoint-11500}/tokenizer_config.json +0 -0
  21. {checkpoint-10000 → checkpoint-11500}/trainer_state.json +57 -3
  22. {checkpoint-10500 → checkpoint-11500}/training_args.bin +0 -0
  23. pytorch_model.bin +1 -1
  24. runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-10000 → checkpoint-11000}/config.json RENAMED
File without changes
{checkpoint-10000 → checkpoint-11000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d284277e529a50e3e8bb5292a6ded11322ad1fc7a52ec65935b405cb7662695
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a373613aeeb4d6be34886b231335f8c8f20879c526ba375b702a8ec78acc96a8
3
  size 2265828101
{checkpoint-10500 → checkpoint-11000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ded9cb2eeea21506721e8c61ffb8b582933f1daa41565103186b7c1e36b4c34
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c57e05d3f7e9c882e3cf561394a94532ce7d4df59b422bf335fad1498c1cc3e
3
  size 1134425553
{checkpoint-10500 → checkpoint-11000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71d4bb3c3265e07b1b570a635f165856008288f9ef44970f54c27bda7a78510a
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc6c1a25455a0ac08a6ba15e2bb0949f0e47c53b5d7e9f6781b4d75bdb78a0d
3
  size 14575
{checkpoint-10500 → checkpoint-11000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0189e6a21dbc7825032487f150c86eee8abb079d598cf29704ea468feba66754
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1cf22c2871c42a245e6e913d024763352b9f1be40e2deb2b845f641c7d0252c
3
  size 557
{checkpoint-10000 → checkpoint-11000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c34c3aa5eb00aba6650e668fcf350c18b296ed27ff6b939de04b85351858f303
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc076744799314c413b1a22fd57768d86453e79c6cbb2e75e964b3a373c4958
3
  size 627
{checkpoint-10000 → checkpoint-11000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-10000 → checkpoint-11000}/tokenizer.json RENAMED
File without changes
{checkpoint-10000 → checkpoint-11000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-10500 → checkpoint-11000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
- "epoch": 4.362276692978812,
5
- "global_step": 10500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -384,11 +384,29 @@
384
  "eval_samples_per_second": 58.947,
385
  "eval_steps_per_second": 3.706,
386
  "step": 10500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
387
  }
388
  ],
389
  "max_steps": 12035,
390
  "num_train_epochs": 5,
391
- "total_flos": 1.7519009430408192e+16,
392
  "trial_name": null,
393
  "trial_params": null
394
  }
 
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
+ "epoch": 4.570004154549231,
5
+ "global_step": 11000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
384
  "eval_samples_per_second": 58.947,
385
  "eval_steps_per_second": 3.706,
386
  "step": 10500
387
+ },
388
+ {
389
+ "epoch": 4.57,
390
+ "learning_rate": 4.333194848358953e-06,
391
+ "loss": 0.039,
392
+ "step": 11000
393
+ },
394
+ {
395
+ "epoch": 4.57,
396
+ "eval_accuracy": 0.8635778739283588,
397
+ "eval_f1": 0.8635778739283588,
398
+ "eval_loss": 0.9634060263633728,
399
+ "eval_precision": 0.8635778739283588,
400
+ "eval_recall": 0.8635778739283588,
401
+ "eval_runtime": 39.6244,
402
+ "eval_samples_per_second": 51.786,
403
+ "eval_steps_per_second": 3.256,
404
+ "step": 11000
405
  }
406
  ],
407
  "max_steps": 12035,
408
  "num_train_epochs": 5,
409
+ "total_flos": 1.835352614695219e+16,
410
  "trial_name": null,
411
  "trial_params": null
412
  }
{checkpoint-10000 → checkpoint-11000}/training_args.bin RENAMED
File without changes
{checkpoint-10500 → checkpoint-11500}/config.json RENAMED
File without changes
{checkpoint-10500 → checkpoint-11500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f73f8178eb8edf00ed5b572bab08ed8dc9a6b9f127b9da0845ce6897121f30d4
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a987de3ede3a55ee97ff63886937a088657c2157826f53d07345ccc9c7e5d778
3
  size 2265828101
{checkpoint-10000 → checkpoint-11500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9cdd3999fd22f100fd94dce143c740e69b3c530d00c63fa0da503c17bada7be
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a336d572b84d95a1c812e645a72e90873027257b83cee92eef0d3a78890c576
3
  size 1134425553
{checkpoint-10000 → checkpoint-11500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cabb7b3cf7014541a06db66ed776280360aa7ac5090dfa97d8fd96cf3ffc0723
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0b8ef7d104554cd305a60fb7a5d256c7f82cfc12dc853397197d87e16ef1f65
3
  size 14575
{checkpoint-10000 → checkpoint-11500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33042e23a1c163afce06998300e1af98d04bb036d7a9fc004dc4fc5115c37477
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ee4f114f4e57c077eb75e91b7efc254c244508b080b0e6980415bdd75809aff
3
  size 557
{checkpoint-10500 → checkpoint-11500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bc651b3c4e5c2b5a130baba8a17171ec720b664d0099fc5a91625bbe706a9d8
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec4d60da8dcded02dd5639d5b8b5174bf534b01c0f3a7ab99393164e017b39f
3
  size 627
{checkpoint-10500 → checkpoint-11500}/special_tokens_map.json RENAMED
File without changes
{checkpoint-10500 → checkpoint-11500}/tokenizer.json RENAMED
File without changes
{checkpoint-10500 → checkpoint-11500}/tokenizer_config.json RENAMED
File without changes
{checkpoint-10000 → checkpoint-11500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
- "epoch": 4.154549231408392,
5
- "global_step": 10000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -366,11 +366,65 @@
366
  "eval_samples_per_second": 52.98,
367
  "eval_steps_per_second": 3.331,
368
  "step": 10000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
369
  }
370
  ],
371
  "max_steps": 12035,
372
  "num_train_epochs": 5,
373
- "total_flos": 1.6684492713864192e+16,
374
  "trial_name": null,
375
  "trial_params": null
376
  }
 
1
  {
2
  "best_metric": 0.8849383152916955,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
4
+ "epoch": 4.777731616119651,
5
+ "global_step": 11500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
366
  "eval_samples_per_second": 52.98,
367
  "eval_steps_per_second": 3.331,
368
  "step": 10000
369
+ },
370
+ {
371
+ "epoch": 4.36,
372
+ "learning_rate": 6.406314914831742e-06,
373
+ "loss": 0.0412,
374
+ "step": 10500
375
+ },
376
+ {
377
+ "epoch": 4.36,
378
+ "eval_accuracy": 0.8439143652185103,
379
+ "eval_f1": 0.8439143652185103,
380
+ "eval_loss": 1.1184284687042236,
381
+ "eval_precision": 0.8439143652185103,
382
+ "eval_recall": 0.8439143652185103,
383
+ "eval_runtime": 34.8108,
384
+ "eval_samples_per_second": 58.947,
385
+ "eval_steps_per_second": 3.706,
386
+ "step": 10500
387
+ },
388
+ {
389
+ "epoch": 4.57,
390
+ "learning_rate": 4.333194848358953e-06,
391
+ "loss": 0.039,
392
+ "step": 11000
393
+ },
394
+ {
395
+ "epoch": 4.57,
396
+ "eval_accuracy": 0.8635778739283588,
397
+ "eval_f1": 0.8635778739283588,
398
+ "eval_loss": 0.9634060263633728,
399
+ "eval_precision": 0.8635778739283588,
400
+ "eval_recall": 0.8635778739283588,
401
+ "eval_runtime": 39.6244,
402
+ "eval_samples_per_second": 51.786,
403
+ "eval_steps_per_second": 3.256,
404
+ "step": 11000
405
+ },
406
+ {
407
+ "epoch": 4.78,
408
+ "learning_rate": 2.2559202326547573e-06,
409
+ "loss": 0.0469,
410
+ "step": 11500
411
+ },
412
+ {
413
+ "epoch": 4.78,
414
+ "eval_accuracy": 0.8634089848964952,
415
+ "eval_f1": 0.8634089848964951,
416
+ "eval_loss": 0.9584938883781433,
417
+ "eval_precision": 0.8634089848964952,
418
+ "eval_recall": 0.8634089848964952,
419
+ "eval_runtime": 35.0357,
420
+ "eval_samples_per_second": 58.569,
421
+ "eval_steps_per_second": 3.682,
422
+ "step": 11500
423
  }
424
  ],
425
  "max_steps": 12035,
426
  "num_train_epochs": 5,
427
+ "total_flos": 1.918804286349619e+16,
428
  "trial_name": null,
429
  "trial_params": null
430
  }
{checkpoint-10500 → checkpoint-11500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ded9cb2eeea21506721e8c61ffb8b582933f1daa41565103186b7c1e36b4c34
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a336d572b84d95a1c812e645a72e90873027257b83cee92eef0d3a78890c576
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd243e364357934c6c9869396572a0adcc90607302d0df94af11534a3f187cd2
3
- size 17838
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21b09326263f0fbe132c2f3bc4c0d88999487e384816c9a0719ad3719c72fd3d
3
+ size 19096