pierreguillou committed on
Commit
2e14fb8
•
1 Parent(s): b583cf5

Training in progress, step 3500

Browse files
Files changed (24) hide show
  1. {checkpoint-1500 → checkpoint-3000}/config.json +0 -0
  2. {checkpoint-1500 → checkpoint-3000}/optimizer.pt +1 -1
  3. {checkpoint-2500 → checkpoint-3000}/pytorch_model.bin +1 -1
  4. {checkpoint-2500 → checkpoint-3000}/rng_state.pth +1 -1
  5. {checkpoint-2500 → checkpoint-3000}/scaler.pt +1 -1
  6. {checkpoint-1500 → checkpoint-3000}/scheduler.pt +1 -1
  7. {checkpoint-1500 → checkpoint-3000}/special_tokens_map.json +0 -0
  8. {checkpoint-1500 → checkpoint-3000}/tokenizer.json +0 -0
  9. {checkpoint-1500 → checkpoint-3000}/tokenizer_config.json +0 -0
  10. {checkpoint-2500 → checkpoint-3000}/trainer_state.json +21 -3
  11. {checkpoint-1500 → checkpoint-3000}/training_args.bin +0 -0
  12. {checkpoint-2500 → checkpoint-3500}/config.json +0 -0
  13. {checkpoint-2500 → checkpoint-3500}/optimizer.pt +1 -1
  14. {checkpoint-1500 → checkpoint-3500}/pytorch_model.bin +1 -1
  15. {checkpoint-1500 → checkpoint-3500}/rng_state.pth +1 -1
  16. {checkpoint-1500 → checkpoint-3500}/scaler.pt +1 -1
  17. {checkpoint-2500 → checkpoint-3500}/scheduler.pt +1 -1
  18. {checkpoint-2500 → checkpoint-3500}/special_tokens_map.json +0 -0
  19. {checkpoint-2500 → checkpoint-3500}/tokenizer.json +0 -0
  20. {checkpoint-2500 → checkpoint-3500}/tokenizer_config.json +0 -0
  21. {checkpoint-1500 → checkpoint-3500}/trainer_state.json +77 -5
  22. {checkpoint-2500 → checkpoint-3500}/training_args.bin +0 -0
  23. pytorch_model.bin +1 -1
  24. runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-1500 → checkpoint-3000}/config.json RENAMED
File without changes
{checkpoint-1500 → checkpoint-3000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e23364a6999277a663e128d860936666da5c97d392396e7e1bb598c485db3e4c
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea30a7a290b75e6639badd0ebfe8594014d2cc513e9d18b2249bd41588645928
3
  size 2265828101
{checkpoint-2500 → checkpoint-3000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a13afdc894a855563bdc308de94030cb3ee880f8e35ef0b0686b90e4be049c5
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a4df4b206cec3ac33800bf53b9770b506aee9e140e2756dfcd4dfb7ea309183
3
  size 1134425553
{checkpoint-2500 → checkpoint-3000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c9591d44de932d974bc8f226917be3716a00b069a491eca25e99d763d7d1202
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1d2c6980d4c9d77f21501530c26c1da9f3782a90a07e0ad58f806cca3b17da
3
  size 14575
{checkpoint-2500 → checkpoint-3000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0657c6296ff60320a3cd6258c348ecc016115157a70e0b03987126ec22d4801f
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e954dd65b2459d99d79aa1c0dbd58ae609a1a5900b64ee547452af45217be0
3
  size 557
{checkpoint-1500 → checkpoint-3000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cb4c24baee1d80158990ceb4f9780c1a6dd6396dffda96df7d63fa2d0ae5653
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb16ae567012aed0ca098fc1879d6f8c8fca82e03a708abcc358edf60eabad88
3
  size 627
{checkpoint-1500 → checkpoint-3000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-1500 → checkpoint-3000}/tokenizer.json RENAMED
File without changes
{checkpoint-1500 → checkpoint-3000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-2500 → checkpoint-3000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8337166846278812,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-2000",
4
- "epoch": 1.038637307852098,
5
- "global_step": 2500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -96,11 +96,29 @@
96
  "eval_samples_per_second": 61.014,
97
  "eval_steps_per_second": 3.836,
98
  "step": 2500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  }
100
  ],
101
  "max_steps": 12035,
102
  "num_train_epochs": 5,
103
- "total_flos": 4171123178466048.0,
104
  "trial_name": null,
105
  "trial_params": null
106
  }
 
1
  {
2
  "best_metric": 0.8337166846278812,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-2000",
4
+ "epoch": 1.2463647694225177,
5
+ "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
96
  "eval_samples_per_second": 61.014,
97
  "eval_steps_per_second": 3.836,
98
  "step": 2500
99
+ },
100
+ {
101
+ "epoch": 1.25,
102
+ "learning_rate": 3.756543415039468e-05,
103
+ "loss": 0.2377,
104
+ "step": 3000
105
+ },
106
+ {
107
+ "epoch": 1.25,
108
+ "eval_accuracy": 0.8165945537308391,
109
+ "eval_f1": 0.8165945537308391,
110
+ "eval_loss": 0.9047627449035645,
111
+ "eval_precision": 0.8165945537308391,
112
+ "eval_recall": 0.8165945537308391,
113
+ "eval_runtime": 39.8436,
114
+ "eval_samples_per_second": 51.501,
115
+ "eval_steps_per_second": 3.238,
116
+ "step": 3000
117
  }
118
  ],
119
  "max_steps": 12035,
120
  "num_train_epochs": 5,
121
+ "total_flos": 5005639895010048.0,
122
  "trial_name": null,
123
  "trial_params": null
124
  }
{checkpoint-1500 → checkpoint-3000}/training_args.bin RENAMED
File without changes
{checkpoint-2500 → checkpoint-3500}/config.json RENAMED
File without changes
{checkpoint-2500 → checkpoint-3500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:249b736b0ee96830be7e13d95931eda8b17d72ed799b1d53bf204baa5ec28678
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15c3fdcaf971cedf361391dddb094e11c51b1ce421726a0675d31804062b208a
3
  size 2265828101
{checkpoint-1500 → checkpoint-3500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70b1a29b3ccb13877c06b9c50bf20c54e7d085e260a305e3376c872a9cfa9e2e
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0454cb45818aca52487c033cfff5471ad7a3bbe0b013a07ead41acb7b4a1942d
3
  size 1134425553
{checkpoint-1500 → checkpoint-3500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8c587b97653ca2e1fe2cda77f5e5c4a3c7a1593d3d2f35db0d2ca4e7933179f
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a90e565ec1ab563c341221b882d443636296fc51d1146f3693fa6818dc5ec762
3
  size 14575
{checkpoint-1500 → checkpoint-3500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c2561ef8d03a8a364e3db0bdeeef0d1ebf7cf016b7859262ac8c8947d6e8539
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c38e23af2776207a290160225119b128d6a33e614e6a29f1b7b09e1994694f4
3
  size 557
{checkpoint-2500 → checkpoint-3500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36e6282265457b125586a29b2d41aff2b5860b72c24a97a3146a6d4661533245
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68e5c2c2b17e96e3a127df56a8de776ff834bfeacb361f5e48bcd5d1f4f76195
3
  size 627
{checkpoint-2500 → checkpoint-3500}/special_tokens_map.json RENAMED
File without changes
{checkpoint-2500 → checkpoint-3500}/tokenizer.json RENAMED
File without changes
{checkpoint-2500 → checkpoint-3500}/tokenizer_config.json RENAMED
File without changes
{checkpoint-1500 → checkpoint-3500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.8311511798105226,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-1000",
4
- "epoch": 0.6231823847112589,
5
- "global_step": 1500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -60,11 +60,83 @@
60
  "eval_samples_per_second": 59.285,
61
  "eval_steps_per_second": 3.727,
62
  "step": 1500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
  "max_steps": 12035,
66
  "num_train_epochs": 5,
67
- "total_flos": 2503550149632000.0,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
 
1
  {
2
+ "best_metric": 0.8337166846278812,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-2000",
4
+ "epoch": 1.4540922309929374,
5
+ "global_step": 3500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
60
  "eval_samples_per_second": 59.285,
61
  "eval_steps_per_second": 3.727,
62
  "step": 1500
63
+ },
64
+ {
65
+ "epoch": 0.83,
66
+ "learning_rate": 4.171582883257167e-05,
67
+ "loss": 0.3361,
68
+ "step": 2000
69
+ },
70
+ {
71
+ "epoch": 0.83,
72
+ "eval_accuracy": 0.8337166846278812,
73
+ "eval_f1": 0.8337166846278812,
74
+ "eval_loss": 0.6990912556648254,
75
+ "eval_precision": 0.8337166846278812,
76
+ "eval_recall": 0.8337166846278812,
77
+ "eval_runtime": 38.6559,
78
+ "eval_samples_per_second": 53.084,
79
+ "eval_steps_per_second": 3.337,
80
+ "step": 2000
81
+ },
82
+ {
83
+ "epoch": 1.04,
84
+ "learning_rate": 3.964270876609888e-05,
85
+ "loss": 0.2784,
86
+ "step": 2500
87
+ },
88
+ {
89
+ "epoch": 1.04,
90
+ "eval_accuracy": 0.8119380418523106,
91
+ "eval_f1": 0.8119380418523107,
92
+ "eval_loss": 0.7512525320053101,
93
+ "eval_precision": 0.8119380418523106,
94
+ "eval_recall": 0.8119380418523106,
95
+ "eval_runtime": 33.6314,
96
+ "eval_samples_per_second": 61.014,
97
+ "eval_steps_per_second": 3.836,
98
+ "step": 2500
99
+ },
100
+ {
101
+ "epoch": 1.25,
102
+ "learning_rate": 3.756543415039468e-05,
103
+ "loss": 0.2377,
104
+ "step": 3000
105
+ },
106
+ {
107
+ "epoch": 1.25,
108
+ "eval_accuracy": 0.8165945537308391,
109
+ "eval_f1": 0.8165945537308391,
110
+ "eval_loss": 0.9047627449035645,
111
+ "eval_precision": 0.8165945537308391,
112
+ "eval_recall": 0.8165945537308391,
113
+ "eval_runtime": 39.8436,
114
+ "eval_samples_per_second": 51.501,
115
+ "eval_steps_per_second": 3.238,
116
+ "step": 3000
117
+ },
118
+ {
119
+ "epoch": 1.45,
120
+ "learning_rate": 3.548815953469049e-05,
121
+ "loss": 0.2401,
122
+ "step": 3500
123
+ },
124
+ {
125
+ "epoch": 1.45,
126
+ "eval_accuracy": 0.7939071271171446,
127
+ "eval_f1": 0.7939071271171445,
128
+ "eval_loss": 1.241086721420288,
129
+ "eval_precision": 0.7939071271171446,
130
+ "eval_recall": 0.7939071271171446,
131
+ "eval_runtime": 34.8048,
132
+ "eval_samples_per_second": 58.957,
133
+ "eval_steps_per_second": 3.706,
134
+ "step": 3500
135
  }
136
  ],
137
  "max_steps": 12035,
138
  "num_train_epochs": 5,
139
+ "total_flos": 5840156611554048.0,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
{checkpoint-2500 → checkpoint-3500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a13afdc894a855563bdc308de94030cb3ee880f8e35ef0b0686b90e4be049c5
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0454cb45818aca52487c033cfff5471ad7a3bbe0b013a07ead41acb7b4a1942d
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f05a519a608fafd274f915fc85bdff10be90a22cf289b452daf5700ae30a1f1
3
- size 7774
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcf52f75b3c858901dfc7c486fc00d7c6bc29f1aed5cd11073e2774f11b78b82
3
+ size 9032