pierreguillou committed on
Commit
dbd4532
•
1 Parent(s): a00a34d

Training in progress, step 6500

Browse files
Files changed (24) hide show
  1. {checkpoint-4500 → checkpoint-6000}/config.json +0 -0
  2. {checkpoint-4500 → checkpoint-6000}/optimizer.pt +1 -1
  3. {checkpoint-5000 → checkpoint-6000}/pytorch_model.bin +1 -1
  4. {checkpoint-5000 → checkpoint-6000}/rng_state.pth +1 -1
  5. {checkpoint-5000 → checkpoint-6000}/scaler.pt +1 -1
  6. {checkpoint-4500 → checkpoint-6000}/scheduler.pt +1 -1
  7. {checkpoint-4500 → checkpoint-6000}/special_tokens_map.json +0 -0
  8. {checkpoint-4500 → checkpoint-6000}/tokenizer.json +0 -0
  9. {checkpoint-4500 → checkpoint-6000}/tokenizer_config.json +0 -0
  10. {checkpoint-5000 → checkpoint-6000}/trainer_state.json +41 -5
  11. {checkpoint-4500 → checkpoint-6000}/training_args.bin +0 -0
  12. {checkpoint-5000 → checkpoint-6500}/config.json +0 -0
  13. {checkpoint-5000 → checkpoint-6500}/optimizer.pt +1 -1
  14. {checkpoint-4500 → checkpoint-6500}/pytorch_model.bin +1 -1
  15. {checkpoint-4500 → checkpoint-6500}/rng_state.pth +1 -1
  16. {checkpoint-4500 → checkpoint-6500}/scaler.pt +1 -1
  17. {checkpoint-5000 → checkpoint-6500}/scheduler.pt +1 -1
  18. {checkpoint-5000 → checkpoint-6500}/special_tokens_map.json +0 -0
  19. {checkpoint-5000 → checkpoint-6500}/tokenizer.json +0 -0
  20. {checkpoint-5000 → checkpoint-6500}/tokenizer_config.json +0 -0
  21. {checkpoint-4500 → checkpoint-6500}/trainer_state.json +77 -5
  22. {checkpoint-5000 → checkpoint-6500}/training_args.bin +0 -0
  23. pytorch_model.bin +1 -1
  24. runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-4500 → checkpoint-6000}/config.json RENAMED
File without changes
{checkpoint-4500 → checkpoint-6000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c2f998a9b6f8369b53c91c97453360581cf5031214c0a4ec6ae85ecea3372b2
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ccab808598cafaa3502eaf827acb795d751b863043a68024a8ebc252765dda
3
  size 2265828101
{checkpoint-5000 → checkpoint-6000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:826a115bd1f49a5fd6ad8834ab59356109e291dab9ee2ebf7e7079622823f521
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9effd102ed93d81722319ca88162190926ca77de0e9c79bcdf05fedc7571c41
3
  size 1134425553
{checkpoint-5000 → checkpoint-6000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:322213ce84acef97a1d009f4a95470d562524fe104f583c777a9886789ed90a6
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33f25f963833bb60f4e565ecbfcbf34d003c383bcd545a16637c61002e2435ad
3
  size 14575
{checkpoint-5000 → checkpoint-6000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d521e0e6865aafff22fef97e6b783e4fcbd42a34dedc30bf0c2f849637dfbde6
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06535ee946097fce21c4464212b93d33310a3a654d4286c652849b57cf50a7f8
3
  size 557
{checkpoint-4500 → checkpoint-6000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82119bc6700e4fbce2c931750dd7da685db2db7703ad686612f7d1a894483990
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72f3b66da2277cfe6e060fe737d382a511cc283da3a6c66c08f0ac5f7793cfb9
3
  size 627
{checkpoint-4500 → checkpoint-6000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-4500 → checkpoint-6000}/tokenizer.json RENAMED
File without changes
{checkpoint-4500 → checkpoint-6000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.842474787280243,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-4500",
4
- "epoch": 2.077274615704196,
5
- "global_step": 5000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -186,11 +186,47 @@
186
  "eval_samples_per_second": 53.645,
187
  "eval_steps_per_second": 3.372,
188
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
189
  }
190
  ],
191
  "max_steps": 12035,
192
  "num_train_epochs": 5,
193
- "total_flos": 8342246356932096.0,
194
  "trial_name": null,
195
  "trial_params": null
196
  }
 
1
  {
2
+ "best_metric": 0.8573209374145502,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
4
+ "epoch": 2.4927295388450355,
5
+ "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
186
  "eval_samples_per_second": 53.645,
187
  "eval_steps_per_second": 3.372,
188
  "step": 5000
189
+ },
190
+ {
191
+ "epoch": 2.29,
192
+ "learning_rate": 2.7179061071873702e-05,
193
+ "loss": 0.1294,
194
+ "step": 5500
195
+ },
196
+ {
197
+ "epoch": 2.29,
198
+ "eval_accuracy": 0.8489327821653182,
199
+ "eval_f1": 0.8489327821653182,
200
+ "eval_loss": 0.8485749959945679,
201
+ "eval_precision": 0.8489327821653182,
202
+ "eval_recall": 0.8489327821653182,
203
+ "eval_runtime": 33.5765,
204
+ "eval_samples_per_second": 61.114,
205
+ "eval_steps_per_second": 3.842,
206
+ "step": 5500
207
+ },
208
+ {
209
+ "epoch": 2.49,
210
+ "learning_rate": 2.5101786456169508e-05,
211
+ "loss": 0.134,
212
+ "step": 6000
213
+ },
214
+ {
215
+ "epoch": 2.49,
216
+ "eval_accuracy": 0.8573209374145502,
217
+ "eval_f1": 0.8573209374145502,
218
+ "eval_loss": 0.7681939005851746,
219
+ "eval_precision": 0.8573209374145502,
220
+ "eval_recall": 0.8573209374145502,
221
+ "eval_runtime": 39.5768,
222
+ "eval_samples_per_second": 51.849,
223
+ "eval_steps_per_second": 3.259,
224
+ "step": 6000
225
  }
226
  ],
227
  "max_steps": 12035,
228
  "num_train_epochs": 5,
229
+ "total_flos": 1.0011279790020096e+16,
230
  "trial_name": null,
231
  "trial_params": null
232
  }
{checkpoint-4500 → checkpoint-6000}/training_args.bin RENAMED
File without changes
{checkpoint-5000 → checkpoint-6500}/config.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08b84d52785a38380247450ccf7219098ead85f3af921462c7f9cea34fc457af
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:363b00981239b12adf86f779858e84efae5e7df9ed3d90c59b318b8b8fd859b0
3
  size 2265828101
{checkpoint-4500 → checkpoint-6500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ab31af496b83252a0734273c407717be54e25e7236af6050a2c0755b5a8410e
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
3
  size 1134425553
{checkpoint-4500 → checkpoint-6500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b637499f7564729172f931fb947eca2274013d5c119ca4825529baec3098ba4
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2155603d2a90e6f05afc18565c0a7971b5a33e500179dd735d7729ffabd71cf8
3
  size 14575
{checkpoint-4500 → checkpoint-6500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe7c767111accfefd8c962f6b3f65e0837fac0d4f2fb9b95baf14515e7dae4e1
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eec39e20dd1d19e75d63c9ea6180a447b93a16fe8c240630ce7a3dddde70b3a
3
  size 557
{checkpoint-5000 → checkpoint-6500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edd7471042c806219d2a11bac18a23846c94c3ba80ac0f47d46e260c2e00b6a4
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9d8fc4d7b4bac08d88a4d03d2daffd167bc9d42006a1ae8f011989b8eedebcd
3
  size 627
{checkpoint-5000 → checkpoint-6500}/special_tokens_map.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6500}/tokenizer.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6500}/tokenizer_config.json RENAMED
File without changes
{checkpoint-4500 → checkpoint-6500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.842474787280243,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-4500",
4
- "epoch": 1.8695471541337765,
5
- "global_step": 4500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -168,11 +168,83 @@
168
  "eval_samples_per_second": 58.527,
169
  "eval_steps_per_second": 3.679,
170
  "step": 4500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
171
  }
172
  ],
173
  "max_steps": 12035,
174
  "num_train_epochs": 5,
175
- "total_flos": 7509190044642048.0,
176
  "trial_name": null,
177
  "trial_params": null
178
  }
 
1
  {
2
+ "best_metric": 0.8573209374145502,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
4
+ "epoch": 2.700457000415455,
5
+ "global_step": 6500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
168
  "eval_samples_per_second": 58.527,
169
  "eval_steps_per_second": 3.679,
170
  "step": 4500
171
+ },
172
+ {
173
+ "epoch": 2.08,
174
+ "learning_rate": 2.9256335687577903e-05,
175
+ "loss": 0.1704,
176
+ "step": 5000
177
+ },
178
+ {
179
+ "epoch": 2.08,
180
+ "eval_accuracy": 0.8317543549243216,
181
+ "eval_f1": 0.8317543549243216,
182
+ "eval_loss": 0.856721818447113,
183
+ "eval_precision": 0.8317543549243216,
184
+ "eval_recall": 0.8317543549243216,
185
+ "eval_runtime": 38.2513,
186
+ "eval_samples_per_second": 53.645,
187
+ "eval_steps_per_second": 3.372,
188
+ "step": 5000
189
+ },
190
+ {
191
+ "epoch": 2.29,
192
+ "learning_rate": 2.7179061071873702e-05,
193
+ "loss": 0.1294,
194
+ "step": 5500
195
+ },
196
+ {
197
+ "epoch": 2.29,
198
+ "eval_accuracy": 0.8489327821653182,
199
+ "eval_f1": 0.8489327821653182,
200
+ "eval_loss": 0.8485749959945679,
201
+ "eval_precision": 0.8489327821653182,
202
+ "eval_recall": 0.8489327821653182,
203
+ "eval_runtime": 33.5765,
204
+ "eval_samples_per_second": 61.114,
205
+ "eval_steps_per_second": 3.842,
206
+ "step": 5500
207
+ },
208
+ {
209
+ "epoch": 2.49,
210
+ "learning_rate": 2.5101786456169508e-05,
211
+ "loss": 0.134,
212
+ "step": 6000
213
+ },
214
+ {
215
+ "epoch": 2.49,
216
+ "eval_accuracy": 0.8573209374145502,
217
+ "eval_f1": 0.8573209374145502,
218
+ "eval_loss": 0.7681939005851746,
219
+ "eval_precision": 0.8573209374145502,
220
+ "eval_recall": 0.8573209374145502,
221
+ "eval_runtime": 39.5768,
222
+ "eval_samples_per_second": 51.849,
223
+ "eval_steps_per_second": 3.259,
224
+ "step": 6000
225
+ },
226
+ {
227
+ "epoch": 2.7,
228
+ "learning_rate": 2.302451184046531e-05,
229
+ "loss": 0.1354,
230
+ "step": 6500
231
+ },
232
+ {
233
+ "epoch": 2.7,
234
+ "eval_accuracy": 0.8255697994241689,
235
+ "eval_f1": 0.8255697994241689,
236
+ "eval_loss": 0.9870807528495789,
237
+ "eval_precision": 0.8255697994241689,
238
+ "eval_recall": 0.8255697994241689,
239
+ "eval_runtime": 34.6532,
240
+ "eval_samples_per_second": 59.215,
241
+ "eval_steps_per_second": 3.723,
242
+ "step": 6500
243
  }
244
  ],
245
  "max_steps": 12035,
246
  "num_train_epochs": 5,
247
+ "total_flos": 1.0845796506564096e+16,
248
  "trial_name": null,
249
  "trial_params": null
250
  }
{checkpoint-5000 → checkpoint-6500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ad5877b0b97895626b7a47603fd8c76c7a1dcb7f8da77da732de52ebd6fe498
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4350d0a4bb2974f01fdf48b3f8f7990549e813e56d160d998d704b15030fe2ef
3
- size 11548
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe49282ece83f2b951a8a5e3ecb00a72d560e9d3422709897756658604d5989
3
+ size 12806