pierreguillou committed on
Commit
b081990
•
1 Parent(s): dbd4532

Training in progress, step 7500

Browse files
Files changed (24) hide show
  1. {checkpoint-5500 → checkpoint-7000}/config.json +0 -0
  2. {checkpoint-5500 → checkpoint-7000}/optimizer.pt +1 -1
  3. {checkpoint-6500 → checkpoint-7000}/pytorch_model.bin +1 -1
  4. {checkpoint-6500 → checkpoint-7000}/rng_state.pth +1 -1
  5. {checkpoint-6500 → checkpoint-7000}/scaler.pt +1 -1
  6. {checkpoint-5500 → checkpoint-7000}/scheduler.pt +1 -1
  7. {checkpoint-5500 → checkpoint-7000}/special_tokens_map.json +0 -0
  8. {checkpoint-5500 → checkpoint-7000}/tokenizer.json +0 -0
  9. {checkpoint-5500 → checkpoint-7000}/tokenizer_config.json +0 -0
  10. {checkpoint-6500 → checkpoint-7000}/trainer_state.json +21 -3
  11. {checkpoint-5500 → checkpoint-7000}/training_args.bin +0 -0
  12. {checkpoint-6500 → checkpoint-7500}/config.json +0 -0
  13. {checkpoint-6500 → checkpoint-7500}/optimizer.pt +1 -1
  14. {checkpoint-5500 → checkpoint-7500}/pytorch_model.bin +1 -1
  15. {checkpoint-5500 → checkpoint-7500}/rng_state.pth +1 -1
  16. {checkpoint-5500 → checkpoint-7500}/scaler.pt +1 -1
  17. {checkpoint-6500 → checkpoint-7500}/scheduler.pt +1 -1
  18. {checkpoint-6500 → checkpoint-7500}/special_tokens_map.json +0 -0
  19. {checkpoint-6500 → checkpoint-7500}/tokenizer.json +0 -0
  20. {checkpoint-6500 → checkpoint-7500}/tokenizer_config.json +0 -0
  21. {checkpoint-5500 → checkpoint-7500}/trainer_state.json +77 -5
  22. {checkpoint-6500 → checkpoint-7500}/training_args.bin +0 -0
  23. pytorch_model.bin +1 -1
  24. runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-5500 → checkpoint-7000}/config.json RENAMED
File without changes
{checkpoint-5500 → checkpoint-7000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d3a74874f53beb0dd61e7742a119b65b3a7c6efdfcf021d79679adb8f4e296d
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9c6f5f525ee9bbad8e4c2914bb464706b90024fc72ec20e2cf61404fcbbae79
3
  size 2265828101
{checkpoint-6500 → checkpoint-7000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b28f1b03749d0fbb9870ea45989658c662220d5ce43d7aa82a871d99139334fa
3
  size 1134425553
{checkpoint-6500 → checkpoint-7000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2155603d2a90e6f05afc18565c0a7971b5a33e500179dd735d7729ffabd71cf8
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7be49988c0b55da3ad61eade275963315f89474e302a1ef659f269c6b2dd2ef4
3
  size 14575
{checkpoint-6500 → checkpoint-7000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8eec39e20dd1d19e75d63c9ea6180a447b93a16fe8c240630ce7a3dddde70b3a
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bc9b0718f152aae5e6bdba42771601266a9b8e0b992ecafee7d56cf889e09f7
3
  size 557
{checkpoint-5500 → checkpoint-7000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96574ab09e5e2e54af42547122334b19c9d0414475ddd65dd2890b9b6e6b7def
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f037e582d30bae872bb40f11a54323c3c3de9a9b56a3fbc16559292c4bb4ad4
3
  size 627
{checkpoint-5500 → checkpoint-7000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-5500 → checkpoint-7000}/tokenizer.json RENAMED
File without changes
{checkpoint-5500 → checkpoint-7000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-6500 → checkpoint-7000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8573209374145502,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
4
- "epoch": 2.700457000415455,
5
- "global_step": 6500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -240,11 +240,29 @@
240
  "eval_samples_per_second": 59.215,
241
  "eval_steps_per_second": 3.723,
242
  "step": 6500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
243
  }
244
  ],
245
  "max_steps": 12035,
246
  "num_train_epochs": 5,
247
- "total_flos": 1.0845796506564096e+16,
248
  "trial_name": null,
249
  "trial_params": null
250
  }
 
1
  {
2
  "best_metric": 0.8573209374145502,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
4
+ "epoch": 2.9081844619858748,
5
+ "global_step": 7000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
240
  "eval_samples_per_second": 59.215,
241
  "eval_steps_per_second": 3.723,
242
  "step": 6500
243
+ },
244
+ {
245
+ "epoch": 2.91,
246
+ "learning_rate": 2.0947237224761117e-05,
247
+ "loss": 0.1239,
248
+ "step": 7000
249
+ },
250
+ {
251
+ "epoch": 2.91,
252
+ "eval_accuracy": 0.8189268308375287,
253
+ "eval_f1": 0.8189268308375287,
254
+ "eval_loss": 1.1430405378341675,
255
+ "eval_precision": 0.8189268308375287,
256
+ "eval_recall": 0.8189268308375287,
257
+ "eval_runtime": 39.4751,
258
+ "eval_samples_per_second": 51.982,
259
+ "eval_steps_per_second": 3.268,
260
+ "step": 7000
261
  }
262
  ],
263
  "max_steps": 12035,
264
  "num_train_epochs": 5,
265
+ "total_flos": 1.1680313223108096e+16,
266
  "trial_name": null,
267
  "trial_params": null
268
  }
{checkpoint-5500 → checkpoint-7000}/training_args.bin RENAMED
File without changes
{checkpoint-6500 → checkpoint-7500}/config.json RENAMED
File without changes
{checkpoint-6500 → checkpoint-7500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:363b00981239b12adf86f779858e84efae5e7df9ed3d90c59b318b8b8fd859b0
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82387df7e7125fbeaaffcea1ea9067f548395eae05b211d472b47a2692c68cec
3
  size 2265828101
{checkpoint-5500 → checkpoint-7500}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ad5877b0b97895626b7a47603fd8c76c7a1dcb7f8da77da732de52ebd6fe498
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c9961a421ba331f30b142fb3b0509e93e9e2f8d62f1c4981f37ce14a397e8a
3
  size 1134425553
{checkpoint-5500 → checkpoint-7500}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4b2654002f35c8d69a538e102e8376633570a6ea9bfd4a14b35a0f1a0043945
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f76f5d5cccc05cff73afe76fd9886e0c5c108c8cd2440a0dd4326a8f801030d2
3
  size 14575
{checkpoint-5500 → checkpoint-7500}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:609eb953721cf5cce74da27a7bae781c2bfe011d3b35b8e9f9b5692c47839041
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ece5e78a472a3b76204d2622fb05fcfd484df75b22422832aa6c9030f03d7149
3
  size 557
{checkpoint-6500 → checkpoint-7500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9d8fc4d7b4bac08d88a4d03d2daffd167bc9d42006a1ae8f011989b8eedebcd
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1130cd316ba76c991772afe19f88717c71deab99e54ae54e3828ee796771bf
3
  size 627
{checkpoint-6500 → checkpoint-7500}/special_tokens_map.json RENAMED
File without changes
{checkpoint-6500 → checkpoint-7500}/tokenizer.json RENAMED
File without changes
{checkpoint-6500 → checkpoint-7500}/tokenizer_config.json RENAMED
File without changes
{checkpoint-5500 → checkpoint-7500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.8489327821653182,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-5500",
4
- "epoch": 2.2850020772746156,
5
- "global_step": 5500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -204,11 +204,83 @@
204
  "eval_samples_per_second": 61.114,
205
  "eval_steps_per_second": 3.842,
206
  "step": 5500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
207
  }
208
  ],
209
  "max_steps": 12035,
210
  "num_train_epochs": 5,
211
- "total_flos": 9176763073476096.0,
212
  "trial_name": null,
213
  "trial_params": null
214
  }
 
1
  {
2
+ "best_metric": 0.8573209374145502,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
4
+ "epoch": 3.115911923556294,
5
+ "global_step": 7500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
204
  "eval_samples_per_second": 61.114,
205
  "eval_steps_per_second": 3.842,
206
  "step": 5500
207
+ },
208
+ {
209
+ "epoch": 2.49,
210
+ "learning_rate": 2.5101786456169508e-05,
211
+ "loss": 0.134,
212
+ "step": 6000
213
+ },
214
+ {
215
+ "epoch": 2.49,
216
+ "eval_accuracy": 0.8573209374145502,
217
+ "eval_f1": 0.8573209374145502,
218
+ "eval_loss": 0.7681939005851746,
219
+ "eval_precision": 0.8573209374145502,
220
+ "eval_recall": 0.8573209374145502,
221
+ "eval_runtime": 39.5768,
222
+ "eval_samples_per_second": 51.849,
223
+ "eval_steps_per_second": 3.259,
224
+ "step": 6000
225
+ },
226
+ {
227
+ "epoch": 2.7,
228
+ "learning_rate": 2.302451184046531e-05,
229
+ "loss": 0.1354,
230
+ "step": 6500
231
+ },
232
+ {
233
+ "epoch": 2.7,
234
+ "eval_accuracy": 0.8255697994241689,
235
+ "eval_f1": 0.8255697994241689,
236
+ "eval_loss": 0.9870807528495789,
237
+ "eval_precision": 0.8255697994241689,
238
+ "eval_recall": 0.8255697994241689,
239
+ "eval_runtime": 34.6532,
240
+ "eval_samples_per_second": 59.215,
241
+ "eval_steps_per_second": 3.723,
242
+ "step": 6500
243
+ },
244
+ {
245
+ "epoch": 2.91,
246
+ "learning_rate": 2.0947237224761117e-05,
247
+ "loss": 0.1239,
248
+ "step": 7000
249
+ },
250
+ {
251
+ "epoch": 2.91,
252
+ "eval_accuracy": 0.8189268308375287,
253
+ "eval_f1": 0.8189268308375287,
254
+ "eval_loss": 1.1430405378341675,
255
+ "eval_precision": 0.8189268308375287,
256
+ "eval_recall": 0.8189268308375287,
257
+ "eval_runtime": 39.4751,
258
+ "eval_samples_per_second": 51.982,
259
+ "eval_steps_per_second": 3.268,
260
+ "step": 7000
261
+ },
262
+ {
263
+ "epoch": 3.12,
264
+ "learning_rate": 1.886996260905692e-05,
265
+ "loss": 0.1012,
266
+ "step": 7500
267
+ },
268
+ {
269
+ "epoch": 3.12,
270
+ "eval_accuracy": 0.8385581702079747,
271
+ "eval_f1": 0.8385581702079747,
272
+ "eval_loss": 0.8271787166595459,
273
+ "eval_precision": 0.8385581702079747,
274
+ "eval_recall": 0.8385581702079747,
275
+ "eval_runtime": 33.307,
276
+ "eval_samples_per_second": 61.609,
277
+ "eval_steps_per_second": 3.873,
278
+ "step": 7500
279
  }
280
  ],
281
  "max_steps": 12035,
282
  "num_train_epochs": 5,
283
+ "total_flos": 1.2513369535398144e+16,
284
  "trial_name": null,
285
  "trial_params": null
286
  }
{checkpoint-6500 → checkpoint-7500}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c5ee445768534ea29279d89b14a0f720766edc05f5f4988ee819d7fd74f6c91
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c9961a421ba331f30b142fb3b0509e93e9e2f8d62f1c4981f37ce14a397e8a
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fe49282ece83f2b951a8a5e3ecb00a72d560e9d3422709897756658604d5989
3
- size 12806
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60237bfbe8c03c8322ddb9053845170fc6b1ec849653dbcca5e58f121abad57e
3
+ size 14064