pierreguillou committed on
Commit
0a6fb58
•
1 Parent(s): 27433f3

Training in progress, step 1300

Browse files
Files changed (24) hide show
  1. {checkpoint-700 → checkpoint-1200}/config.json +0 -0
  2. {checkpoint-700 → checkpoint-1200}/optimizer.pt +1 -1
  3. {checkpoint-800 → checkpoint-1200}/pytorch_model.bin +1 -1
  4. {checkpoint-800 → checkpoint-1200}/rng_state.pth +1 -1
  5. {checkpoint-800 → checkpoint-1200}/scaler.pt +1 -1
  6. {checkpoint-700 → checkpoint-1200}/scheduler.pt +1 -1
  7. {checkpoint-700 → checkpoint-1200}/special_tokens_map.json +0 -0
  8. {checkpoint-700 → checkpoint-1200}/tokenizer.json +0 -0
  9. {checkpoint-700 → checkpoint-1200}/tokenizer_config.json +0 -0
  10. {checkpoint-800 → checkpoint-1200}/trainer_state.json +57 -3
  11. {checkpoint-700 → checkpoint-1200}/training_args.bin +0 -0
  12. {checkpoint-800 → checkpoint-1300}/config.json +0 -0
  13. {checkpoint-800 → checkpoint-1300}/optimizer.pt +1 -1
  14. {checkpoint-700 → checkpoint-1300}/pytorch_model.bin +1 -1
  15. {checkpoint-700 → checkpoint-1300}/rng_state.pth +1 -1
  16. {checkpoint-700 → checkpoint-1300}/scaler.pt +1 -1
  17. {checkpoint-800 → checkpoint-1300}/scheduler.pt +1 -1
  18. {checkpoint-800 → checkpoint-1300}/special_tokens_map.json +0 -0
  19. {checkpoint-800 → checkpoint-1300}/tokenizer.json +0 -0
  20. {checkpoint-800 → checkpoint-1300}/tokenizer_config.json +0 -0
  21. {checkpoint-700 → checkpoint-1300}/trainer_state.json +81 -3
  22. {checkpoint-800 → checkpoint-1300}/training_args.bin +0 -0
  23. pytorch_model.bin +1 -1
  24. runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0 +2 -2
{checkpoint-700 → checkpoint-1200}/config.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1200}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e3fe13c1ea3aa84e754ff7abe68da7eec60a7e1dc2e5dfc4a93ad1d3f636fa3
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:280a221cc64b57effe5c7a796f38b48321fed8fcb3ff1e239c462a69ff81116c
3
  size 2265828101
{checkpoint-800 → checkpoint-1200}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8126932772d64c007aa46752a8678869bff8e31fb1d734f060c2aef68f5b5c3
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:129796804ce986931f94bfed0dab6f25dddc2e97c3a332294d4f52bf3528c96a
3
  size 1134425553
{checkpoint-800 → checkpoint-1200}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64c8402a2a8dcf25bb022948010e12c766380abe6897e4ffad7784a45553b860
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd6ffa5eb17c8d65486aa60854f05719c6a9abb0d32d2839b3ba42058bd6991d
3
  size 14575
{checkpoint-800 → checkpoint-1200}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d15232b452895e36dc91e0446f6e8ef9af073f8677f732bb005840a10ca7266
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b74d76706ac346849ec903aa334b83db05c630c620b87dcbe1a7b129aecd1c1
3
  size 557
{checkpoint-700 → checkpoint-1200}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec7fcec2c61a14f594e0c95f40c28d94feca9810fd5de97d1910aa5fc27619dd
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a2c927b05979c18fd3e62e50ba927b4a9c741248dda26234d8cd08f20d64a8
3
  size 627
{checkpoint-700 → checkpoint-1200}/special_tokens_map.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1200}/tokenizer.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1200}/tokenizer_config.json RENAMED
File without changes
{checkpoint-800 → checkpoint-1200}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.885723696687195,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
4
- "epoch": 0.42643923240938164,
5
- "global_step": 800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -108,11 +108,65 @@
108
  "eval_samples_per_second": 35.233,
109
  "eval_steps_per_second": 2.214,
110
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  }
112
  ],
113
  "max_steps": 1876,
114
  "num_train_epochs": 1,
115
- "total_flos": 1780302328627200.0,
116
  "trial_name": null,
117
  "trial_params": null
118
  }
 
1
  {
2
  "best_metric": 0.885723696687195,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
4
+ "epoch": 0.6396588486140725,
5
+ "global_step": 1200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
108
  "eval_samples_per_second": 35.233,
109
  "eval_steps_per_second": 2.214,
110
  "step": 800
111
+ },
112
+ {
113
+ "epoch": 0.48,
114
+ "eval_accuracy": 0.8833980456546259,
115
+ "eval_f1": 0.8833980456546259,
116
+ "eval_loss": 0.38389313220977783,
117
+ "eval_precision": 0.8833980456546259,
118
+ "eval_recall": 0.8833980456546259,
119
+ "eval_runtime": 47.6493,
120
+ "eval_samples_per_second": 33.726,
121
+ "eval_steps_per_second": 2.12,
122
+ "step": 900
123
+ },
124
+ {
125
+ "epoch": 0.53,
126
+ "learning_rate": 9.381663113006397e-06,
127
+ "loss": 0.4464,
128
+ "step": 1000
129
+ },
130
+ {
131
+ "epoch": 0.53,
132
+ "eval_accuracy": 0.8498407977082855,
133
+ "eval_f1": 0.8498407977082856,
134
+ "eval_loss": 0.4365050792694092,
135
+ "eval_precision": 0.8498407977082855,
136
+ "eval_recall": 0.8498407977082855,
137
+ "eval_runtime": 47.0078,
138
+ "eval_samples_per_second": 34.186,
139
+ "eval_steps_per_second": 2.149,
140
+ "step": 1000
141
+ },
142
+ {
143
+ "epoch": 0.59,
144
+ "eval_accuracy": 0.8811622266361904,
145
+ "eval_f1": 0.8811622266361904,
146
+ "eval_loss": 0.36158204078674316,
147
+ "eval_precision": 0.8811622266361904,
148
+ "eval_recall": 0.8811622266361904,
149
+ "eval_runtime": 44.8724,
150
+ "eval_samples_per_second": 35.813,
151
+ "eval_steps_per_second": 2.251,
152
+ "step": 1100
153
+ },
154
+ {
155
+ "epoch": 0.64,
156
+ "eval_accuracy": 0.8795751943864972,
157
+ "eval_f1": 0.8795751943864972,
158
+ "eval_loss": 0.3948919177055359,
159
+ "eval_precision": 0.8795751943864972,
160
+ "eval_recall": 0.8795751943864972,
161
+ "eval_runtime": 45.1224,
162
+ "eval_samples_per_second": 35.614,
163
+ "eval_steps_per_second": 2.238,
164
+ "step": 1200
165
  }
166
  ],
167
  "max_steps": 1876,
168
  "num_train_epochs": 1,
169
+ "total_flos": 2670453492940800.0,
170
  "trial_name": null,
171
  "trial_params": null
172
  }
{checkpoint-700 → checkpoint-1200}/training_args.bin RENAMED
File without changes
{checkpoint-800 → checkpoint-1300}/config.json RENAMED
File without changes
{checkpoint-800 → checkpoint-1300}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5927a29acc1b827e5e81631185eaee6608e45cc4c08f5547e015207b8c3e1f36
3
  size 2265828101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c08cf141a111f37d0566da69d0c30d72707ecd26196f04456a9b2121b4d97d3
3
  size 2265828101
{checkpoint-700 → checkpoint-1300}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfe775f2f5e3266c5d9bceb93d7b7d60750dc69b67a1bed6e77aa7d295da49d0
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d4698a9bcd9f4d1b85cd29935ce42f4264d331bc9713045308140215396cd2e
3
  size 1134425553
{checkpoint-700 → checkpoint-1300}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96a57174e6d28245887299f8c18770addda0c495bdadadc4f17326f19f3cdd79
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55d131675f12693ae085c3c3a36adf556143b9deea694fe5308eef74c5dc9628
3
  size 14575
{checkpoint-700 → checkpoint-1300}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55749a54a2c0aac733a45a67ee5b21dbfaa7cb45a667adecbc1609b113af0b09
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7a31e9f5bbee16af877be66fd13ae4491e1f0e57f209ceef7ac824ca84139d
3
  size 557
{checkpoint-800 → checkpoint-1300}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:965edcc2ade2296ca06465ca794bdd6e45524f6fe975b06d7cc6014955adf226
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:893ff4c60fcbf7662c0d4334e0bfce704fb88be1f6c471b5adc0626650efe85d
3
  size 627
{checkpoint-800 → checkpoint-1300}/special_tokens_map.json RENAMED
File without changes
{checkpoint-800 → checkpoint-1300}/tokenizer.json RENAMED
File without changes
{checkpoint-800 → checkpoint-1300}/tokenizer_config.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1300}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.885723696687195,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
4
- "epoch": 0.373134328358209,
5
- "global_step": 700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -96,11 +96,89 @@
96
  "eval_samples_per_second": 35.056,
97
  "eval_steps_per_second": 2.203,
98
  "step": 700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  }
100
  ],
101
  "max_steps": 1876,
102
  "num_train_epochs": 1,
103
- "total_flos": 1557764537548800.0,
104
  "trial_name": null,
105
  "trial_params": null
106
  }
 
1
  {
2
  "best_metric": 0.885723696687195,
3
  "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
4
+ "epoch": 0.6929637526652452,
5
+ "global_step": 1300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
96
  "eval_samples_per_second": 35.056,
97
  "eval_steps_per_second": 2.203,
98
  "step": 700
99
+ },
100
+ {
101
+ "epoch": 0.43,
102
+ "eval_accuracy": 0.8528252168445007,
103
+ "eval_f1": 0.8528252168445007,
104
+ "eval_loss": 0.44917240738868713,
105
+ "eval_precision": 0.8528252168445007,
106
+ "eval_recall": 0.8528252168445007,
107
+ "eval_runtime": 45.6102,
108
+ "eval_samples_per_second": 35.233,
109
+ "eval_steps_per_second": 2.214,
110
+ "step": 800
111
+ },
112
+ {
113
+ "epoch": 0.48,
114
+ "eval_accuracy": 0.8833980456546259,
115
+ "eval_f1": 0.8833980456546259,
116
+ "eval_loss": 0.38389313220977783,
117
+ "eval_precision": 0.8833980456546259,
118
+ "eval_recall": 0.8833980456546259,
119
+ "eval_runtime": 47.6493,
120
+ "eval_samples_per_second": 33.726,
121
+ "eval_steps_per_second": 2.12,
122
+ "step": 900
123
+ },
124
+ {
125
+ "epoch": 0.53,
126
+ "learning_rate": 9.381663113006397e-06,
127
+ "loss": 0.4464,
128
+ "step": 1000
129
+ },
130
+ {
131
+ "epoch": 0.53,
132
+ "eval_accuracy": 0.8498407977082855,
133
+ "eval_f1": 0.8498407977082856,
134
+ "eval_loss": 0.4365050792694092,
135
+ "eval_precision": 0.8498407977082855,
136
+ "eval_recall": 0.8498407977082855,
137
+ "eval_runtime": 47.0078,
138
+ "eval_samples_per_second": 34.186,
139
+ "eval_steps_per_second": 2.149,
140
+ "step": 1000
141
+ },
142
+ {
143
+ "epoch": 0.59,
144
+ "eval_accuracy": 0.8811622266361904,
145
+ "eval_f1": 0.8811622266361904,
146
+ "eval_loss": 0.36158204078674316,
147
+ "eval_precision": 0.8811622266361904,
148
+ "eval_recall": 0.8811622266361904,
149
+ "eval_runtime": 44.8724,
150
+ "eval_samples_per_second": 35.813,
151
+ "eval_steps_per_second": 2.251,
152
+ "step": 1100
153
+ },
154
+ {
155
+ "epoch": 0.64,
156
+ "eval_accuracy": 0.8795751943864972,
157
+ "eval_f1": 0.8795751943864972,
158
+ "eval_loss": 0.3948919177055359,
159
+ "eval_precision": 0.8795751943864972,
160
+ "eval_recall": 0.8795751943864972,
161
+ "eval_runtime": 45.1224,
162
+ "eval_samples_per_second": 35.614,
163
+ "eval_steps_per_second": 2.238,
164
+ "step": 1200
165
+ },
166
+ {
167
+ "epoch": 0.69,
168
+ "eval_accuracy": 0.8612794075079601,
169
+ "eval_f1": 0.8612794075079601,
170
+ "eval_loss": 0.41840043663978577,
171
+ "eval_precision": 0.8612794075079601,
172
+ "eval_recall": 0.8612794075079601,
173
+ "eval_runtime": 39.7377,
174
+ "eval_samples_per_second": 40.44,
175
+ "eval_steps_per_second": 2.542,
176
+ "step": 1300
177
  }
178
  ],
179
  "max_steps": 1876,
180
  "num_train_epochs": 1,
181
+ "total_flos": 2892991284019200.0,
182
  "trial_name": null,
183
  "trial_params": null
184
  }
{checkpoint-800 → checkpoint-1300}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8126932772d64c007aa46752a8678869bff8e31fb1d734f060c2aef68f5b5c3
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d4698a9bcd9f4d1b85cd29935ce42f4264d331bc9713045308140215396cd2e
3
  size 1134425553
runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97dbcb650d21eb583ff331584d595df99b7abe792fa93031ec793779393434c8
3
- size 8597
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aec79be76242a342cf813e35be39731a4cf8ff91fe61776b977f2529b2fa0e92
3
+ size 11114