pierreguillou committed on
Commit
e1f7461
1 Parent(s): a6276de

Training in progress, step 1500

Browse files
checkpoint-1000/config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nielsr/lilt-xlm-roberta-base",
3
+ "architectures": [
4
+ "LiltForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "channel_shrink_ratio": 4,
9
+ "classifier_dropout": null,
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "Caption",
16
+ "1": "Footnote",
17
+ "2": "Formula",
18
+ "3": "List-item",
19
+ "4": "Page-footer",
20
+ "5": "Page-header",
21
+ "6": "Picture",
22
+ "7": "Section-header",
23
+ "8": "Table",
24
+ "9": "Text",
25
+ "10": "Title"
26
+ },
27
+ "initializer_range": 0.02,
28
+ "intermediate_size": 3072,
29
+ "label2id": {
30
+ "Caption": 0,
31
+ "Footnote": 1,
32
+ "Formula": 2,
33
+ "List-item": 3,
34
+ "Page-footer": 4,
35
+ "Page-header": 5,
36
+ "Picture": 6,
37
+ "Section-header": 7,
38
+ "Table": 8,
39
+ "Text": 9,
40
+ "Title": 10
41
+ },
42
+ "layer_norm_eps": 1e-05,
43
+ "max_2d_position_embeddings": 1024,
44
+ "max_position_embeddings": 514,
45
+ "model_type": "lilt",
46
+ "num_attention_heads": 12,
47
+ "num_hidden_layers": 12,
48
+ "output_past": true,
49
+ "pad_token_id": 1,
50
+ "position_embedding_type": "absolute",
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.26.0",
53
+ "type_vocab_size": 1,
54
+ "use_cache": true,
55
+ "vocab_size": 250002
56
+ }
checkpoint-1000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:850031ce3243a80d3659b496331db88ba7151ffeacf08604ac7171638cef7b44
3
+ size 2265828101
checkpoint-1000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c23af0358fb05f012a6b62f08cda0f0f77800ae18932f19ad494e52ef62d8e
3
+ size 1134425553
checkpoint-1000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b77afc8dc240a230df75727f986b17d934e998fdd9251c9afa1179522f006116
3
+ size 14575
checkpoint-1000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549c363f84648ad8593fc1d45abed2e334ff664013812020536a7e08d3a19ed2
3
+ size 557
checkpoint-1000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcab0ffe66d73213bb723e7ed3816ba449fe7bd0b2f3ceae044473cf432e3783
3
+ size 627
checkpoint-1000/special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
checkpoint-1000/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
3
+ size 17082660
checkpoint-1000/tokenizer_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "__type": "AddedToken",
7
+ "content": "<mask>",
8
+ "lstrip": true,
9
+ "normalized": true,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "model_max_length": 512,
14
+ "name_or_path": "nielsr/lilt-xlm-roberta-base",
15
+ "pad_token": "<pad>",
16
+ "sep_token": "</s>",
17
+ "special_tokens_map_file": null,
18
+ "tokenizer_class": "XLMRobertaTokenizer",
19
+ "unk_token": "<unk>"
20
+ }
checkpoint-1000/trainer_state.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8311511798105226,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-1000",
4
+ "epoch": 0.4154549231408392,
5
+ "global_step": 1000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.21,
12
+ "learning_rate": 4.793934358122144e-05,
13
+ "loss": 0.7223,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.21,
18
+ "eval_accuracy": 0.7741471103890881,
19
+ "eval_f1": 0.7741471103890881,
20
+ "eval_loss": 0.7764509916305542,
21
+ "eval_precision": 0.7741471103890881,
22
+ "eval_recall": 0.7741471103890881,
23
+ "eval_runtime": 33.2902,
24
+ "eval_samples_per_second": 61.64,
25
+ "eval_steps_per_second": 3.875,
26
+ "step": 500
27
+ },
28
+ {
29
+ "epoch": 0.42,
30
+ "learning_rate": 4.5870378063980065e-05,
31
+ "loss": 0.4469,
32
+ "step": 1000
33
+ },
34
+ {
35
+ "epoch": 0.42,
36
+ "eval_accuracy": 0.8311511798105226,
37
+ "eval_f1": 0.8311511798105226,
38
+ "eval_loss": 0.5913723707199097,
39
+ "eval_precision": 0.8311511798105226,
40
+ "eval_recall": 0.8311511798105226,
41
+ "eval_runtime": 37.4699,
42
+ "eval_samples_per_second": 54.764,
43
+ "eval_steps_per_second": 3.443,
44
+ "step": 1000
45
+ }
46
+ ],
47
+ "max_steps": 12035,
48
+ "num_train_epochs": 5,
49
+ "total_flos": 1669033433088000.0,
50
+ "trial_name": null,
51
+ "trial_params": null
52
+ }
checkpoint-1000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b3cb303483efa6f2dc51db1cfb9b16000da398e2d72673041025bfff104b3b8
3
+ size 3643
checkpoint-1500/config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nielsr/lilt-xlm-roberta-base",
3
+ "architectures": [
4
+ "LiltForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "channel_shrink_ratio": 4,
9
+ "classifier_dropout": null,
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "Caption",
16
+ "1": "Footnote",
17
+ "2": "Formula",
18
+ "3": "List-item",
19
+ "4": "Page-footer",
20
+ "5": "Page-header",
21
+ "6": "Picture",
22
+ "7": "Section-header",
23
+ "8": "Table",
24
+ "9": "Text",
25
+ "10": "Title"
26
+ },
27
+ "initializer_range": 0.02,
28
+ "intermediate_size": 3072,
29
+ "label2id": {
30
+ "Caption": 0,
31
+ "Footnote": 1,
32
+ "Formula": 2,
33
+ "List-item": 3,
34
+ "Page-footer": 4,
35
+ "Page-header": 5,
36
+ "Picture": 6,
37
+ "Section-header": 7,
38
+ "Table": 8,
39
+ "Text": 9,
40
+ "Title": 10
41
+ },
42
+ "layer_norm_eps": 1e-05,
43
+ "max_2d_position_embeddings": 1024,
44
+ "max_position_embeddings": 514,
45
+ "model_type": "lilt",
46
+ "num_attention_heads": 12,
47
+ "num_hidden_layers": 12,
48
+ "output_past": true,
49
+ "pad_token_id": 1,
50
+ "position_embedding_type": "absolute",
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.26.0",
53
+ "type_vocab_size": 1,
54
+ "use_cache": true,
55
+ "vocab_size": 250002
56
+ }
checkpoint-1500/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e23364a6999277a663e128d860936666da5c97d392396e7e1bb598c485db3e4c
3
+ size 2265828101
checkpoint-1500/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b1a29b3ccb13877c06b9c50bf20c54e7d085e260a305e3376c872a9cfa9e2e
3
+ size 1134425553
checkpoint-1500/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c587b97653ca2e1fe2cda77f5e5c4a3c7a1593d3d2f35db0d2ca4e7933179f
3
+ size 14575
checkpoint-1500/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c2561ef8d03a8a364e3db0bdeeef0d1ebf7cf016b7859262ac8c8947d6e8539
3
+ size 557
checkpoint-1500/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cb4c24baee1d80158990ceb4f9780c1a6dd6396dffda96df7d63fa2d0ae5653
3
+ size 627
checkpoint-1500/special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
checkpoint-1500/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
3
+ size 17082660
checkpoint-1500/tokenizer_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "__type": "AddedToken",
7
+ "content": "<mask>",
8
+ "lstrip": true,
9
+ "normalized": true,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "model_max_length": 512,
14
+ "name_or_path": "nielsr/lilt-xlm-roberta-base",
15
+ "pad_token": "<pad>",
16
+ "sep_token": "</s>",
17
+ "special_tokens_map_file": null,
18
+ "tokenizer_class": "XLMRobertaTokenizer",
19
+ "unk_token": "<unk>"
20
+ }
checkpoint-1500/trainer_state.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8311511798105226,
3
+ "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-1000",
4
+ "epoch": 0.6231823847112589,
5
+ "global_step": 1500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.21,
12
+ "learning_rate": 4.793934358122144e-05,
13
+ "loss": 0.7223,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.21,
18
+ "eval_accuracy": 0.7741471103890881,
19
+ "eval_f1": 0.7741471103890881,
20
+ "eval_loss": 0.7764509916305542,
21
+ "eval_precision": 0.7741471103890881,
22
+ "eval_recall": 0.7741471103890881,
23
+ "eval_runtime": 33.2902,
24
+ "eval_samples_per_second": 61.64,
25
+ "eval_steps_per_second": 3.875,
26
+ "step": 500
27
+ },
28
+ {
29
+ "epoch": 0.42,
30
+ "learning_rate": 4.5870378063980065e-05,
31
+ "loss": 0.4469,
32
+ "step": 1000
33
+ },
34
+ {
35
+ "epoch": 0.42,
36
+ "eval_accuracy": 0.8311511798105226,
37
+ "eval_f1": 0.8311511798105226,
38
+ "eval_loss": 0.5913723707199097,
39
+ "eval_precision": 0.8311511798105226,
40
+ "eval_recall": 0.8311511798105226,
41
+ "eval_runtime": 37.4699,
42
+ "eval_samples_per_second": 54.764,
43
+ "eval_steps_per_second": 3.443,
44
+ "step": 1000
45
+ },
46
+ {
47
+ "epoch": 0.62,
48
+ "learning_rate": 4.3793103448275864e-05,
49
+ "loss": 0.3819,
50
+ "step": 1500
51
+ },
52
+ {
53
+ "epoch": 0.62,
54
+ "eval_accuracy": 0.8102330668639719,
55
+ "eval_f1": 0.8102330668639719,
56
+ "eval_loss": 0.8744572997093201,
57
+ "eval_precision": 0.8102330668639719,
58
+ "eval_recall": 0.8102330668639719,
59
+ "eval_runtime": 34.6123,
60
+ "eval_samples_per_second": 59.285,
61
+ "eval_steps_per_second": 3.727,
62
+ "step": 1500
63
+ }
64
+ ],
65
+ "max_steps": 12035,
66
+ "num_train_epochs": 5,
67
+ "total_flos": 2503550149632000.0,
68
+ "trial_name": null,
69
+ "trial_params": null
70
+ }
checkpoint-1500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b3cb303483efa6f2dc51db1cfb9b16000da398e2d72673041025bfff104b3b8
3
+ size 3643
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5de718e31c9f491c0dfba691cef2fadf6de01ce7e4513429474a72b167fc8394
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b1a29b3ccb13877c06b9c50bf20c54e7d085e260a305e3376c872a9cfa9e2e
3
  size 1134425553
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01422eac22c1e831a9f9acda84370c4c1858be607d7cd440776b6e970bb0b54f
3
- size 5258
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:643429707a800789d4f201880cd98c1a2057b31f9dc89474acd274f39e537fbf
3
+ size 6516