geletka committed on
Commit
d2c4bec
1 Parent(s): c299ddc

Upload 11 files

Browse files

first version of the model

config.json ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/layoutlmv2-large-uncased",
3
+ "architectures": [
4
+ "LayoutLMv2ForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "convert_sync_batchnorm": true,
8
+ "coordinate_size": 171,
9
+ "detectron2_config_args": {
10
+ "MODEL.ANCHOR_GENERATOR.SIZES": [
11
+ [
12
+ 32
13
+ ],
14
+ [
15
+ 64
16
+ ],
17
+ [
18
+ 128
19
+ ],
20
+ [
21
+ 256
22
+ ],
23
+ [
24
+ 512
25
+ ]
26
+ ],
27
+ "MODEL.BACKBONE.NAME": "build_resnet_fpn_backbone",
28
+ "MODEL.FPN.IN_FEATURES": [
29
+ "res2",
30
+ "res3",
31
+ "res4",
32
+ "res5"
33
+ ],
34
+ "MODEL.MASK_ON": true,
35
+ "MODEL.PIXEL_STD": [
36
+ 57.375,
37
+ 57.12,
38
+ 58.395
39
+ ],
40
+ "MODEL.POST_NMS_TOPK_TEST": 1000,
41
+ "MODEL.RESNETS.ASPECT_RATIOS": [
42
+ [
43
+ 0.5,
44
+ 1.0,
45
+ 2.0
46
+ ]
47
+ ],
48
+ "MODEL.RESNETS.DEPTH": 101,
49
+ "MODEL.RESNETS.NUM_GROUPS": 32,
50
+ "MODEL.RESNETS.OUT_FEATURES": [
51
+ "res2",
52
+ "res3",
53
+ "res4",
54
+ "res5"
55
+ ],
56
+ "MODEL.RESNETS.SIZES": [
57
+ [
58
+ 32
59
+ ],
60
+ [
61
+ 64
62
+ ],
63
+ [
64
+ 128
65
+ ],
66
+ [
67
+ 256
68
+ ],
69
+ [
70
+ 512
71
+ ]
72
+ ],
73
+ "MODEL.RESNETS.STRIDE_IN_1X1": false,
74
+ "MODEL.RESNETS.WIDTH_PER_GROUP": 8,
75
+ "MODEL.ROI_BOX_HEAD.NAME": "FastRCNNConvFCHead",
76
+ "MODEL.ROI_BOX_HEAD.NUM_FC": 2,
77
+ "MODEL.ROI_BOX_HEAD.POOLER_RESOLUTION": 14,
78
+ "MODEL.ROI_HEADS.IN_FEATURES": [
79
+ "p2",
80
+ "p3",
81
+ "p4",
82
+ "p5"
83
+ ],
84
+ "MODEL.ROI_HEADS.NAME": "StandardROIHeads",
85
+ "MODEL.ROI_HEADS.NUM_CLASSES": 5,
86
+ "MODEL.ROI_MASK_HEAD.NAME": "MaskRCNNConvUpsampleHead",
87
+ "MODEL.ROI_MASK_HEAD.NUM_CONV": 4,
88
+ "MODEL.ROI_MASK_HEAD.POOLER_RESOLUTION": 7,
89
+ "MODEL.RPN.IN_FEATURES": [
90
+ "p2",
91
+ "p3",
92
+ "p4",
93
+ "p5",
94
+ "p6"
95
+ ],
96
+ "MODEL.RPN.POST_NMS_TOPK_TRAIN": 1000,
97
+ "MODEL.RPN.PRE_NMS_TOPK_TEST": 1000,
98
+ "MODEL.RPN.PRE_NMS_TOPK_TRAIN": 2000
99
+ },
100
+ "fast_qkv": false,
101
+ "gradient_checkpointing": false,
102
+ "has_relative_attention_bias": true,
103
+ "has_spatial_attention_bias": true,
104
+ "has_visual_segment_embedding": false,
105
+ "hidden_act": "gelu",
106
+ "hidden_dropout_prob": 0.1,
107
+ "hidden_size": 1024,
108
+ "id2label": {
109
+ "0": "DIC",
110
+ "1": "IBAN",
111
+ "2": "ICO",
112
+ "3": "O",
113
+ "4": "account_number",
114
+ "5": "bank_code",
115
+ "6": "const_symbol",
116
+ "7": "contr_address",
117
+ "8": "contr_name",
118
+ "9": "due_date",
119
+ "10": "invoice_date",
120
+ "11": "invoice_number",
121
+ "12": "qr_code",
122
+ "13": "spec_symbol",
123
+ "14": "total_amount",
124
+ "15": "var_symbol"
125
+ },
126
+ "image_feature_pool_shape": [
127
+ 7,
128
+ 7,
129
+ 256
130
+ ],
131
+ "initializer_range": 0.02,
132
+ "intermediate_size": 4096,
133
+ "label2id": {
134
+ "DIC": 0,
135
+ "IBAN": 1,
136
+ "ICO": 2,
137
+ "O": 3,
138
+ "account_number": 4,
139
+ "bank_code": 5,
140
+ "const_symbol": 6,
141
+ "contr_address": 7,
142
+ "contr_name": 8,
143
+ "due_date": 9,
144
+ "invoice_date": 10,
145
+ "invoice_number": 11,
146
+ "qr_code": 12,
147
+ "spec_symbol": 13,
148
+ "total_amount": 14,
149
+ "var_symbol": 15
150
+ },
151
+ "layer_norm_eps": 1e-12,
152
+ "max_2d_position_embeddings": 1024,
153
+ "max_position_embeddings": 512,
154
+ "max_rel_2d_pos": 256,
155
+ "max_rel_pos": 128,
156
+ "model_type": "layoutlmv2",
157
+ "num_attention_heads": 16,
158
+ "num_hidden_layers": 24,
159
+ "output_past": true,
160
+ "pad_token_id": 0,
161
+ "rel_2d_pos_bins": 64,
162
+ "rel_pos_bins": 32,
163
+ "shape_size": 170,
164
+ "torch_dtype": "float32",
165
+ "transformers_version": "4.21.0",
166
+ "type_vocab_size": 2,
167
+ "vocab_size": 30522
168
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0540ef6f6c09af67bd84180c8fe13f33ad4434740fbc98174e4f9d6b8ea1e26
3
+ size 3382390311
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76795a99dca4d119d5d450f03405098fbcd58ea6da771b040550349198743610
3
+ size 1705974883
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3671d32d7e68d908b61d68f659b7b064d131ce43ac58616534bafabe38edc159
3
+ size 14439
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4eb92341ebdc6a151646e2e89df28c54b26e8410408faa62c48b1e57c90c6ed
3
+ size 623
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "cls_token": "[CLS]",
4
+ "cls_token_box": [
5
+ 0,
6
+ 0,
7
+ 0,
8
+ 0
9
+ ],
10
+ "do_basic_tokenize": true,
11
+ "do_lower_case": true,
12
+ "mask_token": "[MASK]",
13
+ "model_max_length": 512,
14
+ "name_or_path": "microsoft/layoutlmv2-large-uncased",
15
+ "never_split": null,
16
+ "only_label_first_subword": true,
17
+ "pad_token": "[PAD]",
18
+ "pad_token_box": [
19
+ 0,
20
+ 0,
21
+ 0,
22
+ 0
23
+ ],
24
+ "pad_token_label": -100,
25
+ "sep_token": "[SEP]",
26
+ "sep_token_box": [
27
+ 1000,
28
+ 1000,
29
+ 1000,
30
+ 1000
31
+ ],
32
+ "special_tokens_map_file": null,
33
+ "strip_accents": null,
34
+ "tokenize_chinese_chars": true,
35
+ "tokenizer_class": "LayoutLMv2Tokenizer",
36
+ "unk_token": "[UNK]"
37
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32638b12f032c2492960a944930684d4150141c53ab06b19be2c343d5e5b5688
3
+ size 3439
vocab.txt ADDED
The diff for this file is too large to render. See raw diff