{
  "EE_config": {
    "alpha": 0.5,
    "apply_ocr": true,
    "batch_size": 2,
    "benchmark_OCR": false,
    "checkpoint": "",
    "data_parallel": false,
    "dataset": "jordyvl/rvl_cdip_100_examples_per_class",
    "device": "cuda",
    "downsampling": 0,
    "encoder_layer_strategy": "ramp",
    "epochs": 60,
    "eval_batch_size": 1,
    "eval_start": false,
    "exit_head_num_layers": 2,
    "exit_threshold": -1,
    "exits": "text_visual_concat,1,2,3,4,5,6,7,8,9,10,11,12",
    "forward_signature": [
      "input_ids",
      "attention_mask",
      "bbox",
      "pixel_values",
      "labels",
      "token_type_ids",
      "position_ids",
      "head_mask",
      "inputs_embeds",
      "output_attentions",
      "output_hidden_states",
      "return_dict",
      "kwargs"
    ],
    "gamma": 0.5,
    "get_raw_ocr_data": true,
    "global_threshold": 1.000001,
    "gradient_accumulation_steps": 24,
    "inference_strategy": "max_confidence",
    "labelset": "test",
    "lowercase": false,
    "lr": 2e-05,
    "model": "EElayoutlmv3",
    "model_weights": "microsoft/layoutlmv3-base",
    "optimizer": "AdamW",
    "plot_exits": false,
    "print_freq": 50,
    "seed": 42,
    "temperature": 1,
    "test_dataset": "jordyvl/rvl_cdip_100_examples_per_class",
    "training_strategy": "one_stage_subgraphs_weighted",
    "use_images": true,
    "use_lte": false,
    "use_wandb": false,
    "warmup_ratio": 0,
    "weight_decay": 0
  },
  "_name_or_path": "microsoft/layoutlmv3-base",
  "architectures": [
    "LayoutLMv3EEForSequenceClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "coordinate_size": 128,
  "eos_token_id": 2,
  "exit_config": {
    "encoder_layer_strategy": "ramp",
    "exit_head_num_layers": 2,
    "exits": [
      "text_visual_concat",
      1,
      2,
      3,
      4,
      5,
      6,
      7,
      8,
      9,
      10,
      11,
      12
    ],
    "global_threshold": 1.000001,
    "inference_strategy": "max_confidence",
    "training_strategy": "one_stage_subgraphs_weighted"
  },
  "has_relative_attention_bias": true,
  "has_spatial_attention_bias": true,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "letter",
    "1": "form",
    "2": "email",
    "3": "handwritten",
    "4": "advertisement",
    "5": "scientific_report",
    "6": "scientific_publication",
    "7": "specification",
    "8": "file_folder",
    "9": "news_article",
    "10": "budget",
    "11": "invoice",
    "12": "presentation",
    "13": "questionnaire",
    "14": "resume",
    "15": "memo"
  },
  "initializer_range": 0.02,
  "input_size": 224,
  "intermediate_size": 3072,
  "label2id": {
    "advertisement": 4,
    "budget": 10,
    "email": 2,
    "file_folder": 8,
    "form": 1,
    "handwritten": 3,
    "invoice": 11,
    "letter": 0,
    "memo": 15,
    "news_article": 9,
    "presentation": 12,
    "questionnaire": 13,
    "resume": 14,
    "scientific_publication": 6,
    "scientific_report": 5,
    "specification": 7
  },
  "layer_norm_eps": 1e-05,
  "max_2d_position_embeddings": 1024,
  "max_position_embeddings": 514,
  "max_rel_2d_pos": 256,
  "max_rel_pos": 128,
  "model_type": "layoutlmv3",
  "num_attention_heads": 12,
  "num_channels": 3,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "patch_size": 16,
  "rel_2d_pos_bins": 64,
  "rel_pos_bins": 32,
  "second_input_size": 112,
  "shape_size": 128,
  "text_embed": true,
  "torch_dtype": "float32",
  "transformers_version": "4.26.1",
  "type_vocab_size": 1,
  "visual_embed": true,
  "vocab_size": 50265
}