{ "EE_config": { "alpha": 0.5, "apply_ocr": true, "batch_size": 2, "benchmark_OCR": false, "checkpoint": "", "data_parallel": false, "dataset": "jordyvl/rvl_cdip_100_examples_per_class", "device": "cuda", "downsampling": 0, "encoder_layer_strategy": "ramp", "epochs": 60, "eval_batch_size": 1, "eval_start": false, "exit_head_num_layers": 2, "exit_threshold": -1, "exits": "text_avg,vision_avg,1,2,3,4,5,6,7,8,9,10,11,12", "forward_signature": [ "input_ids", "attention_mask", "bbox", "pixel_values", "labels", "token_type_ids", "position_ids", "head_mask", "inputs_embeds", "output_attentions", "output_hidden_states", "return_dict", "kwargs" ], "gamma": 0.5, "get_raw_ocr_data": true, "global_threshold": 1.000001, "gradient_accumulation_steps": 24, "inference_strategy": "max_confidence", "labelset": "test", "lowercase": false, "lr": 2e-05, "model": "EElayoutlmv3", "model_weights": "microsoft/layoutlmv3-base", "optimizer": "AdamW", "plot_exits": false, "print_freq": 50, "seed": 42, "temperature": 1, "test_dataset": "jordyvl/rvl_cdip_100_examples_per_class", "training_strategy": "one_stage_subgraphs_entropyreg", "use_images": true, "use_lte": false, "use_wandb": false, "warmup_ratio": 0, "weight_decay": 0 }, "_name_or_path": "microsoft/layoutlmv3-base", "architectures": [ "LayoutLMv3EEForSequenceClassification" ], "attention_probs_dropout_prob": 0.1, "bos_token_id": 0, "classifier_dropout": null, "coordinate_size": 128, "eos_token_id": 2, "exit_config": { "encoder_layer_strategy": "ramp", "exit_head_num_layers": 2, "exits": [ "text_avg", "vision_avg", 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12 ], "global_threshold": 1.000001, "inference_strategy": "max_confidence", "training_strategy": "one_stage_subgraphs_entropyreg" }, "has_relative_attention_bias": true, "has_spatial_attention_bias": true, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "letter", "1": "form", "2": "email", "3": "handwritten", "4": "advertisement", "5": "scientific_report", "6": "scientific_publication", "7": "specification", "8": "file_folder", "9": "news_article", "10": "budget", "11": "invoice", "12": "presentation", "13": "questionnaire", "14": "resume", "15": "memo" }, "initializer_range": 0.02, "input_size": 224, "intermediate_size": 3072, "label2id": { "advertisement": 4, "budget": 10, "email": 2, "file_folder": 8, "form": 1, "handwritten": 3, "invoice": 11, "letter": 0, "memo": 15, "news_article": 9, "presentation": 12, "questionnaire": 13, "resume": 14, "scientific_publication": 6, "scientific_report": 5, "specification": 7 }, "layer_norm_eps": 1e-05, "max_2d_position_embeddings": 1024, "max_position_embeddings": 514, "max_rel_2d_pos": 256, "max_rel_pos": 128, "model_type": "layoutlmv3", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "pad_token_id": 1, "patch_size": 16, "rel_2d_pos_bins": 64, "rel_pos_bins": 32, "second_input_size": 112, "shape_size": 128, "text_embed": true, "torch_dtype": "float32", "transformers_version": "4.31.0", "type_vocab_size": 1, "visual_embed": true, "vocab_size": 50265 }