Omar95farag's picture
Saving best model to hub
94fda82
{
"EE_config": {
"alpha": 0.5,
"apply_ocr": true,
"batch_size": 2,
"benchmark_OCR": false,
"checkpoint": "",
"data_parallel": false,
"dataset": "jordyvl/rvl_cdip_100_examples_per_class",
"device": "cuda",
"downsampling": 0,
"encoder_layer_strategy": "ramp",
"epochs": 60,
"eval_batch_size": 1,
"eval_start": false,
"exit_head_num_layers": 2,
"exit_threshold": -1,
"exits": "text_avg,vision_avg,1,2,3,4,5,6,7,8,9,10,11,12",
"forward_signature": [
"input_ids",
"attention_mask",
"bbox",
"pixel_values",
"labels",
"token_type_ids",
"position_ids",
"head_mask",
"inputs_embeds",
"output_attentions",
"output_hidden_states",
"return_dict",
"kwargs"
],
"gamma": 0.5,
"get_raw_ocr_data": true,
"global_threshold": 1.000001,
"gradient_accumulation_steps": 24,
"inference_strategy": "max_confidence",
"labelset": "test",
"lowercase": false,
"lr": 2e-05,
"model": "EElayoutlmv3",
"model_weights": "microsoft/layoutlmv3-base",
"optimizer": "AdamW",
"plot_exits": false,
"print_freq": 50,
"seed": 42,
"temperature": 1,
"test_dataset": "jordyvl/rvl_cdip_100_examples_per_class",
"training_strategy": "one_stage_subgraphs_entropyreg",
"use_images": true,
"use_lte": false,
"use_wandb": false,
"warmup_ratio": 0,
"weight_decay": 0
},
"_name_or_path": "microsoft/layoutlmv3-base",
"architectures": [
"LayoutLMv3EEForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"coordinate_size": 128,
"eos_token_id": 2,
"exit_config": {
"encoder_layer_strategy": "ramp",
"exit_head_num_layers": 2,
"exits": [
"text_avg",
"vision_avg",
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12
],
"global_threshold": 1.000001,
"inference_strategy": "max_confidence",
"training_strategy": "one_stage_subgraphs_entropyreg"
},
"has_relative_attention_bias": true,
"has_spatial_attention_bias": true,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "letter",
"1": "form",
"2": "email",
"3": "handwritten",
"4": "advertisement",
"5": "scientific_report",
"6": "scientific_publication",
"7": "specification",
"8": "file_folder",
"9": "news_article",
"10": "budget",
"11": "invoice",
"12": "presentation",
"13": "questionnaire",
"14": "resume",
"15": "memo"
},
"initializer_range": 0.02,
"input_size": 224,
"intermediate_size": 3072,
"label2id": {
"advertisement": 4,
"budget": 10,
"email": 2,
"file_folder": 8,
"form": 1,
"handwritten": 3,
"invoice": 11,
"letter": 0,
"memo": 15,
"news_article": 9,
"presentation": 12,
"questionnaire": 13,
"resume": 14,
"scientific_publication": 6,
"scientific_report": 5,
"specification": 7
},
"layer_norm_eps": 1e-05,
"max_2d_position_embeddings": 1024,
"max_position_embeddings": 514,
"max_rel_2d_pos": 256,
"max_rel_pos": 128,
"model_type": "layoutlmv3",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"pad_token_id": 1,
"patch_size": 16,
"rel_2d_pos_bins": 64,
"rel_pos_bins": 32,
"second_input_size": 112,
"shape_size": 128,
"text_embed": true,
"torch_dtype": "float32",
"transformers_version": "4.31.0",
"type_vocab_size": 1,
"visual_embed": true,
"vocab_size": 50265
}