jordyvl's picture
Saving best model to hub
e902962
{
"EE_config": {
"alpha": 0.5,
"apply_ocr": true,
"batch_size": 2,
"benchmark_OCR": false,
"checkpoint": "",
"data_parallel": false,
"dataset": "maveriq/tobacco3482",
"device": "cuda",
"downsampling": 0,
"encoder_layer_strategy": "ramp",
"epochs": 5,
"eval_batch_size": 1,
"eval_start": false,
"exit_head_num_layers": 2,
"exit_threshold": -1,
"exits": [
"text_avg",
"vision_avg",
1,
4,
8
],
"forward_signature": [
"input_ids",
"attention_mask",
"token_type_ids",
"position_ids",
"head_mask",
"inputs_embeds",
"labels",
"output_attentions",
"output_hidden_states",
"return_dict",
"bbox",
"pixel_values"
],
"gamma": 0,
"get_raw_ocr_data": true,
"global_threshold": 1.000001,
"gradient_accumulation_steps": 32,
"inference_strategy": "max_confidence",
"lowercase": false,
"lr": 2e-05,
"model": "LayoutLMv3",
"model_weights": "microsoft/layoutlmv3-base",
"optimizer": "AdamW",
"plot_exits": false,
"print_freq": 50,
"seed": 42,
"temperature": 1,
"test_dataset": "jordyvl/rvl_cdip_100_examples_per_class",
"training_strategy": "joint_weighted_avg",
"use_images": true,
"warmup_ratio": 0,
"weight_decay": 0
},
"_name_or_path": "microsoft/layoutlmv3-base",
"architectures": [
"LayoutLMv3ForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"coordinate_size": 128,
"eos_token_id": 2,
"has_relative_attention_bias": true,
"has_spatial_attention_bias": true,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "ADVE",
"1": "Email",
"2": "Form",
"3": "Letter",
"4": "Memo",
"5": "News",
"6": "Note",
"7": "Report",
"8": "Resume",
"9": "Scientific"
},
"initializer_range": 0.02,
"input_size": 224,
"intermediate_size": 3072,
"label2id": {
"ADVE": 0,
"Email": 1,
"Form": 2,
"Letter": 3,
"Memo": 4,
"News": 5,
"Note": 6,
"Report": 7,
"Resume": 8,
"Scientific": 9
},
"layer_norm_eps": 1e-05,
"max_2d_position_embeddings": 1024,
"max_position_embeddings": 514,
"max_rel_2d_pos": 256,
"max_rel_pos": 128,
"model_type": "layoutlmv3",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"pad_token_id": 1,
"patch_size": 16,
"problem_type": "single_label_classification",
"rel_2d_pos_bins": 64,
"rel_pos_bins": 32,
"second_input_size": 112,
"shape_size": 128,
"text_embed": true,
"torch_dtype": "float32",
"transformers_version": "4.26.1",
"type_vocab_size": 1,
"visual_embed": true,
"vocab_size": 50265
}