{
"class_token_index": 128002,
"dropout": 0.1,
"encoder_config": null,
"ent_token": "<<ENT>>",
"eval_every": 2500,
"fine_tune": true,
"freeze_token_rep": false,
"gpu": "pds@a100",
"has_rnn": true,
"hidden_size": 768,
"log_dir": "/gpfsdswork/projects/rech/bwq/upa43yu/gliner-pip/train_gliner/token_gliner_ft_logs/deberta-v3-base_0",
"loss_alpha": -1,
"loss_gamma": 0,
"loss_reduction": "sum",
"lr_encoder": "1e-6",
"lr_others": "1e-6",
"max_len": 384,
"max_neg_type_ratio": 1,
"max_types": 25,
"max_width": 100,
"model_name": "microsoft/deberta-v3-base",
"model_type": "gliner",
"name": "token level gliner",
"num_steps": 30000,
"prev_path": "/gpfswork/rech/bwq/upa43yu/gliner-pip/train_gliner/token_gliner_logs/deberta-v3-base_4/model_30000",
"random_drop": true,
"root_dir": "token_gliner_ft_logs",
"run_time": "3:30:00",
"scheduler_type": "cosine",
"sep_token": "<<SEP>>",
"shuffle_types": true,
"size_sup": -1,
"span_mode": "token_level",
"subtoken_pooling": "first",
"train_batch_size": 8,
"train_data": "/gpfswork/rech/bwq/upa43yu/gliner-pip/train_gliner/train_new.json",
"transformers_version": "4.38.2",
"val_data_dir": "/gpfswork/rech/ohy/upa43yu/NER_datasets",
"vocab_size": 128004,
"warmup_ratio": 0.1,
"weight_decay_encoder": 0.01,
"weight_decay_other": 0.01,
"words_splitter_type": "whitespace"
}