{
  "model_name": "microsoft/mdeberta-v3-base",
  "name": "token level gliner",
  "max_width": 100,
  "hidden_size": 768,
  "dropout": 0.0,
  "fine_tune": true,
  "subtoken_pooling": "first",
  "span_mode": "token_level",
  "num_steps": 1000000,
  "train_batch_size": 4,
  "eval_every": 20000,
  "warmup_ratio": 0.1,
  "scheduler_type": "cosine",
  "gradient_accumulation_steps": 2,
  "loss_alpha": 0.25,
  "loss_gamma": 2,
  "label_smoothing": 0,
  "loss_reduction": "sum",
  "lr_encoder": 3e-5,
  "lr_others": 3e-5,
  "weight_decay_encoder": 0.01,
  "weight_decay_other": 0.01,
  "root_dir": "gliner_logs",
  "train_data": "/home/ltngoc/Move Gliner/data/viner_train.json",
  "val_data_dir": "/home/ltngoc/Move Gliner/data/viner",
  "log_dir": "mdeberta",
  "prev_path": "/home/ltngoc/Move Gliner/mdeberta/model_20000",
  "save_total_limit": 10,
  "size_sup": -1,
  "max_types": 13000,
  "shuffle_types": true,
  "random_drop": true,
  "max_neg_type_ratio": 1,
  "max_len": 768,
  "freeze_token_rep": false
}