{
  "dataset_args": {
    "max_utterances": 20,
    "max_tokens": 512,
    "dataroot": "data/all/fact_full/nlu"
  },
  "task": "linking",
  "model_name_or_path": "microsoft/deberta-v3-large",
  "per_gpu_train_batch_size": 2,
  "per_gpu_eval_batch_size": 2,
  "gradient_accumulation_steps": 1,
  "learning_rate": 2e-07,
  "adam_epsilon": 1e-08,
  "max_grad_norm": 1.0,
  "num_train_epochs": 20,
  "warmup_steps": 0,
  "fp16": "",
  "seed": 47
}