comfact-deberta-v2 / params-deberta-large.json
Mete Ismayil
add model files
f26fd39
raw
history blame
443 Bytes
{
  "dataset_args": {
    "max_utterances": 20,
    "max_tokens": 512,
    "dataroot": "data/all/fact_full/nlu"
  },
  "task": "linking",
  "model_name_or_path": "microsoft/deberta-v3-large",
  "per_gpu_train_batch_size": 2,
  "per_gpu_eval_batch_size": 2,
  "gradient_accumulation_steps": 1,
  "learning_rate": 2e-07,
  "adam_epsilon": 1e-08,
  "max_grad_norm": 1.0,
  "num_train_epochs": 20,
  "warmup_steps": 0,
  "fp16": "",
  "seed": 47
}