wilsontam's picture
Bert model with sequence classifier and LM heads
6f2fb4b
raw history blame
No virus
621 Bytes
{
"dataset_args": {
"history_max_utterances": 1000000,
"history_max_tokens": 128,
"dataroot": "data_exclude_kb",
"knowledge_file": "knowledge.json"
},
"task": "clusterid_classification",
"model_name_or_path": "bert-base-uncased",
"tokenizer_name_or_path": "/scratch/yt2267/public/alexa-with-dstc9-track1-dataset/bert-base-uncased-local",
"per_gpu_train_batch_size": 16,
"per_gpu_eval_batch_size": 32,
"gradient_accumulation_steps": 1,
"learning_rate": 6.25e-05,
"adam_epsilon": 1e-08,
"max_grad_norm": 1.0,
"num_train_epochs": 100,
"warmup_steps": 0,
"fp16": "",
"seed": 42
}