{ "dataset_args": { "history_max_utterances": 1000000, "history_max_tokens": 128, "dataroot": "data_exclude_kb", "knowledge_file": "knowledge.json" }, "task": "clusterid_classification", "model_name_or_path": "bert-base-uncased", "tokenizer_name_or_path": "/scratch/yt2267/public/alexa-with-dstc9-track1-dataset/bert-base-uncased-local", "per_gpu_train_batch_size": 16, "per_gpu_eval_batch_size": 32, "gradient_accumulation_steps": 1, "learning_rate": 6.25e-05, "adam_epsilon": 1e-08, "max_grad_norm": 1.0, "num_train_epochs": 100, "warmup_steps": 0, "fp16": "", "seed": 42 }