{ "adam_epsilon": 1e-08, "cache_dir": "", "config_name": "", "data_dir": "/content/data/glue/MNLI", "dev": null, "device": "cuda", "do_eval": true, "do_lower_case": true, "do_test": false, "do_train": true, "eval_all_checkpoints": false, "eval_batch_size": 96, "evaluate_during_training": true, "evaluate_during_training_epoch": false, "features_cache_dir": "/content/data/glue/MNLI/cache_36891", "fp16": false, "fp16_opt_level": "O1", "gradient_accumulation_steps": 1, "learning_rate": 1.0993071205018916e-05, "local_rank": -1, "logging_steps": 1000, "max_grad_norm": 1.0, "max_seq_length": 128, "max_steps": -1, "model_name_or_path": "roberta-base", "model_type": "roberta", "n_gpu": 1, "no_cuda": false, "num_train_epochs": 6, "output_dir": "/content/results", "output_mode": "classification", "overwrite_cache": false, "overwrite_output_dir": false, "patience": 3, "per_gpu_eval_batch_size": 96, "per_gpu_train_batch_size": 64, "save_steps": 0, "seed": 36891, "server_ip": "", "server_port": "", "task_name": "mnli", "test": null, "tokenizer_name": "", "train": null, "train_batch_size": 64, "warmup_steps": 0, "weight_decay": 0.0 }