File size: 1,270 Bytes
1f57e37
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
{
    "adam_epsilon": 1e-08,
    "cache_dir": "",
    "config_name": "",
    "data_dir": "/content/data/glue/SNLI",
    "dev": null,
    "device": "cuda",
    "do_eval": true,
    "do_lower_case": true,
    "do_test": false,
    "do_train": true,
    "eval_all_checkpoints": false,
    "evaluate_during_training": true,
    "evaluate_during_training_epoch": false,
    "features_cache_dir": "/content/data/glue/SNLI/cache_93078",
    "fp16": false,
    "fp16_opt_level": "01",
    "gradient_accumulation_steps": 1,
    "learning_rate": 1.0708609960508476e-05,
    "local_rank": -1,
    "logging_steps": 1000,
    "max_grad_norm": 1.0,
    "max_seq_length": 128,
    "max_steps": -1,
    "model_name_or_path": "roberta-base",
    "model_type": "roberta",
    "n_gpu": 1,
    "no_cuda": false,
    "num_train_epochs": 6,
    "output_dir": "/content/results",
    "output_mode": "classification",
    "overwrite_cache": false,
    "overwrite_output_dir": false,
    "patience": 6,
    "per_gpu_eval_batch_size": 96,
    "per_gpu_train_batch_size": 64,
    "save_steps": 0,
    "seed": 93078,
    "server_ip": "",
    "server_port": "",
    "task_name": "snli",
    "test": null,
    "tokenizer_name": "",
    "train": null,
    "warmup_steps": 0,
    "weight_decay": 0.0
}