File size: 411 Bytes
6ea4250 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
{
"model": "gpt2",
"dataset": "wikitext",
"subset": "wikitext-103-v1",
"output_dir": "output",
"num_epochs": 20,
"num_tokens": 100000000,
"window_size": 16,
"batch_size": 1024,
"learning_rate": 1e-05,
"warmup_steps": 3000,
"scheduler": "cosine",
"weight_decay": 0.1,
"random_seed": 42,
"eval_steps": 1000,
"patience": 5,
"id": "1c15056cf51bff47"
} |