File size: 235 Bytes
1542971
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{
  "batch_size": 64,
  "mask_probability": 0.15,
  "num_layers": 6,
  "num_heads": 8,
  "d_model": 256,
  "d_ff": 512,
  "p_dropout": 0.1,
  "max_seq_len": 128,
  "vocab_size": 20000,
  "learning_rate": 3e-4,
  "grad_clip_value": 1
}