File size: 346 Bytes
9579df3
cac7a4b
9579df3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
{
  "model_type": "krdmodel",
  "vocab_size": 111,
  "dim": 1024,
  "n_layers": 16,
  "n_heads": 16,
  "n_kv_heads": 4,
  "ffn_dim": 2816,
  "max_seq_len": 2048,
  "batch_size": 4,
  "gradient_accumulation": 8,
  "train_steps": 5000,
  "lr": 2e-4,
  "mixed_precision": "fp16",
  "lora_rank": 32,
  "use_flash": true,
  "grad_checkpoint": true
}