File size: 276 Bytes
2f044c1
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# Model settings.
model:
  # Identifier of the transformer backbone. NOTE(review): looks like a
  # Hugging Face Hub model id; confirm against the code that loads it.
  transformer_model: "microsoft/deberta-v3-small"

# Optimizer and learning-rate schedule settings.
optimizer:
  # Learning rate (5e-5). Kept in plain decimal form so every YAML loader
  # reads it as a float.
  lr: 0.00005
  # Warmup length in steps. NOTE(review): presumably measured against
  # total_steps below; confirm with the scheduler code.
  warmup_steps: 25000
  # `${...}` interpolation: the value is taken from
  # training.trainer.max_steps, which is not defined in this section.
  # NOTE(review): assumes an OmegaConf/Hydra-style loader resolves it.
  total_steps: ${training.trainer.max_steps}
  weight_decay: 0.01
  # NOTE(review): presumably parameter-name patterns that are excluded from
  # weight decay; verify against the optimizer construction code.
  # Both entries are quoted so the list uses a single scalar style.
  no_decay_params:
    - "bias"
    - "LayerNorm.weight"

# NOTE(review): presumably the number of relations handled in one forward
# pass; confirm against the code that reads this key.
relations_per_forward: 16
entities_per_forward: