File size: 276 Bytes
2f044c1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 |
# Model section.
model:
  # NOTE(review): presumably a Hugging Face checkpoint identifier — confirm
  # against the code that consumes this key.
  transformer_model: "microsoft/deberta-v3-small"

# Optimizer section.
optimizer:
  lr: 0.00005
  warmup_steps: 25000
  # Interpolation: resolved from `training.trainer.max_steps`, which is
  # defined outside this file.
  total_steps: ${training.trainer.max_steps}
  weight_decay: 0.01
  # NOTE(review): presumably parameter-name patterns exempt from weight
  # decay — confirm against the optimizer factory that reads this list.
  no_decay_params:
    - "bias"
    - LayerNorm.weight

# NOTE(review): kept at top level; confirm these two keys are not meant to be
# nested under one of the sections above.
relations_per_forward: 16
# Explicit null instead of a bare empty value; both parse to null.
entities_per_forward: null
|