File size: 1,113 Bytes
b66a148 240597c b66a148 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 |
# @package _group_
# Training configuration, grouped into one mapping per section. Every setting
# is nested under its section header so that the `_name` selectors of the
# task, criterion, optimizer, lr_scheduler and model sections do not collide
# as duplicate top-level keys.
# NOTE(review): the filesystem paths below are absolute and point into one
# user's home directory; adjust them before running on another machine.

common:
  fp16: true
  log_format: json
  log_interval: 200
  tensorboard_logdir: /home/joregan/wav2vec2-swedish-riksdag-100h-transcripts-nolm/runs

checkpoint:
  no_epoch_checkpoints: true
  # Metric name used to pick the best checkpoint.
  best_checkpoint_metric: wer

task:
  _name: audio_finetuning
  data: /home/joregan/fairseq-data3/
  normalize: true
  labels: ltr

dataset:
  num_workers: 6
  max_tokens: 128000
  skip_invalid_size_inputs_valid_test: true
  valid_subset: valid

distributed_training:
  ddp_backend: legacy_ddp
  # NOTE(review): presumably the number of worker processes/devices; confirm
  # it matches the hardware actually available.
  distributed_world_size: 8

criterion:
  _name: ctc
  zero_infinity: true

optimization:
  max_update: 80000
  lr: [0.00003]
  sentence_avg: true
  update_freq: [5]

optimizer:
  _name: adam
  # Left as an unquoted plain scalar exactly as in the original; how it is
  # parsed is up to the consumer.
  adam_betas: (0.9,0.98)
  adam_eps: 1e-08

lr_scheduler:
  _name: tri_stage
  # The three ratios sum to 1.0.
  phase_ratio: [0.1, 0.4, 0.5]
  final_lr_scale: 0.05

model:
  _name: wav2vec_ctc
  w2v_path: /home/joregan/kb_wav2vec2_checkpoint/checkpoint_last.pt
  apply_mask: true
  mask_prob: 0.5
  mask_channel_prob: 0.5
  mask_channel_length: 64
  layerdrop: 0.1
  activation_dropout: 0.1
  feature_grad_mult: 0.0
  freeze_finetune_updates: 10000
|