File size: 1,113 Bytes
fcf1d1f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 |
# @package _group_
# Common run settings: TPU enabled, fp16 disabled, JSON-formatted logs.
common:
  tpu: true
  fp16: false
  log_format: json
  # NOTE(review): unit of the interval (updates vs. steps) is not visible
  # here; confirm against the consumer's documentation.
  log_interval: 10
  wandb_project: pretrain_tpu_960h
# Checkpoint settings: an update-based save interval of 500, a keep count
# of 2 for those interval checkpoints, and epoch checkpoints left enabled
# (`no_epoch_checkpoints` is false).
checkpoint:
  save_interval_updates: 500
  keep_interval_updates: 2
  no_epoch_checkpoints: false
# Task selection (`audio_pretraining`) and its input-size / batching options.
task:
  _name: audio_pretraining
  # `???` is a placeholder, not a real path. Presumably it is the
  # mandatory-value marker and must be overridden by the caller; confirm.
  data: ???
  # Upper and lower bounds on sample size. NOTE(review): the unit (audio
  # frames vs. something else) is not visible in this file.
  max_sample_size: 257600
  min_sample_size: 46400
  normalize: false
  num_batch_buckets: 3
  precompute_mask_indices: true
  enable_padding: true
# Data-loading settings: worker count, per-batch token budget, and skipping
# of invalid-size inputs for the valid/test splits.
dataset:
  num_workers: 12
  max_tokens: 1200000
  skip_invalid_size_inputs_valid_test: true
# Distributed-training settings: world size of 8 with the `legacy_ddp`
# backend.
distributed_training:
  distributed_world_size: 8
  ddp_backend: legacy_ddp
# Training criterion (`wav2vec`) with InfoNCE enabled.
criterion:
  _name: wav2vec
  infonce: true
  # Extra keys to report in the logs.
  log_keys: ["prob_perplexity", "code_perplexity", "temp"]
  # Two weights, one per auxiliary loss term. NOTE(review): which term each
  # position maps to is not visible in this file.
  loss_weights: [0.1, 0]
# Optimization schedule: total update budget and learning rate.
optimization:
  max_update: 400000
  # Single-element list; the consumer takes the learning rate as a list.
  lr: [0.0005]
# Optimizer selection (`adam`) and its hyperparameters.
optimizer:
  _name: adam
  # Plain scalar: YAML loads this as the string `(0.9,0.98)`, not a
  # sequence. Presumably the consumer parses the tuple itself; confirm
  # before changing the spelling.
  adam_betas: (0.9,0.98)
  # NOTE(review): exponent notation without a decimal point is read as a
  # string by some YAML 1.1 loaders; confirm the consumer's loader resolves
  # it to a float.
  adam_eps: 1e-06
  weight_decay: 0.01
# Learning-rate schedule: `polynomial_decay` with 32000 warmup updates.
lr_scheduler:
  _name: polynomial_decay
  warmup_updates: 32000
# Model selection (`wav2vec2`) and architecture / regularization settings.
model:
  _name: wav2vec2
  quantize_targets: true
  final_dim: 256
  # Dropout-style regularization rates.
  encoder_layerdrop: 0.05
  dropout_input: 0.1
  dropout_features: 0.1
  # NOTE(review): presumably scales gradients flowing into the feature
  # extractor; confirm against the model's documentation.
  feature_grad_mult: 0.1
  encoder_embed_dim: 768
|