Spaces:
Sleeping
Sleeping
File size: 1,152 Bytes
50f034f 75a7169 50f034f b688797 50f034f 63015d5 50f034f 881d56d 50f034f d48dcc4 50f034f d48dcc4 50f034f d48dcc4 50f034f 4687dd9 50f034f d48dcc4 50f034f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 |
# Training configuration.
# Plain keys are top-level run settings; dotted keys (`Name.argument`) set a
# single argument on the named component. Keys prefixed with `train/`, `val/`
# or `test/` look like per-split overrides -- NOTE(review): confirm against
# the loader that consumes this file.

# Checkpoint locations and run length.
codec_ckpt: ./models/spotdl/codec.pth
save_path: ckpt
max_epochs: 1000
epoch_length: 1000
save_audio_epochs: 2
val_idx: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]

# Prefix/suffix settings (both amounts are zero here; the dropout values
# are 0.1). NOTE(review): exact semantics are defined by the training
# script, not by this file.
prefix_amt: 0.0
suffix_amt: 0.0
prefix_dropout: 0.1
suffix_dropout: 0.1

# Data loader sizing.
batch_size: 8
num_workers: 10

# Optimization: debugging/precision switches, loss, optimizer, LR schedule.
detect_anomaly: false
amp: false
CrossEntropyLoss.label_smoothing: 0.1
AdamW.lr: 0.001
NoamScheduler.factor: 2.0
NoamScheduler.warmup: 10000

# Pitch-shift settings: probability is 0.0 and the shift amount is the
# constant 0 -- presumably this leaves pitch shifting inactive; verify.
PitchShift.shift_amount: [const, 0]
PitchShift.prob: 0.0

# Model hyperparameters.
VampNet.vocab_size: 1024
VampNet.n_codebooks: 4
VampNet.n_conditioning_codebooks: 0
VampNet.r_cond_dim: 0
VampNet.noise_mode: mask
VampNet.embedding_dim: 1280
VampNet.n_layers: 20
VampNet.n_heads: 20
VampNet.flash_attn: false
VampNet.dropout: 0.1

# Audio loading shared by every split.
AudioLoader.relative_path: /data/
AudioLoader.shuffle: true
AudioDataset.loudness_cutoff: -30.0
AudioDataset.without_replacement: true
AudioDataset.duration: 10.0

# Per-split example counts and source directories.
train/AudioDataset.n_examples: 10000000
train/AudioLoader.sources:
  - /data/spotdl/audio/train

val/AudioDataset.n_examples: 2000
val/AudioLoader.sources:
  - /data/spotdl/audio/val

test/AudioDataset.n_examples: 1000
test/AudioLoader.sources:
  - /data/spotdl/audio/test
|