File size: 1,152 Bytes
50f034f
75a7169
50f034f
b688797
50f034f
 
 
 
 
 
 
 
 
63015d5
 
50f034f
 
 
 
 
 
 
 
 
 
 
 
881d56d
 
 
50f034f
d48dcc4
50f034f
d48dcc4
 
50f034f
d48dcc4
50f034f
 
4687dd9
50f034f
 
 
 
 
 
d48dcc4
 
50f034f
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60

# Run-level settings: codec checkpoint, output location, run length and
# validation sampling.
# Path to the codec checkpoint file, given relative to the current directory.
codec_ckpt: ./models/spotdl/codec.pth
# Output location for saved artifacts — presumably a directory resolved
# relative to the working directory; confirm against the training script.
save_path: ckpt
# NOTE(review): whether epoch_length counts iterations or examples is not
# visible here — confirm. max_epochs * epoch_length = 1,000,000.
max_epochs: 1000
epoch_length: 1000
# Presumably audio samples are saved every 2 epochs — confirm.
save_audio_epochs: 2
# Ten integer indices (0-9) — presumably the validation items that get
# rendered/saved; verify against the consumer.
val_idx: [0,1,2,3,4,5,6,7,8,9]

# Prefix/suffix settings. Both amounts are 0.0 and both dropouts are 0.1.
# NOTE(review): presumably the *_amt values are the fraction of each example
# kept as unmasked context at the start/end, and the *_dropout values are the
# probability of dropping that context — confirm against the training code.
prefix_amt: 0.0
suffix_amt: 0.0
prefix_dropout: 0.1
suffix_dropout: 0.1

# Data-loading sizing.
# NOTE(review): presumably examples per batch and the number of loader worker
# processes; whether batch_size is per-device or global is not visible here.
batch_size: 8
num_workers: 10

# Optimization
# Both flags are real YAML booleans and both are off.
# NOTE(review): detect_anomaly presumably toggles autograd anomaly detection
# and amp presumably toggles automatic mixed precision — confirm.
detect_anomaly: false
amp: false

# Loss, optimizer and LR-scheduler settings.
# The keys below are flat top-level keys whose names contain a dot; they are
# NOT nested mappings. Presumably the consumer routes `Name.arg` to the
# argument `arg` of the class/function `Name` — confirm against the loader.
CrossEntropyLoss.label_smoothing: 0.1

# Learning rate passed under the AdamW name.
AdamW.lr: 0.001

# NOTE(review): warmup is presumably a step count (10000) and factor a
# multiplier on the schedule — verify against the NoamScheduler definition.
NoamScheduler.factor: 2.0
NoamScheduler.warmup: 10000

# Pitch-shift settings.
# shift_amount is a two-element sequence: the string `const` and the integer 0.
# NOTE(review): presumably a (distribution, value) spec meaning "constant 0";
# with prob 0.0 the transform presumably never fires — confirm.
PitchShift.shift_amount: [const, 0]
PitchShift.prob: 0.0

# Model hyperparameters, all under the `VampNet.` key prefix.
# NOTE(review): vocab_size / n_codebooks presumably have to match the codec
# referenced by codec_ckpt (1024 entries per codebook, 4 codebooks) — confirm.
VampNet.vocab_size: 1024
VampNet.n_codebooks: 4
# Conditioning is zeroed out here: 0 conditioning codebooks and r_cond_dim 0.
VampNet.n_conditioning_codebooks: 0
VampNet.r_cond_dim: 0
# Plain string value `mask`; the set of accepted modes is not visible here.
VampNet.noise_mode: mask
# embedding_dim / n_heads = 1280 / 20 = 64 — presumably the per-head width.
VampNet.embedding_dim: 1280
VampNet.n_layers: 20
VampNet.n_heads: 20
# Flash attention is switched off in this config.
VampNet.flash_attn: false
VampNet.dropout: 0.1

# Loader/dataset settings with no split prefix — presumably shared by the
# train/val/test splits; confirm.
# NOTE(review): the `sources` entries elsewhere in this file are absolute
# paths that also start with /data/ — check how relative_path combines with
# them.
AudioLoader.relative_path: /data/
# Negative float threshold — presumably in dB; confirm unit.
AudioDataset.loudness_cutoff: -30.0
AudioDataset.without_replacement: true
AudioLoader.shuffle: true

# Float value — presumably the excerpt length in seconds; confirm unit.
AudioDataset.duration: 10.0

# Per-split dataset settings. Keys carry a `train/`, `val/` or `test/` prefix
# ahead of the dotted name — presumably a scope selector understood by the
# config loader; confirm.
# Each `sources` value is a one-element list holding a directory path.

# Training split: 10,000,000 examples.
train/AudioDataset.n_examples: 10000000
train/AudioLoader.sources:
  - /data/spotdl/audio/train

# Validation split: 2,000 examples.
val/AudioDataset.n_examples: 2000
val/AudioLoader.sources:
  - /data/spotdl/audio/val

# Test split: 1,000 examples.
test/AudioDataset.n_examples: 1000
test/AudioLoader.sources:
  - /data/spotdl/audio/test