# NOTE(review): the stray `|` lines that preceded this list were extraction
# residue and have been dropped; confirm that no header comment (for example a
# Hydra package directive) originally stood at the top of this file.
#
# Defaults list: the configs named here are composed in the order given, and
# `_self_` marks the position at which the keys of this file are merged
# (Hydra convention -- assumes this file is loaded through Hydra).
defaults:
  - /solver/default
  - /model: score/basic
  # `override` replaces a `/dset` choice made by an earlier defaults entry.
  - override /dset: audio/default
  - _self_
# Name of the solver to use.
# NOTE(review): how this name is resolved is not visible in this file --
# confirm against the consuming code.
solver: diffusion
# Top-level values with no default in this file. `???` is OmegaConf's marker
# for a mandatory value, so each must be supplied by another config or an
# override (assumes this file is loaded through Hydra/OmegaConf).
sample_rate: ???
channels: ???
compression_model_checkpoint: ???
n_q: ???
# Data-loading settings. The three scalar keys directly under `dataset` are
# followed by one sub-mapping per split (train / valid / evaluate / generate)
# holding that split's own values.
# NOTE(review): indentation was lost in the source this was rebuilt from; the
# nesting below is reconstructed from key order -- confirm against the
# consumer's schema.
dataset:
  batch_size: 128
  num_workers: 10
  segment_duration: 1
  train:
    num_samples: 500000
  valid:
    num_samples: 10000
  evaluate:
    batch_size: 16
    num_samples: 10000
  generate:
    batch_size: 32
    num_samples: 50
    segment_duration: 10
    # NOTE(review): `audio` is placed under `generate` because it directly
    # follows that split's keys; confirm it is not meant to sit one level up,
    # directly under `dataset`.
    audio:
      # Interpolation: resolves to the top-level `sample_rate` value.
      sample_rate: ${sample_rate}
# Training loss settings.
loss:
  kind: mse
  # Float literal (`0.` == 0.0).
  norm_power: 0.
# Validation stage settings.
# NOTE(review): `every` is presumably a period counted in epochs -- confirm.
valid:
  every: 1
# Evaluation stage settings.
# NOTE(review): `every` is presumably a period counted in epochs -- confirm.
evaluate:
  every: 20
  num_workers: 5
  # One boolean per metric name; only `rvm` is switched on here.
  # This mapping is distinct from the top-level `metrics` key of this file.
  metrics:
    visqol: false
    sisnr: false
    rvm: true
# Generation stage settings.
# NOTE(review): `every` is presumably a period counted in epochs -- confirm.
generate:
  every: 25
  num_workers: 5
# Checkpoint retention settings.
checkpoint:
  save_last: true
  save_every: 25
  keep_last: 10
  # Explicit null: no value is set for this option.
  keep_every_states: null
# Optimisation settings: scalar options first, then one sub-mapping for the
# `adam` optimizer parameters and one for `ema`.
optim:
  epochs: 20000
  updates_per_epoch: 2000
  # Written with a `.` in the mantissa: YAML 1.1 loaders such as plain PyYAML
  # only resolve exponent notation to a float when the mantissa has a dot
  # (a bare `2e-4` would load as a string there). The value is unchanged.
  lr: 2.0e-4
  max_norm: 0
  optimizer: adam
  adam:
    betas: [0.9, 0.999]
    # Float literal (`0.` == 0.0).
    weight_decay: 0.
  ema:
    use: true
    updates: 1
    # Interpolation: resolves to the top-level `device` value, which is not
    # defined in this file and must come from another composed config.
    device: ${device}
    decay: 0.99
# Sample processor settings; `use: false` leaves it switched off here.
processor:
  name: multi_band_processor
  use: false
  n_bands: 8
  # Integer 10000; the `_` digit separator is YAML 1.1 integer syntax.
  num_samples: 10_000
  # Float literal (`1.` == 1.0).
  power_std: 1.
# Resampling settings; `use: false` leaves it switched off here.
# NOTE(review): `target_sr` is presumably a sample rate in Hz -- confirm.
resampling:
  use: false
  target_sr: 16000
# Band filter settings; `use: false` leaves it switched off here.
filter:
  use: false
  n_bands: 4
  idx_band: 0
  # Explicit null: no cutoffs are given in this file.
  cutoffs: null
# Noise schedule settings.
# NOTE(review): the meaning of each key is defined by the consuming schedule
# implementation, which is not visible from this file.
schedule:
  repartition: "power"
  variable_step_batch: true
  beta_t0: 1.0e-5
  beta_t1: 2.9e-2
  beta_exp: 7.5
  num_steps: 1000
  variance: 'beta'
  # Float literals (`5.` == 5.0, `1.` == 1.0).
  clip: 5.
  rescale: 1.
  # Explicit null: no band count is set at the schedule level.
  n_bands: null
  noise_scale: 1.0
# Top-level metrics settings (a separate mapping from `evaluate.metrics`).
metrics:
  num_stage: 4