Spaces:
Running
on
A10G
Running
on
A10G
# @package __global__ | |
defaults: | |
- /solver/default | |
- /model: score/basic | |
- override /dset: audio/default | |
- _self_ | |
solver: diffusion | |
sample_rate: 16000 | |
channels: 1 | |
compression_model_checkpoint: //sig/5091833e | |
n_q: 2 # number of codebooks to keep | |
dataset: | |
batch_size: 8 | |
num_workers: 10 | |
segment_duration: 1 | |
train: | |
num_samples: 100 | |
valid: | |
num_samples: 100 | |
evaluate: | |
batch_size: 8 | |
num_samples: 10 | |
generate: | |
batch_size: 8 | |
num_samples: 10 | |
segment_duration: 10 | |
loss: | |
kind: mse | |
norm_power: 0. | |
valid: | |
every: 1 | |
evaluate: | |
every: 5 | |
num_workers: 5 | |
metrics: | |
visqol: false | |
sisnr: false | |
rvm: true | |
generate: | |
every: 5 | |
num_workers: 5 | |
audio: | |
sample_rate: ${sample_rate} | |
checkpoint: | |
save_last: true | |
save_every: 25 | |
keep_last: 10 | |
keep_every_states: null | |
optim: | |
epochs: 50 | |
updates_per_epoch: 2000 | |
lr: 2e-4 | |
max_norm: 0 | |
optimizer: adam | |
adam: | |
betas: [0.9, 0.999] | |
weight_decay: 0. | |
ema: | |
use: true # whether to use EMA or not | |
updates: 1 # update at every step | |
device: ${device} # device for EMA, can be put on GPU if more frequent updates | |
decay: 0.99 # EMA decay value, if null, no EMA is used | |
processor: | |
name: multi_band_processor | |
use: false | |
n_bands: 8 | |
num_samples: 10_000 | |
power_std: 1. | |
resampling: | |
use: false | |
target_sr: 16000 | |
filter: | |
use: false | |
n_bands: 4 | |
idx_band: 0 | |
cutoffs: null | |
schedule: | |
repartition: "power" | |
variable_step_batch: true | |
beta_t0: 1.0e-5 | |
beta_t1: 2.9e-2 | |
beta_exp: 7.5 | |
num_steps: 1000 | |
variance: 'beta' | |
clip: 5. | |
rescale: 1. | |
n_bands: null | |
noise_scale: 1.0 | |
metrics: | |
num_stage: 4 | |