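# Web file-viewer header captured with this file; kept as comments so the
# document parses as YAML.
# VQMIVC / config / model / default.yaml
# akhaliq3
# spaces demo
# 2b7bf83
# raw
# history blame
# 694 Bytes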
# Model hyper-parameters, grouped per component under `model`.
# NOTE(review): the nesting is reconstructed. In the flattened form `z_dim`
# and `c_dim` were duplicated at one level and the `${model.encoder.*}`
# references had no target; nesting `encoder` under `model` is what those
# references require.
model:
  # Encoder dimensions; `z_dim` and `c_dim` are re-used by `cpc` below.
  encoder:
    in_channels: 80
    channels: 512
    n_embeddings: 512
    z_dim: 64
    c_dim: 256

  # Every value here is a `${...}` interpolation. The first four point at
  # `training.*` keys, which are not defined in this file; the last two mirror
  # the encoder dimensions above so the two groups cannot drift apart.
  cpc:
    n_prediction_steps: ${training.n_prediction_steps}
    n_speakers_per_batch: ${training.n_speakers_per_batch}
    n_utterances_per_speaker: ${training.n_utterances_per_speaker}
    n_negatives: ${training.n_negatives}
    z_dim: ${model.encoder.z_dim}
    c_dim: ${model.encoder.c_dim}

  # NOTE(review): placed under `model` next to `encoder` and `cpc`; confirm
  # against the code that reads it. The camelCase keys are kept exactly as
  # found because the consumer looks them up by name.
  cpc_model:
    nPredicts: 12
    # Same value as encoder.c_dim (256) - presumably intentional; TODO confirm.
    dimOutputAR: 256
    # Same value as encoder.z_dim (64) - presumably intentional; TODO confirm.
    dimOutputEncoder: 64
    negativeSamplingExt: 64
    rnnMode: ffd
    # Canonical lowercase boolean (was `False`); parses to the same value.
    dropout: false
    speakerEmbedding: 0
    nSpeakers: 0
    sizeInputSeq: 64