bambara-vqvae / config.json
oza75's picture
oza75/bambara-vqvae
0c7c64d verified
raw
history blame
573 Bytes
{
"_name_or_path": "oza75/bambara-vqvae",
"act_fn": "relu",
"architectures": [
"BMSpeechVQVAE"
],
"in_channels": 1,
"initial_filters": 64,
"input_shape": null,
"kernel_size": 4,
"latent_channels": 512,
"model_type": "bm_speech_vq_vae",
"norm_num_groups": 32,
"norm_type": "group",
"num_layers": 4,
"num_vq_embeddings": 512,
"out_channels": 1,
"padding": 1,
"sample_size": 32,
"scaling_factor": 0.18215,
"speaker_embed_dim": 512,
"stride": 2,
"torch_dtype": "float32",
"transformers_version": "4.41.1",
"vq_embed_dim": 64
}