encodec-32khz-bfloat16 / config.json
awni's picture
850978763c248627823e3b7ae8397d13b3b81aa9adfff2c3d8261f048eada316
7d4003d verified
raw
history blame
841 Bytes
{
"architectures": [
"EncodecModel"
],
"audio_channels": 1,
"chunk_length_s": null,
"codebook_dim": 128,
"codebook_size": 2048,
"compress": 2,
"dilation_growth_rate": 2,
"hidden_size": 128,
"kernel_size": 7,
"last_kernel_size": 7,
"model_type": "encodec",
"norm_type": "weight_norm",
"normalize": false,
"num_filters": 64,
"num_lstm_layers": 2,
"num_residual_layers": 1,
"overlap": null,
"pad_mode": "reflect",
"residual_kernel_size": 3,
"sampling_rate": 32000,
"target_bandwidths": [
2.2
],
"torch_dtype": "float32",
"transformers_version": "4.31.0.dev0",
"trim_right_ratio": 1.0,
"upsampling_ratios": [
8,
5,
4,
4
],
"use_causal_conv": false,
"use_conv_shortcut": false
}