{ "activation": "ELU", "activation_params": { "alpha": 1.0 }, "architectures": [ "EnCodecModel" ], "audio_channels": 2, "audio_normalize": true, "causal": false, "compress": 2, "dilation_base": 2, "dimension": 128, "final_activation": null, "final_activation_params": null, "is_encoder_decoder": true, "kernel_size": 7, "last_kernel_size": 7, "lstm": 2, "model_type": "encodec", "norm": "time_group_norm", "norm_params": {}, "num_filters": 32, "num_residual_layers": 1, "overlap": 0.01, "pad_mode": "reflect", "ratios": [ 8, 5, 4, 2 ], "residual_kernel_size": 3, "sampling_rate": 48000, "segment": 1.0, "target_bandwidths": [ 3.0, 6.0, 12.0, 24.0 ], "torch_dtype": "float32", "transformers_version": "4.30.0.dev0", "trim_right_ratio": 1.0, "true_skip": false }