{
  "activation": "ELU",
  "activation_params": {
    "alpha": 1.0
  },
  "architectures": [
    "EncodecModel"
  ],
  "audio_channels": 1,
  "bins": 1024,
  "causal": true,
  "codebook_dim": null,
  "commitment_weight": 1.0,
  "compress": 2,
  "decay": 0.99,
  "dilation_base": 2,
  "dimension": 128,
  "epsilon": 1e-05,
  "final_activation": null,
  "final_activation_params": null,
  "is_encoder_decoder": true,
  "kernel_size": 7,
  "kmeans_init": true,
  "kmeans_iters": 50,
  "last_kernel_size": 7,
  "model_type": "encodec",
  "norm": "weight_norm",
  "norm_params": {},
  "normalize": false,
  "num_filters": 32,
  "num_lstm_layers": 2,
  "num_residual_layers": 1,
  "overlap": 0.01,
  "pad_mode": "reflect",
  "ratios": [
    8,
    5,
    4,
    2
  ],
  "residual_kernel_size": 3,
  "sampling_rate": 24000,
  "segment": null,
  "target_bandwidths": [
    1.5,
    3.0,
    6.0,
    12.0,
    24.0
  ],
  "threshold_ema_dead_code": 2,
  "torch_dtype": "float32",
  "transformers_version": "4.31.0.dev0",
  "trim_right_ratio": 1.0,
  "true_skip": false
}