|
{ |
|
"architectures": [ |
|
"EncodecModel" |
|
], |
|
"audio_channels": 1, |
|
"chunk_length_s": null, |
|
"codebook_dim": 128, |
|
"codebook_size": 2048, |
|
"compress": 2, |
|
"dilation_growth_rate": 2, |
|
"hidden_size": 128, |
|
"kernel_size": 7, |
|
"last_kernel_size": 7, |
|
"model_type": "encodec", |
|
"norm_type": "weight_norm", |
|
"normalize": false, |
|
"num_filters": 64, |
|
"num_lstm_layers": 2, |
|
"num_residual_layers": 1, |
|
"overlap": null, |
|
"pad_mode": "reflect", |
|
"residual_kernel_size": 3, |
|
"sampling_rate": 32000, |
|
"target_bandwidths": [ |
|
2.2 |
|
], |
|
"torch_dtype": "float32", |
|
"transformers_version": "4.31.0.dev0", |
|
"trim_right_ratio": 1.0, |
|
"upsampling_ratios": [ |
|
8, |
|
5, |
|
4, |
|
4 |
|
], |
|
"use_causal_conv": false, |
|
"use_conv_shortcut": true |
|
} |
|
|