{
  "feature_extractor_type": "VocosFeatureExtractor",
  "feature_size": 100,
  "hop_length": 256,
  "n_fft": 1024,
  "n_mels": 100,
  "padding": "center",
  "padding_side": "right",
  "padding_value": 0.0,
  "processor_class": "VocosEncodecProcessor",
  "return_attention_mask": true,
  "sampling_rate": 24000,
  "win_length": 1024
}