{
  "feature_size": 80,
  "sampling_rate": 16000,
  "padding_value": 0.0,
  "padding_side": "right",
  "return_attention_mask": false,
  "feature_extractor_type": "WhisperFeatureExtractor",
  "n_samples": 480000,
  "nb_max_frames": 3000,
  "n_fft": 400,
  "hop_length": 160,
  "chunk_length": 30,
  "dither": 0.0,
  "sequence_length": 1000,
  "processor_class": "VoiceEmbedderProcessor"
}