{
    "audio_processor_class": "ImageBindAudioProcessor",
    "num_mel_bins": 128,
    "target_length": 204,
    "sample_rate": 16000,
    "clip_duration": 2,
    "clips_per_video": 3,
    "mean": -4.268,
    "std": 9.138
}