# Example rows for quick inference. Each row is a two-item list: the path of
# a bundled Catalan speech recording, followed by None.
# NOTE(review): the None presumably fills a second, unused input slot of
# whatever consumes these rows -- confirm against the consumer.
infer_from_audio_examples = [
    [audio_path, None]
    for audio_path in (
        "catalan_audio_examples/catalan_female_speech_1.wav",
        "catalan_audio_examples/catalan_female_speech_2.wav",
        "catalan_audio_examples/catalan_male_speech_1.wav",
    )
]