"""Minimal Gradio web UI that transcribes audio with OpenAI Whisper."""

from typing import Optional

import gradio as gr
import whisper

# Load the model once at start-up so every request reuses the same instance.
model = whisper.load_model("base")


def transcribe(audio: Optional[str]) -> str:
    """Return the Whisper transcription of an audio file.

    Args:
        audio: Path to the audio file handed over by the Gradio audio
            component, or ``None`` when the form is submitted without audio.

    Returns:
        The value stored under the ``"text"`` key of the Whisper result, or
        an empty string when no audio was provided.
    """
    # Gradio passes None when the user submits without recording/uploading;
    # forwarding that to the model would raise instead of showing a result.
    if audio is None:
        return ""
    result = model.transcribe(audio)
    return result["text"]


demo = gr.Interface(
    fn=transcribe,
    # type="filepath" makes Gradio pass a path string, which
    # model.transcribe() accepts. The bare "audio" shortcut uses the
    # component's default type, which delivers a (sample_rate, ndarray)
    # tuple that model.transcribe() cannot consume.
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)
# Start the web server as soon as the script runs.
demo.launch()