# Page header captured together with the file (not part of the program):
# NeonBohdan's picture
# Update to streaming_stt_nemo==0.2.0
# f6d75ca
# raw
# history blame contribute delete
# 824 Bytes
from streaming_stt_nemo import Model, available_languages
import gradio as gr
# Languages offered in the UI, exactly as exported by streaming_stt_nemo.
LANGUAGES = available_languages

# Language selected by default in the UI.
default_lang = "en"

# Model instances keyed by language code. The default language's model is
# constructed here at import time; transcribe() adds the others on demand.
engines = {}
engines[default_lang] = Model(default_lang)

# One [audio file path, language code] example row per available language.
examples = [[f"./audio/{code}.mp3", code] for code in LANGUAGES]
def transcribe(audio, language: str):
    """Transcribe an audio file using the model for ``language``.

    Args:
        audio: Path of the audio file to transcribe (the UI is configured
            to pass a filepath). May be ``None`` or empty when there is no
            recording to process.
        language: Language code selecting which model to use.

    Returns:
        The first element of the model's ``stt_file`` result, or an empty
        string when no audio was supplied.
    """
    # With a live microphone input the callback can be invoked without a
    # recording (e.g. after the input is cleared); there is nothing to
    # transcribe then, so return empty text instead of failing in the model.
    if not audio:
        return ""

    # Construct the model for this language on first use and keep it in the
    # module-level cache so later calls reuse it.
    if language not in engines:
        engines[language] = Model(language)
    model = engines[language]

    return model.stt_file(audio)[0]
# Input components: microphone audio handed to the callback as a file path,
# and a radio selector for the language (defaulting to default_lang).
audio_input = gr.Audio(source="microphone", type="filepath")
language_input = gr.Radio(
    label="Language",
    choices=LANGUAGES,
    value=default_lang,
)

# Build the interface around transcribe() with a single textbox output,
# the per-language examples (cached), and live mode enabled.
demo = gr.Interface(
    fn=transcribe,
    inputs=[audio_input, language_input],
    outputs=["textbox"],
    examples=examples,
    cache_examples=True,
    live=True,
)

# Start the app.
demo.launch()