Spaces:

Merlintxu
/

Wav2Txt

Build error

App Files Files Community

Merlintxu committed on Jul 7, 2024

Commit

1851c8f

verified ·

1 Parent(s): df609a3

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -6

app.py CHANGED Viewed

@@ -12,7 +12,6 @@ from transformers import logging
 warnings.filterwarnings("ignore")
 logging.set_verbosity_error()
 # Updated models by language
 MODELS = {
     "es": [
@@ -23,7 +22,7 @@ MODELS = {
     "en": [
         "openai/whisper-large-v3",
         "facebook/wav2vec2-large-960h",
-        "microsoft/wav2vec2-base-960"
     ],
     "pt": [
         "facebook/wav2vec2-large-xlsr-53-portuguese",
@@ -103,18 +102,18 @@ def combined_interface(audio):
         language, model_options = detect_and_select_model(audio)
         selected_model = model_options[0]
-        yield language, gr.Dropdown.update(choices=model_options, value=selected_model), selected_model, ""
         full_transcription = ""
         for partial_transcription in transcribe_audio_stream(audio, selected_model):
             full_transcription += partial_transcription + " "
-            yield language, gr.Dropdown.update(choices=model_options, value=selected_model), selected_model, full_transcription.strip()
         # Clean up temporary files
         os.remove("converted_audio.wav")
     except Exception as e:
-        yield str(e), gr.Dropdown.update(choices=[]), "", "An error occurred during processing."
 iface = gr.Interface(
     fn=combined_interface,
@@ -126,7 +125,7 @@ iface = gr.Interface(
         gr.Textbox(label="Transcription", lines=10)
     ],
     title="Multilingual Audio Transcriber with Real-time Display",
-    description="Upload an audio file to detect the language, select the transcription model, and get the transcription in real-time. Optimized for Spanish and English.",
     live=True
 )

 warnings.filterwarnings("ignore")
 logging.set_verbosity_error()
 # Updated models by language
 MODELS = {
     "es": [
     "en": [
         "openai/whisper-large-v3",
         "facebook/wav2vec2-large-960h",
+        "microsoft/wav2vec2-base-960h"
     ],
     "pt": [
         "facebook/wav2vec2-large-xlsr-53-portuguese",
         language, model_options = detect_and_select_model(audio)
         selected_model = model_options[0]
+        yield language, model_options, selected_model, ""
         full_transcription = ""
         for partial_transcription in transcribe_audio_stream(audio, selected_model):
             full_transcription += partial_transcription + " "
+            yield language, model_options, selected_model, full_transcription.strip()
         # Clean up temporary files
         os.remove("converted_audio.wav")
     except Exception as e:
+        yield str(e), [], "", "An error occurred during processing."
 iface = gr.Interface(
     fn=combined_interface,
         gr.Textbox(label="Transcription", lines=10)
     ],
     title="Multilingual Audio Transcriber with Real-time Display",
+    description="Upload an audio file to detect the language, select the transcription model, and get the transcription in real-time. Optimized for Spanish, English, and Portuguese.",
     live=True
 )