datnth1709 committed on
Commit
4357214
·
1 Parent(s): 85cd50e
Files changed (1) hide show
  1. app.py +10 -11
app.py CHANGED
@@ -162,7 +162,7 @@ def transcribe_vi(audio, state_vi="", state_en=""):
162
  state_vi += beam_search_output + " "
163
  en_text = translate_vi2en(beam_search_output)
164
  state_en += en_text + " "
165
- return state_vi, state_en, state_vi, state_en
166
 
167
  def transcribe_en(audio, state_en="", state_vi=""):
168
  speech = load_data(audio)
@@ -179,7 +179,7 @@ def transcribe_en(audio, state_en="", state_vi=""):
179
  state_en += transcription + " "
180
  vi_text = translate_en2vi(transcription)
181
  state_vi += vi_text + " "
182
- return state_en, state_vi, state_en, state_vi
183
 
184
  """Gradio demo"""
185
 
@@ -207,27 +207,27 @@ with gr.Blocks() as demo:
207
  translate_button_vien_1.click(lambda text: translate_vi2en(text), inputs=vietnamese_text, outputs=english_out_1)
208
  gr.Examples(examples=vi_example_text,
209
  inputs=[vietnamese_text])
 
210
  with gr.TabItem("Speech2text and Vi-En Translation"):
211
  with gr.Row():
212
  with gr.Column():
213
- vi_audio = gr.Audio(source="microphone", label="Input Vietnamese Audio", type="file", streaming=False)
214
  translate_button_vien_2 = gr.Button(value="Translate To English")
215
  with gr.Column():
216
  speech2text_vi1 = gr.Textbox(label="Vietnamese Text")
217
  english_out_2 = gr.Textbox(label="English Text")
218
-
219
- translate_button_vien_2.click(lambda vi_voice: inference_vien(vi_voice), inputs=vi_audio, outputs=[speech2text_vi1, english_out_2])
220
  gr.Examples(examples=vi_example_voice,
221
- inputs=[vi_audio])
 
222
  with gr.TabItem("Vi-En Realtime Translation"):
223
  with gr.Row():
224
  with gr.Column():
225
- vi_audio = gr.Audio(source="microphone", label="Input Vietnamese Audio", type="file", streaming=True)
226
- translate_button_vien_2 = gr.Button(value="Translate To English")
227
  with gr.Column():
228
  speech2text_vi2 = gr.Textbox(label="Vietnamese Text")
229
  english_out_3 = gr.Textbox(label="English Text")
230
- vi_audio.change(transcribe_vi, [vi_audio, "state_vi", "state_en"], [speech2text_vi2, english_out_3, "state_vi", "state_en"])
231
 
232
 
233
  with gr.Tabs():
@@ -258,11 +258,10 @@ with gr.Blocks() as demo:
258
  with gr.Row():
259
  with gr.Column():
260
  en_audio_2 = gr.Audio(source="microphone", label="Input English Audio", type="filepath", streaming=True)
261
- # translate_button_envi_2 = gr.Button(value="Translate To Vietnamese")
262
  with gr.Column():
263
  speech2text_en2 = gr.Textbox(label="English Text")
264
  vietnamese_out_3 = gr.Textbox(label="Vietnamese Text")
265
- en_audio_2.change(transcribe_en, [en_audio_2, "state_en", "state_vi"], [speech2text_en2, vietnamese_out_3, "state_en", "state_vi"])
266
 
267
  if __name__ == "__main__":
268
  demo.launch()
 
162
  state_vi += beam_search_output + " "
163
  en_text = translate_vi2en(beam_search_output)
164
  state_en += en_text + " "
165
+ return state_vi, state_en
166
 
167
  def transcribe_en(audio, state_en="", state_vi=""):
168
  speech = load_data(audio)
 
179
  state_en += transcription + " "
180
  vi_text = translate_en2vi(transcription)
181
  state_vi += vi_text + " "
182
+ return state_en, state_vi
183
 
184
  """Gradio demo"""
185
 
 
207
  translate_button_vien_1.click(lambda text: translate_vi2en(text), inputs=vietnamese_text, outputs=english_out_1)
208
  gr.Examples(examples=vi_example_text,
209
  inputs=[vietnamese_text])
210
+
211
  with gr.TabItem("Speech2text and Vi-En Translation"):
212
  with gr.Row():
213
  with gr.Column():
214
+ vi_audio_1 = gr.Audio(source="microphone", label="Input Vietnamese Audio", type="file", streaming=False)
215
  translate_button_vien_2 = gr.Button(value="Translate To English")
216
  with gr.Column():
217
  speech2text_vi1 = gr.Textbox(label="Vietnamese Text")
218
  english_out_2 = gr.Textbox(label="English Text")
219
+ translate_button_vien_2.click(lambda vi_voice: inference_vien(vi_voice), inputs=vi_audio_1, outputs=[speech2text_vi1, english_out_2])
 
220
  gr.Examples(examples=vi_example_voice,
221
+ inputs=[vi_audio_1])
222
+
223
  with gr.TabItem("Vi-En Realtime Translation"):
224
  with gr.Row():
225
  with gr.Column():
226
+ vi_audio_2 = gr.Audio(source="microphone", label="Input Vietnamese Audio", type="file", streaming=True)
 
227
  with gr.Column():
228
  speech2text_vi2 = gr.Textbox(label="Vietnamese Text")
229
  english_out_3 = gr.Textbox(label="English Text")
230
+ vi_audio_2.change(transcribe_vi, [vi_audio_2, speech2text_vi2, english_out_3], [speech2text_vi2, english_out_3])
231
 
232
 
233
  with gr.Tabs():
 
258
  with gr.Row():
259
  with gr.Column():
260
  en_audio_2 = gr.Audio(source="microphone", label="Input English Audio", type="filepath", streaming=True)
 
261
  with gr.Column():
262
  speech2text_en2 = gr.Textbox(label="English Text")
263
  vietnamese_out_3 = gr.Textbox(label="Vietnamese Text")
264
+ en_audio_2.change(transcribe_en, [en_audio_2, speech2text_en2, vietnamese_out_3], [speech2text_en2, vietnamese_out_3])
265
 
266
  if __name__ == "__main__":
267
  demo.launch()