Spaces:

ovieyra21
/

speech-to-speech-translation-course

Running

ovieyra21 committed on Mar 13, 2024

Commit

636c11b

verified ·

1 Parent(s): e7b531f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,7 +10,6 @@ device = "cuda:0" if torch.cuda.is_available() else "cpu"
 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-base", device=device)
-forced_decoder_ids = processor.get_decoder_prompt_ids(language="spanish", task="translate")
 # load text-to-speech checkpoint and speaker embeddings
@@ -27,6 +26,9 @@ def translate(audio):
     outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
     return outputs["text"]
 def synthesise(text):
     inputs = processor(text=text, return_tensors="pt")

 # load speech translation checkpoint
 asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-base", device=device)
 # load text-to-speech checkpoint and speaker embeddings
     outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
     return outputs["text"]
+    set:"transcribe""language"
+    generate_kwargs={"task": "transcribe", "language": "es"}
 def synthesise(text):
     inputs = processor(text=text, return_tensors="pt")