Gregniuki committed on
Commit
22e294e
·
verified ·
1 Parent(s): 4feb122

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -61,7 +61,7 @@ print(f"Using device: {device}, dtype: {dtype}")
61
  pipe = pipeline(
62
  "automatic-speech-recognition",
63
  model="openai/whisper-large-v3-turbo",
64
- torch_dtype=torch.float32,
65
  device=device,
66
  )
67
  #vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
@@ -344,7 +344,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
344
  audio, sr = torchaudio.load(ref_audio)
345
 
346
  # Use the new chunk_text function to split gen_text
347
- max_chars = int(len(ref_text.encode('utf-8')) / (audio.shape[-1] / sr) * (28 - audio.shape[-1] / sr))
348
  gen_text_batches = chunk_text(gen_text, max_chars=135)
349
  print('ref_text', ref_text)
350
  for i, batch_text in enumerate(gen_text_batches):
 
61
  pipe = pipeline(
62
  "automatic-speech-recognition",
63
  model="openai/whisper-large-v3-turbo",
64
+ torch_dtype=dtype,
65
  device=device,
66
  )
67
  #vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
 
344
  audio, sr = torchaudio.load(ref_audio)
345
 
346
  # Use the new chunk_text function to split gen_text
347
+ max_chars = int(len(ref_text.encode('utf-8')) / (audio.shape[-1] / sr) * (25 - audio.shape[-1] / sr))
348
  gen_text_batches = chunk_text(gen_text, max_chars=135)
349
  print('ref_text', ref_text)
350
  for i, batch_text in enumerate(gen_text_batches):