f5-tts_french

Runtime error

App Files Files Community

RASPIAUDIO committed on Nov 13, 2024

Commit

3e1ea4f

1 Parent(s): 62a0088

French version 1

Browse files

Files changed (1) hide show

app.py +3 -9

app.py CHANGED Viewed

@@ -92,7 +92,7 @@ F5TTS_model_cfg = dict(
 E2TTS_model_cfg = dict(dim=1024, depth=24, heads=16, ff_mult=4)
 F5TTS_ema_model = load_model(
-    "Gregniuki", "F5-tts_English_German_Polish", "Polish", DiT, F5TTS_model_cfg, 500000
 )
 #E2TTS_ema_model = load_model(
 #    "SWivid", "F5-TTS", "E2TTS_Base", UNetT, E2TTS_model_cfg, 1200000
@@ -759,7 +759,7 @@ This is a local web UI for F5 TTS with advanced batch processing support. This a
 * [F5-TTS](https://arxiv.org/abs/2410.06885) (A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching)
 * [E2 TTS](https://arxiv.org/abs/2406.18009) (Embarrassingly Easy Fully Non-Autoregressive Zero-Shot TTS)
-The checkpoint support Polish English and German.
 Generations using CPU takes usually 2-3 minutes
@@ -768,13 +768,7 @@ If you're having issues, try converting your reference audio to WAV or MP3, clip
 **NOTE: Reference text will be automatically transcribed with Whisper if not provided. For best results, keep your reference clips short (<15s). Ensure the audio is fully uploaded before generating.**
 """
     )
-    gr.HTML(
-        """
-        <a href="https://www.buymeacoffee.com/gregniuki" target="_blank">
-            <img src="https://cdn.buymeacoffee.com/buttons/v2/default-yellow.png" alt="Buy Me A Coffee" style="height: 60px !important;width: 217px !important;">
-        </a>
-        """
-    )
     gr.TabbedInterface([app_tts, app_podcast, app_emotional, app_credits], ["TTS", "Podcast", "Multi-Style", "Credits"])
 @click.command()

 E2TTS_model_cfg = dict(dim=1024, depth=24, heads=16, ff_mult=4)
 F5TTS_ema_model = load_model(
+    "RASPIAUDIO", "F5-French-MixedSpeakers-reduced", "model_last_reduced.pt", DiT, F5TTS_model_cfg, 500000
 )
 #E2TTS_ema_model = load_model(
 #    "SWivid", "F5-TTS", "E2TTS_Base", UNetT, E2TTS_model_cfg, 1200000
 * [F5-TTS](https://arxiv.org/abs/2410.06885) (A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching)
 * [E2 TTS](https://arxiv.org/abs/2406.18009) (Embarrassingly Easy Fully Non-Autoregressive Zero-Shot TTS)
+The checkpoint support French
 Generations using CPU takes usually 2-3 minutes
 **NOTE: Reference text will be automatically transcribed with Whisper if not provided. For best results, keep your reference clips short (<15s). Ensure the audio is fully uploaded before generating.**
 """
     )
     gr.TabbedInterface([app_tts, app_podcast, app_emotional, app_credits], ["TTS", "Podcast", "Multi-Style", "Credits"])
 @click.command()