Spaces:

Gregniuki
/

f5-tts_Polish_English_German

Running on Zero

App Files Community

Gregniuki committed 10 days ago

Commit

42898bb

verified ·

1 Parent(s): 1be1cf6

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -13

app.py CHANGED Viewed

@@ -129,15 +129,15 @@ chat_tokenizer_state = None
 F5TTS_model_cfg = dict(dim=1024, depth=22, heads=16, ff_mult=2, text_dim=512, conv_layers=4)
 E2TTS_model_cfg = dict(dim=1024, depth=24, heads=16, ff_mult=4)
 F5TTS_ema_model = load_custom(
-    "hf://Gregniuki/F5-tts_English_German_Polish/English/model_222600.pt", "", F5TTS_model_cfg
-)
-E2TTS_ema_model = load_custom(
     "hf://Gregniuki/F5-tts_English_German_Polish/multi/model_300000.pt", "", F5TTS_model_cfg
 )
-E2TTS_ema_model2 = load_custom(
-    "hf://Gregniuki/F5-tts_English_German_Polish/Polish/model_500000.pt", "", F5TTS_model_cfg
-)
@@ -222,12 +222,12 @@ def text_to_ipa(text, language='en-gb'):
 @gpu_decorator
 def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence, cross_fade_duration=0.15, progress=gr.Progress(), language='en-gb'):
-    if exp_name == "English":
         ema_model = F5TTS_ema_model
-    elif exp_name == "Polish":
-        ema_model = E2TTS_ema_model
-    elif exp_name == "Deutsch":
-        ema_model = E2TTS_ema_model2
     #ref_audio, ref_text = preprocess_ref_audio_text(ref_audio, ref_text, show_info=show_info)
@@ -556,7 +556,7 @@ with gr.Blocks() as app_tts:
     ref_audio_input = gr.Audio(label="Reference Audio", type="filepath")
     gen_text_input = gr.Textbox(label="Text to Generate", lines=10)
     model_choice = gr.Radio(
-        choices=["English", "Polish", "Deutsch"], label="Choose TTS Model", value="English"
     )
     language_choice = gr.Dropdown(
         choices=["pl", "de", "en-us", "en-gb", "uk", "ru"], label="Choose Language", value="en-gb"
@@ -753,7 +753,7 @@ with gr.Blocks() as app_emotional:
     # Model choice
     model_choice_emotional = gr.Radio(
-        choices=["English","Polish","Deutsch"], label="Choose TTS Model", value="English"
     )
     with gr.Accordion("Advanced Settings", open=False):

 F5TTS_model_cfg = dict(dim=1024, depth=22, heads=16, ff_mult=2, text_dim=512, conv_layers=4)
 E2TTS_model_cfg = dict(dim=1024, depth=24, heads=16, ff_mult=4)
+#F5TTS_ema_model = load_custom(
+#    "hf://Gregniuki/F5-tts_English_German_Polish/English/model_222600.pt", "", F5TTS_model_cfg
+#)
 F5TTS_ema_model = load_custom(
     "hf://Gregniuki/F5-tts_English_German_Polish/multi/model_300000.pt", "", F5TTS_model_cfg
 )
+#E2TTS_ema_model2 = load_custom(
+#    "hf://Gregniuki/F5-tts_English_German_Polish/Polish/model_500000.pt", "", F5TTS_model_cfg
+#)
 @gpu_decorator
 def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence, cross_fade_duration=0.15, progress=gr.Progress(), language='en-gb'):
+    if exp_name == "Multi":
         ema_model = F5TTS_ema_model
+   # elif exp_name == "Polish":
+   #     ema_model = E2TTS_ema_model
+   # elif exp_name == "Deutsch":
+  #      ema_model = E2TTS_ema_model2
     #ref_audio, ref_text = preprocess_ref_audio_text(ref_audio, ref_text, show_info=show_info)
     ref_audio_input = gr.Audio(label="Reference Audio", type="filepath")
     gen_text_input = gr.Textbox(label="Text to Generate", lines=10)
     model_choice = gr.Radio(
+        choices=["Multi"], label="Choose TTS Model", value="Multi"
     )
     language_choice = gr.Dropdown(
         choices=["pl", "de", "en-us", "en-gb", "uk", "ru"], label="Choose Language", value="en-gb"
     # Model choice
     model_choice_emotional = gr.Radio(
+        choices=["Multi"], label="Choose TTS Model", value="Multi"
     )
     with gr.Accordion("Advanced Settings", open=False):