Spaces:

AlexK-PL
/

Tacotron2_GST_eng

Sleeping

AlexK-PL committed on Sep 5, 2023

Commit

cadb9c5

1 Parent(s): eec8d3d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,10 +10,8 @@ from melgan.utils.hparams import load_hparam
 import torch
 import numpy as np
-import random
 from matplotlib import pyplot as plt
-from matplotlib import gridspec
 # Adjust vertical spacing between subplots
 plt.subplots_adjust(hspace=0.15)  # You can adjust the value as needed
@@ -87,21 +85,11 @@ def synthesize(text, gst_1, gst_2, gst_3):
     fig_mel = plot_spec_align(mel_outputs_postnet, alignments)
     return (22050, audio_numpy), fig_mel  # fig_align
-def randomize_style_weights():
-    rand_weight_1 = random.randrange(0.3, 0.45, 0.01)
-    rand_weight_2 = random.randrange(0.3, 0.45, 0.01)
-    rand_weight_3 = 1.0 - (rand_weight_1 + rand_weight_2)
-    return rand_weight_1, rand_weight_2, rand_weight_3
-w1, w2, w3 = randomize_style_weights()
-iface = gr.Interface(fn=synthesize, inputs=[gr.Textbox(label="Input Text"), gr.Slider(0.2, 0.45, label="First style token weight:", value=w1),
-                                            gr.Slider(0.2, 0.45, label="Second style token weight:", value=w2),
-                                            gr.Slider(0.2, 0.45, label="Third style token weight:",value=w3)],
                      outputs=[gr.Audio(label="Generated Speech", type="numpy"), gr.Plot(label="Output"),],
                      title="Single-Head Attention Tacotron2 with Style Tokens", description=DESCRIPTION)
 iface.launch()

 import torch
 import numpy as np
 from matplotlib import pyplot as plt
 # Adjust vertical spacing between subplots
 plt.subplots_adjust(hspace=0.15)  # You can adjust the value as needed
     fig_mel = plot_spec_align(mel_outputs_postnet, alignments)
     return (22050, audio_numpy), fig_mel  # fig_align
+iface = gr.Interface(fn=synthesize, inputs=[gr.Textbox(label="Input Text"), gr.Slider(0.2, 0.45, label="First style token weight:", value=0.4),
+                                            gr.Slider(0.2, 0.45, label="Second style token weight:", value=0.26),
+                                            gr.Slider(0.2, 0.45, label="Third style token weight:", value=0.33)],
                      outputs=[gr.Audio(label="Generated Speech", type="numpy"), gr.Plot(label="Output"),],
                      title="Single-Head Attention Tacotron2 with Style Tokens", description=DESCRIPTION)
 iface.launch()