Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -6,7 +6,7 @@ from xcodec2.modeling_xcodec2 import XCodec2Model
|
|
6 |
import torchaudio
|
7 |
import gradio as gr
|
8 |
|
9 |
-
llasa_model_id = 'OmniAICreator/Galgame-Llasa-
|
10 |
|
11 |
tokenizer = AutoTokenizer.from_pretrained(llasa_model_id)
|
12 |
|
@@ -151,12 +151,12 @@ def infer(sample_audio_path, target_text, temperature, top_p, progress=gr.Progr
|
|
151 |
return (16000, gen_wav[0, 0, :].cpu().numpy())
|
152 |
|
153 |
with gr.Blocks() as app_tts:
|
154 |
-
gr.Markdown("# Galgame Llasa
|
155 |
ref_audio_input = gr.Audio(label="Reference Audio", type="filepath")
|
156 |
gen_text_input = gr.Textbox(label="Text to Generate", lines=10)
|
157 |
|
158 |
with gr.Row():
|
159 |
-
temperature_slider = gr.Slider(minimum=0.0, maximum=1.0, value=0.
|
160 |
top_p_slider = gr.Slider(minimum=0.0, maximum=1.0, value=1.0, step=0.05, label="Top-p")
|
161 |
|
162 |
generate_btn = gr.Button("Synthesize", variant="primary")
|
@@ -186,9 +186,9 @@ with gr.Blocks() as app_credits:
|
|
186 |
with gr.Blocks() as app:
|
187 |
gr.Markdown(
|
188 |
"""
|
189 |
-
# Galgame Llasa
|
190 |
|
191 |
-
This is a local web UI for Galgame Llasa
|
192 |
|
193 |
The model is fine-tuned by Japanese audio data.
|
194 |
|
|
|
6 |
import torchaudio
|
7 |
import gradio as gr
|
8 |
|
9 |
+
llasa_model_id = 'OmniAICreator/Galgame-Llasa-3B'
|
10 |
|
11 |
tokenizer = AutoTokenizer.from_pretrained(llasa_model_id)
|
12 |
|
|
|
151 |
return (16000, gen_wav[0, 0, :].cpu().numpy())
|
152 |
|
153 |
with gr.Blocks() as app_tts:
|
154 |
+
gr.Markdown("# Galgame Llasa 3B")
|
155 |
ref_audio_input = gr.Audio(label="Reference Audio", type="filepath")
|
156 |
gen_text_input = gr.Textbox(label="Text to Generate", lines=10)
|
157 |
|
158 |
with gr.Row():
|
159 |
+
temperature_slider = gr.Slider(minimum=0.0, maximum=1.0, value=0.8, step=0.05, label="Temperature")
|
160 |
top_p_slider = gr.Slider(minimum=0.0, maximum=1.0, value=1.0, step=0.05, label="Top-p")
|
161 |
|
162 |
generate_btn = gr.Button("Synthesize", variant="primary")
|
|
|
186 |
with gr.Blocks() as app:
|
187 |
gr.Markdown(
|
188 |
"""
|
189 |
+
# Galgame Llasa 3B
|
190 |
|
191 |
+
This is a local web UI for Galgame Llasa 3B TTS model.
|
192 |
|
193 |
The model is fine-tuned by Japanese audio data.
|
194 |
|