Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -52,7 +52,7 @@ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
|
52 |
target_sample_rate = 24000
|
53 |
n_mel_channels = 100
|
54 |
hop_length = 256
|
55 |
-
target_rms = 0.
|
56 |
nfe_step = 8 # 16, 32
|
57 |
cfg_strength = 2.0
|
58 |
ode_method = "euler"
|
@@ -274,13 +274,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
|
|
274 |
|
275 |
if not ref_text.strip():
|
276 |
gr.Info("No reference text provided, transcribing reference audio...")
|
277 |
-
ref_text =
|
278 |
-
ref_audio,
|
279 |
-
chunk_length_s=30,
|
280 |
-
batch_size=128,
|
281 |
-
generate_kwargs={"task": "transcribe"},
|
282 |
-
return_timestamps=False,
|
283 |
-
)["text"].strip()
|
284 |
gr.Info("Finished transcription")
|
285 |
else:
|
286 |
gr.Info("Using custom reference text...")
|
|
|
52 |
target_sample_rate = 24000
|
53 |
n_mel_channels = 100
|
54 |
hop_length = 256
|
55 |
+
target_rms = 0.1
|
56 |
nfe_step = 8 # 16, 32
|
57 |
cfg_strength = 2.0
|
58 |
ode_method = "euler"
|
|
|
274 |
|
275 |
if not ref_text.strip():
|
276 |
gr.Info("No reference text provided, transcribing reference audio...")
|
277 |
+
ref_text = gen_text
|
|
|
|
|
|
|
|
|
|
|
|
|
278 |
gr.Info("Finished transcription")
|
279 |
else:
|
280 |
gr.Info("Using custom reference text...")
|