Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -172,6 +172,7 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
|
|
172 |
elif exp_name == "Deutsh":
|
173 |
ema_model = E2TTS_ema_model2
|
174 |
#ref_audio, ref_text = preprocess_ref_audio_text(ref_audio, ref_text, show_info=show_info)
|
|
|
175 |
|
176 |
audio, sr = ref_audio
|
177 |
if audio.shape[0] > 1:
|
@@ -183,7 +184,7 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
|
|
183 |
if sr != target_sample_rate:
|
184 |
resampler = torchaudio.transforms.Resample(sr, target_sample_rate)
|
185 |
audio = resampler(audio)
|
186 |
-
|
187 |
|
188 |
audio = audio.to(device)
|
189 |
|
|
|
172 |
elif exp_name == "Deutsh":
|
173 |
ema_model = E2TTS_ema_model2
|
174 |
#ref_audio, ref_text = preprocess_ref_audio_text(ref_audio, ref_text, show_info=show_info)
|
175 |
+
ref_audio = remove_silence_edges(ref_audio) + AudioSegment.silent(duration=50)
|
176 |
|
177 |
audio, sr = ref_audio
|
178 |
if audio.shape[0] > 1:
|
|
|
184 |
if sr != target_sample_rate:
|
185 |
resampler = torchaudio.transforms.Resample(sr, target_sample_rate)
|
186 |
audio = resampler(audio)
|
187 |
+
|
188 |
|
189 |
audio = audio.to(device)
|
190 |
|