Gregniuki committed on
Commit
745410d
·
verified ·
1 Parent(s): e6a69c1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -372,7 +372,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
372
  gr.Info("Converting audio...")
373
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
374
  aseg = AudioSegment.from_file(ref_audio_orig)
375
-
376
  non_silent_segs = silence.split_on_silence(
377
  aseg, min_silence_len=1000, silence_thresh=-42, keep_silence=1000
378
  )
@@ -381,7 +381,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
381
  non_silent_wave += non_silent_seg
382
 
383
  aseg = non_silent_wave
384
- aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=100)
385
 
386
  audio_duration = len(aseg)
387
  if audio_duration > 8000:
@@ -417,7 +417,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
417
  # Use the new chunk_text function to split gen_text
418
  max_chars = int(0.5 * (len(ref_text.encode('utf-8')) / (audio.shape[-1] / sr) * (15 - audio.shape[-1] / sr )))
419
  print(f"text: {gen_text} ")
420
- gen_text_batches = chunk_text(gen_text, max_chars=max_chars)
421
  print('ref_text', ref_text)
422
  for i, batch_text in enumerate(gen_text_batches):
423
  print(f'gen_text {i}', batch_text)
 
372
  gr.Info("Converting audio...")
373
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
374
  aseg = AudioSegment.from_file(ref_audio_orig)
375
+ aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=50)
376
  non_silent_segs = silence.split_on_silence(
377
  aseg, min_silence_len=1000, silence_thresh=-42, keep_silence=1000
378
  )
 
381
  non_silent_wave += non_silent_seg
382
 
383
  aseg = non_silent_wave
384
+
385
 
386
  audio_duration = len(aseg)
387
  if audio_duration > 8000:
 
417
  # Use the new chunk_text function to split gen_text
418
  max_chars = int(0.5 * (len(ref_text.encode('utf-8')) / (audio.shape[-1] / sr) * (15 - audio.shape[-1] / sr )))
419
  print(f"text: {gen_text} ")
420
+ gen_text_batches = chunk_text(gen_text, max_chars=100)
421
  print('ref_text', ref_text)
422
  for i, batch_text in enumerate(gen_text_batches):
423
  print(f'gen_text {i}', batch_text)