Gregniuki committed on
Commit
f914a1f
·
verified ·
1 Parent(s): dc292c6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -347,7 +347,9 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
347
  # Remove silence
348
  if remove_silence:
349
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
350
- sf.write(f.name, final_wave, target_sample_rate)
 
 
351
  aseg = AudioSegment.from_file(f.name)
352
  non_silent_segs = silence.split_on_silence(aseg, min_silence_len=1000, silence_thresh=-50, keep_silence=500)
353
  non_silent_wave = AudioSegment.silent(duration=0)
@@ -775,13 +777,13 @@ with gr.Blocks() as app_emotional:
775
 
776
  # generated_audio_segments.append(audio_data)
777
  # Ensure audio_data is float32
778
- audio_data = audio_data.astype(np.float32)
779
 
780
  generated_audio_segments.append(audio_data)
781
 
782
  # Concatenate all audio segments
783
  if generated_audio_segments:
784
- final_audio_data = np.concatenate(generated_audio_segments).astype(np.float32)
785
  return (sr, final_audio_data)
786
  else:
787
  gr.Warning("No audio generated.")
 
347
  # Remove silence
348
  if remove_silence:
349
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
350
+ # Convert to float32 before writing
351
+ final_wave_float32 = final_wave.astype(np.float32)
352
+ sf.write(f.name, final_wave_float32, target_sample_rate)
353
  aseg = AudioSegment.from_file(f.name)
354
  non_silent_segs = silence.split_on_silence(aseg, min_silence_len=1000, silence_thresh=-50, keep_silence=500)
355
  non_silent_wave = AudioSegment.silent(duration=0)
 
777
 
778
  # generated_audio_segments.append(audio_data)
779
  # Ensure audio_data is float32
780
+ #audio_data = audio_data.astype(np.float32)
781
 
782
  generated_audio_segments.append(audio_data)
783
 
784
  # Concatenate all audio segments
785
  if generated_audio_segments:
786
+ final_audio_data = np.concatenate(generated_audio_segments)#.astype(np.float32)
787
  return (sr, final_audio_data)
788
  else:
789
  gr.Warning("No audio generated.")