adowu committed on
Commit
29f6b1d
·
verified ·
1 Parent(s): d3b49fc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -2
app.py CHANGED
@@ -4,6 +4,8 @@ import torch
4
  from TTS.api import TTS
5
  import os
6
  import json
 
 
7
 
8
  os.environ["COQUI_TOS_AGREED"] = "1"
9
 
@@ -16,19 +18,26 @@ def clone(text, audio):
16
  # Generowanie mowy
17
  wav = tts.tts(text=text, speaker_wav=audio, language="pl")
18
 
19
- # Zapisywanie pliku audio
20
- tts.save_wav(wav, file_path="./output.wav")
 
21
 
22
  # Uzyskanie informacji o fonemach
23
  phonemes_info = tts.synthesizer.get_phonemes(text, language="pl")
24
 
25
  # Przygotowanie informacji o fonemach
26
  phonemes_data = []
 
27
  for phoneme, duration in phonemes_info:
 
 
28
  phonemes_data.append({
29
  "phoneme": phoneme,
 
 
30
  "duration": float(duration)
31
  })
 
32
 
33
  # Zapisywanie informacji o fonemach do pliku JSON
34
  with open("./phonemes_info.json", "w", encoding="utf-8") as f:
 
4
  from TTS.api import TTS
5
  import os
6
  import json
7
+ import scipy.io.wavfile as wavfile
8
+ import numpy as np
9
 
10
  os.environ["COQUI_TOS_AGREED"] = "1"
11
 
 
18
  # Generowanie mowy
19
  wav = tts.tts(text=text, speaker_wav=audio, language="pl")
20
 
21
+ # Konwersja do numpy array i zapisanie jako plik WAV
22
+ wav_np = np.array(wav)
23
+ wavfile.write("./output.wav", 24000, (wav_np * 32767).astype(np.int16))
24
 
25
  # Uzyskanie informacji o fonemach
26
  phonemes_info = tts.synthesizer.get_phonemes(text, language="pl")
27
 
28
  # Przygotowanie informacji o fonemach
29
  phonemes_data = []
30
+ cumulative_duration = 0
31
  for phoneme, duration in phonemes_info:
32
+ start_time = cumulative_duration
33
+ end_time = start_time + duration
34
  phonemes_data.append({
35
  "phoneme": phoneme,
36
+ "start": float(start_time),
37
+ "end": float(end_time),
38
  "duration": float(duration)
39
  })
40
+ cumulative_duration = end_time
41
 
42
  # Zapisywanie informacji o fonemach do pliku JSON
43
  with open("./phonemes_info.json", "w", encoding="utf-8") as f: