Rogerjs committed on
Commit
d44c6d5
·
verified ·
1 Parent(s): 406b7b8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -3
app.py CHANGED
@@ -4,14 +4,18 @@ import os
4
  import time
5
  import torch
6
  from scipy.io import wavfile
 
7
 
8
  # Bark imports
9
  from bark import generate_audio, SAMPLE_RATE
10
  from bark.generation import preload_models
11
 
12
  # Hugging Face Transformers
13
- from transformers import AutoModelForTextToSpeech, AutoProcessor, AutoTokenizer
14
- from transformers import SpeechT5HifiGan, SpeechT5ForTextToSpeech, SpeechT5Processor
 
 
 
15
 
16
  class VoiceSynthesizer:
17
  def __init__(self):
@@ -50,7 +54,7 @@ class VoiceSynthesizer:
50
  vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
51
 
52
  # Load speaker embeddings
53
- embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
54
  speaker_embeddings = torch.tensor(embeddings_dataset[0]["xvector"]).unsqueeze(0)
55
 
56
  return {
 
4
  import time
5
  import torch
6
  from scipy.io import wavfile
7
+ import datasets
8
 
9
  # Bark imports
10
  from bark import generate_audio, SAMPLE_RATE
11
  from bark.generation import preload_models
12
 
13
  # Hugging Face Transformers
14
+ from transformers import (
15
+ SpeechT5HifiGan,
16
+ SpeechT5ForTextToSpeech,
17
+ SpeechT5Processor
18
+ )
19
 
20
  class VoiceSynthesizer:
21
  def __init__(self):
 
54
  vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
55
 
56
  # Load speaker embeddings
57
+ embeddings_dataset = datasets.load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
58
  speaker_embeddings = torch.tensor(embeddings_dataset[0]["xvector"]).unsqueeze(0)
59
 
60
  return {