Solo448 commited on
Commit
6341f08
·
verified ·
1 Parent(s): d8bd91c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -7
app.py CHANGED
@@ -19,6 +19,13 @@ speaker_model = EncoderClassifier.from_hparams(
19
  savedir=os.path.join("/tmp", "speechbrain/spkrec-xvect-voxceleb")
20
  )
21
 
 
 
 
 
 
 
 
22
  # Load a sample from the dataset for speaker embedding
23
  try:
24
  dataset = load_dataset("Sajjo/bangala_data_v3", split="train", trust_remote_code=True)
@@ -30,13 +37,6 @@ except Exception as e:
30
  # Use a random speaker embedding as fallback
31
  speaker_embedding = torch.randn(1, 512)
32
 
33
- def create_speaker_embedding(waveform):
34
- with torch.no_grad():
35
- speaker_embeddings = speaker_model.encode_batch(torch.tensor(waveform))
36
- speaker_embeddings = torch.nn.functional.normalize(speaker_embeddings, dim=2)
37
- speaker_embeddings = speaker_embeddings.squeeze().cpu().numpy()
38
- return speaker_embeddings
39
-
40
  def text_to_speech(text):
41
  # Clean up text
42
  replacements = [
 
19
  savedir=os.path.join("/tmp", "speechbrain/spkrec-xvect-voxceleb")
20
  )
21
 
22
+ def create_speaker_embedding(waveform):
23
+ with torch.no_grad():
24
+ speaker_embeddings = speaker_model.encode_batch(torch.tensor(waveform))
25
+ speaker_embeddings = torch.nn.functional.normalize(speaker_embeddings, dim=2)
26
+ speaker_embeddings = speaker_embeddings.squeeze().cpu().numpy()
27
+ return speaker_embeddings
28
+
29
  # Load a sample from the dataset for speaker embedding
30
  try:
31
  dataset = load_dataset("Sajjo/bangala_data_v3", split="train", trust_remote_code=True)
 
37
  # Use a random speaker embedding as fallback
38
  speaker_embedding = torch.randn(1, 512)
39
 
 
 
 
 
 
 
 
40
  def text_to_speech(text):
41
  # Clean up text
42
  replacements = [