Remsky committed on 10 days ago

Commit

9aea310

1 Parent(s): 80c0dbf

Refactor TTSModelV1 to remove JSON voice mappings and load voices from the voices_v1 directory

Files changed (18) hide show

tts_model_v1.py CHANGED Viewed

@@ -1,10 +1,8 @@
 import os
-import json
 import torch
 import numpy as np
 import time
 from typing import Tuple, List
-import soundfile as sf
 from kokoro import KPipeline
 import spaces
@@ -13,10 +11,7 @@ class TTSModelV1:
     def __init__(self):
         self.pipeline = None
-        # Load v1 voice mappings
-        voice_map_path = os.path.join(os.path.dirname(__file__), "voices", "v1_voices.json")
-        with open(voice_map_path) as f:
-            self.voice_map = json.load(f)
     def initialize(self) -> bool:
         """Initialize KPipeline"""
@@ -30,9 +25,14 @@ class TTSModelV1:
             return False
     def list_voices(self) -> List[str]:
-        """List available voices"""
-        # Return all voices from voice map
-        return self.voice_map["american"] + self.voice_map["british"]
     @spaces.GPU(duration=None)  # Duration will be set by the UI
     def generate_speech(self, text: str, voice_names: list[str], speed: float = 1.0, gpu_timeout: int = 60, progress_callback=None, progress_state=None, progress=None) -> Tuple[np.ndarray, float]:

 import os
 import torch
 import numpy as np
 import time
 from typing import Tuple, List
 from kokoro import KPipeline
 import spaces
     def __init__(self):
         self.pipeline = None
+        self.voices_dir = os.path.join(os.path.dirname(__file__), "voices_v1")
     def initialize(self) -> bool:
         """Initialize KPipeline"""
             return False
     def list_voices(self) -> List[str]:
+        """List available voices from voices_v1 directory"""
+        voices = []
+        if os.path.exists(self.voices_dir):
+            for file in os.listdir(self.voices_dir):
+                if file.endswith(".pt"):
+                    voice_name = file[:-3]
+                    voices.append(voice_name)
+        return sorted(voices)
     @spaces.GPU(duration=None)  # Duration will be set by the UI
     def generate_speech(self, text: str, voice_names: list[str], speed: float = 1.0, gpu_timeout: int = 60, progress_callback=None, progress_state=None, progress=None) -> Tuple[np.ndarray, float]:

voices/v1_voices.json DELETED Viewed

@@ -1,32 +0,0 @@
-{
-    "american": [
-        "af_alloy",
-        "af_aoede",
-        "af_bella",
-        "af_jessica",
-        "af_kore",
-        "af_nicole",
-        "af_nova",
-        "af_river",
-        "af_sarah",
-        "af_sky",
-        "am_adam",
-        "am_echo",
-        "am_eric",
-        "am_fenrir",
-        "am_liam",
-        "am_michael",
-        "am_onyx",
-        "am_puck"
-    ],
-    "british": [
-        "bf_alice",
-        "bf_emma",
-        "bf_isabella",
-        "bf_lily",
-        "bm_daniel",
-        "bm_fable",
-        "bm_george",
-        "bm_lewis"
-    ]
-}

voices_v1/af_alloy.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d877149dd8b348fbad12e5845b7e43d975390e9f3b68a811d1d86168bef5aa3
+size 523425

voices_v1/af_aoede.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c03bd1a4c3716c2d8eaa3d50022f62d5c31cfbd6e15933a00b17fefe13841cc4
+size 523425

voices_v1/af_jessica.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdfdccb8cc975aa34ee6b89642963b0064237675de0e41a30ae64cc958dd4e87
+size 523435

voices_v1/af_kore.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8bfbc512321c3db49dff984ac675fa5ac7eaed5a96cc31104d3a9080e179d69d
+size 523420

voices_v1/af_nova.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0233676ddc21908c37a1f102f6b88a59e4e5c1bd764983616eb9eda629dbcd2
+size 523420

voices_v1/af_river.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e149459bd9c084416b74756b9bd3418256a8b839088abb07d463730c369dab8f
+size 523425

voices_v1/am_echo.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8bcfdc852bc985fb45c396c561e571ffb9183930071f962f1b50df5c97b161e8
+size 523420

voices_v1/am_eric.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ada66f0eefff34ec921b1d7474d7ac8bec00cd863c170f1c534916e9b8212aae
+size 523420

voices_v1/am_fenrir.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:98e507eca1db08230ae3b6232d59c10aec9630022d19accac4f5d12fcec3c37a
+size 523430

voices_v1/am_liam.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c82550757ddb31308b97f30040dda8c2d609a9e2de6135848d0a948368138518
+size 523420

voices_v1/am_onyx.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8452be16cd0f6da7b4579eaf7b1e4506e92524882053d86d72b96b9a7fed584
+size 523420

voices_v1/am_puck.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:dd1d8973f4ce4b7d8ae407c77a435f485dabc052081b80ea75c4f30b84f36223
+size 523420

voices_v1/bf_alice.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d292651b6af6c0d81705c2580dcb4463fccc0ff7b8d618a471dbb4e45655b3f3
+size 523425

voices_v1/bf_lily.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e09c2e481e2d53004d7e5ae7d3a325369e130a6f45c35a6002de75084be9285
+size 523420

voices_v1/bm_daniel.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc3fce4e9c12ed4dbc8fa9680cfe51ee190a96444ce7c3ad647549a30823fc5d
+size 523430

voices_v1/bm_fable.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d44935f3135257a9064df99f007fc1342ff1aa767552b4a4fa4c3b2e6e59079c
+size 523425