Spaces:

nkalra0123
/

Kokoro_onnx

Runtime error

App Files Files Community

nkalra0123 commited on Jan 12

Commit

9132718

verified ·

1 Parent(s): 393a7f5

Upload folder using huggingface_hub

Browse files

Files changed (10) hide show

.gitattributes +1 -0
.gradio/certificate.pem +31 -0
README.md +13 -7
__pycache__/gradio.cpython-310.pyc +0 -0
audio.wav +0 -0
gr-demo.py +12 -0
gradio-audio.py +61 -0
kokoro-v0_19.onnx +3 -0
requirements.txt +119 -0
voices.json +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+voices.json filter=lfs diff=lfs merge=lfs -text

.gradio/certificate.pem ADDED Viewed

	@@ -0,0 +1,31 @@

+-----BEGIN CERTIFICATE-----
+MIIFazCCA1OgAwIBAgIRAIIQz7DSQONZRGPgu2OCiwAwDQYJKoZIhvcNAQELBQAw
+TzELMAkGA1UEBhMCVVMxKTAnBgNVBAoTIEludGVybmV0IFNlY3VyaXR5IFJlc2Vh
+cmNoIEdyb3VwMRUwEwYDVQQDEwxJU1JHIFJvb3QgWDEwHhcNMTUwNjA0MTEwNDM4
+WhcNMzUwNjA0MTEwNDM4WjBPMQswCQYDVQQGEwJVUzEpMCcGA1UEChMgSW50ZXJu
+ZXQgU2VjdXJpdHkgUmVzZWFyY2ggR3JvdXAxFTATBgNVBAMTDElTUkcgUm9vdCBY
+MTCCAiIwDQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAK3oJHP0FDfzm54rVygc
+h77ct984kIxuPOZXoHj3dcKi/vVqbvYATyjb3miGbESTtrFj/RQSa78f0uoxmyF+
+0TM8ukj13Xnfs7j/EvEhmkvBioZxaUpmZmyPfjxwv60pIgbz5MDmgK7iS4+3mX6U
+A5/TR5d8mUgjU+g4rk8Kb4Mu0UlXjIB0ttov0DiNewNwIRt18jA8+o+u3dpjq+sW
+T8KOEUt+zwvo/7V3LvSye0rgTBIlDHCNAymg4VMk7BPZ7hm/ELNKjD+Jo2FR3qyH
+B5T0Y3HsLuJvW5iB4YlcNHlsdu87kGJ55tukmi8mxdAQ4Q7e2RCOFvu396j3x+UC
+B5iPNgiV5+I3lg02dZ77DnKxHZu8A/lJBdiB3QW0KtZB6awBdpUKD9jf1b0SHzUv
+KBds0pjBqAlkd25HN7rOrFleaJ1/ctaJxQZBKT5ZPt0m9STJEadao0xAH0ahmbWn
+OlFuhjuefXKnEgV4We0+UXgVCwOPjdAvBbI+e0ocS3MFEvzG6uBQE3xDk3SzynTn
+jh8BCNAw1FtxNrQHusEwMFxIt4I7mKZ9YIqioymCzLq9gwQbooMDQaHWBfEbwrbw
+qHyGO0aoSCqI3Haadr8faqU9GY/rOPNk3sgrDQoo//fb4hVC1CLQJ13hef4Y53CI
+rU7m2Ys6xt0nUW7/vGT1M0NPAgMBAAGjQjBAMA4GA1UdDwEB/wQEAwIBBjAPBgNV
+HRMBAf8EBTADAQH/MB0GA1UdDgQWBBR5tFnme7bl5AFzgAiIyBpY9umbbjANBgkq
+hkiG9w0BAQsFAAOCAgEAVR9YqbyyqFDQDLHYGmkgJykIrGF1XIpu+ILlaS/V9lZL
+ubhzEFnTIZd+50xx+7LSYK05qAvqFyFWhfFQDlnrzuBZ6brJFe+GnY+EgPbk6ZGQ
+3BebYhtF8GaV0nxvwuo77x/Py9auJ/GpsMiu/X1+mvoiBOv/2X/qkSsisRcOj/KK
+NFtY2PwByVS5uCbMiogziUwthDyC3+6WVwW6LLv3xLfHTjuCvjHIInNzktHCgKQ5
+ORAzI4JMPJ+GslWYHb4phowim57iaztXOoJwTdwJx4nLCgdNbOhdjsnvzqvHu7Ur
+TkXWStAmzOVyyghqpZXjFaH3pO3JLF+l+/+sKAIuvtd7u+Nxe5AW0wdeRlN8NwdC
+jNPElpzVmbUq4JUagEiuTDkHzsxHpFKVK7q4+63SM1N95R1NbdWhscdCb+ZAJzVc
+oyi3B43njTOQ5yOf+1CceWxG1bQVs5ZufpsMljq4Ui0/1lvh+wjChP4kqKOJ2qxq
+4RgqsahDYVvTH9w7jXbyLeiNdd8XM2w9U/t7y0Ff/9yi0GE44Za4rF2LN9d11TPA
+mRGunUHBcnWEvgJBQl9nJEiU0Zsnvgc/ubhPgXRR4Xq37Z0j4r7g1SgEEzwxA57d
+emyPxgcYxn/eR44/KJ4EBs+lVDR3veyJm+kXQ99b21/+jh5Xos1AnX5iItreGCc=
+-----END CERTIFICATE-----

README.md CHANGED Viewed

@@ -1,12 +1,18 @@
 ---
-title: Kokoro Onnx
-emoji: 🐠
-colorFrom: indigo
-colorTo: indigo
 sdk: gradio
 sdk_version: 5.12.0
-app_file: app.py
-pinned: false
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Kokoro_onnx
+app_file: gradio-audio.py
 sdk: gradio
 sdk_version: 5.12.0
 ---
+# kokoro-tts
+Gradio Demo of kokoro tts
+Download files from https://github.com/thewh1teagle/kokoro-onnx/tree/main
+You need kokoro-v0_19.onnx and voices.json
+# How to run
+```
+pip install -r requirements.txt
+python gradio-audio.py
+```

__pycache__/gradio.cpython-310.pyc ADDED Viewed

Binary file (2.04 kB). View file

audio.wav ADDED Viewed

Binary file (262 kB). View file

gr-demo.py ADDED Viewed

	@@ -0,0 +1,12 @@

+import gradio as gr
+def greet(name, intensity):
+    """Return a greeting for ``name`` ending in ``int(intensity)`` exclamation marks."""
+    exclamations = "!" * int(intensity)
+    return "".join(("Hello, ", name, exclamations))
+# Wrap greet in a Gradio interface: a "text" and a "slider" input feed the
+# function's two parameters, and its return value is shown as "text".
+demo = gr.Interface(
+    fn=greet,
+    inputs=["text", "slider"],
+    outputs=["text"],
+)
+# Start serving the interface.
+demo.launch()

gradio-audio.py ADDED Viewed

	@@ -0,0 +1,61 @@

+import gradio as gr
+from kokoro_onnx import Kokoro
+import soundfile as sf
+import tempfile
+import os
+class TextToSpeechApp:
+    """Gradio front end that turns text into speech with a Kokoro ONNX model."""
+
+    def __init__(self):
+        """Load the Kokoro model and define the selectable voices."""
+        # Model and voice files are resolved relative to the working directory.
+        self.kokoro = Kokoro("kokoro-v0_19.onnx", "voices.json")
+        # Voice identifiers offered in the UI dropdown.
+        self.voices = [
+            'af', 'af_bella', 'af_nicole', 'af_sarah', 'af_sky',
+            'am_adam', 'am_michael', 'bf_emma', 'bf_isabella',
+            'bm_george', 'bm_lewis'
+        ]
+
+    def generate_speech(self, text, voice, speed):
+        """Synthesize ``text`` and return the path of the written WAV file.
+
+        Args:
+            text: Text to convert to speech.
+            voice: Voice identifier passed through to Kokoro.
+            speed: Speech speed; converted with ``float()`` before use.
+
+        Returns:
+            Path to ``output.wav`` inside a newly created temporary directory.
+
+        Raises:
+            gr.Error: If ``text`` is empty/whitespace, or if synthesis or
+                writing the file fails.
+        """
+        if not text or not text.strip():
+            raise gr.Error("Please enter some text to convert.")
+        try:
+            # Generate audio
+            samples, sample_rate = self.kokoro.create(
+                text,
+                voice=voice,
+                speed=float(speed),
+            )
+            # Write the samples to a fresh temporary directory
+            temp_dir = tempfile.mkdtemp()
+            temp_path = os.path.join(temp_dir, "output.wav")
+            sf.write(temp_path, samples, sample_rate)
+        except Exception as e:
+            # The output component is gr.Audio, so a returned error string
+            # would be taken for an audio file path. Raise gr.Error so the
+            # real message is shown to the user instead.
+            raise gr.Error(f"Error: {str(e)}") from e
+        return temp_path
+
+    def create_interface(self):
+        """Build and return the Gradio interface wired to ``generate_speech``."""
+        return gr.Interface(
+            fn=self.generate_speech,
+            inputs=[
+                gr.Textbox(label="Enter text to convert", lines=5),
+                gr.Dropdown(choices=self.voices, label="Select Voice", value=self.voices[0]),
+                gr.Slider(minimum=0.5, maximum=2.0, value=1.0, step=0.1, label="Speech Speed")
+            ],
+            outputs=gr.Audio(label="Generated Speech"),
+            title="Text to Speech Converter",
+            description="Convert text to speech using different voices and speeds."
+        )
+def main():
+    """Create the text-to-speech app and serve its interface."""
+    # Launch with a public URL
+    TextToSpeechApp().create_interface().launch(server_name="0.0.0.0", share=True)
+
+
+if __name__ == "__main__":
+    main()

kokoro-v0_19.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebef42457f7efee9b60b4f1d5aec7692f2925923948a0d7a2a49d2c9edf57e49
+size 345554732

requirements.txt ADDED Viewed

	@@ -0,0 +1,119 @@

+aiofiles==23.2.1
+altair==5.5.0
+annotated-types==0.7.0
+anyio==4.8.0
+attrs==24.3.0
+audioread==3.0.1
+babel==2.16.0
+bibtexparser==2.0.0b8
+certifi==2024.12.14
+cffi==1.17.1
+charset-normalizer==3.4.1
+click==8.1.8
+clldutils==3.24.0
+colorama==0.4.6
+coloredlogs==15.0.1
+colorlog==6.9.0
+contourpy==1.3.1
+csvw==3.5.1
+cycler==0.12.1
+decorator==5.1.1
+dlinfo==1.2.1
+espeakng-loader==0.2.1
+exceptiongroup==1.2.2
+fastapi==0.115.6
+ffmpy==0.5.0
+filelock==3.16.1
+flatbuffers==24.12.23
+fonttools==4.55.3
+fsspec==2024.12.0
+gradio==5.12.0
+gradio_client==1.5.4
+h11==0.14.0
+httpcore==1.0.7
+httpx==0.28.1
+huggingface-hub==0.27.1
+humanfriendly==10.0
+idna==3.10
+importlib_resources==6.5.2
+isodate==0.7.2
+Jinja2==3.1.5
+joblib==1.4.2
+jsonschema==4.23.0
+jsonschema-specifications==2024.10.1
+kiwisolver==1.4.8
+kokoro-onnx==0.2.5
+language-tags==1.2.0
+lazy_loader==0.4
+librosa==0.10.2.post1
+llvmlite==0.43.0
+lxml==5.3.0
+Markdown==3.7
+markdown-it-py==3.0.0
+MarkupSafe==2.1.5
+matplotlib==3.10.0
+mdurl==0.1.2
+mpmath==1.3.0
+msgpack==1.1.0
+munch==4.0.0
+narwhals==1.21.1
+networkx==3.4.2
+numba==0.60.0
+numpy==1.26.4
+onnxruntime==1.20.1
+orjson==3.10.14
+packaging==24.2
+pandas==2.2.3
+phonemizer==3.3.0
+phonemizer-fork==3.3.1
+pillow==10.4.0
+platformdirs==4.3.6
+pooch==1.8.2
+protobuf==5.29.3
+pycparser==2.22
+pydantic==2.10.5
+pydantic_core==2.27.2
+pydub==0.25.1
+Pygments==2.19.1
+pylatexenc==2.10
+pyparsing==3.2.1
+python-dateutil==2.9.0.post0
+python-multipart==0.0.20
+pytz==2024.2
+PyYAML==6.0.2
+rdflib==7.1.2
+referencing==0.35.1
+regex==2024.11.6
+requests==2.32.3
+rfc3986==1.5.0
+rich==13.9.4
+rpds-py==0.22.3
+ruff==0.9.1
+safehttpx==0.1.6
+safetensors==0.5.2
+scikit-learn==1.6.1
+scipy==1.15.1
+segments==2.2.1
+semantic-version==2.10.0
+shellingham==1.5.4
+six==1.17.0
+sniffio==1.3.1
+sounddevice==0.5.1
+soundfile==0.13.0
+soxr==0.5.0.post1
+starlette==0.41.3
+sympy==1.13.1
+tabulate==0.9.0
+threadpoolctl==3.5.0
+tokenizers==0.21.0
+tomlkit==0.12.0
+torch==2.5.1
+tqdm==4.67.1
+transformers==4.48.0
+typer==0.15.1
+typing_extensions==4.12.2
+tzdata==2024.2
+uritemplate==4.1.1
+urllib3==2.3.0
+uvicorn==0.34.0
+websockets==11.0.3

voices.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc24670e8333cb30990726c5d99e991afc14645139d1a9d2d1858d4fba08df05
+size 54060439