Spaces:

Vishwas1
/

KittenTTSDemo

Runtime error

App Files Files Community

Vishwas1 committed on Aug 6

Commit

a0a99a6

verified ·

1 Parent(s): e327671

Upload 6 files

Browse files

Files changed (3) hide show

README.md +2 -2
app_minimal.py +61 -0
requirements.txt +1 -1

README.md CHANGED Viewed

@@ -4,8 +4,8 @@ emoji: 🎤
 colorFrom: blue
 colorTo: purple
 sdk: gradio
-sdk_version: 4.44.1
-app_file: app_simple.py
 pinned: false
 license: mit
 ---

 colorFrom: blue
 colorTo: purple
 sdk: gradio
+sdk_version: 4.35.2
+app_file: app_minimal.py
 pinned: false
 license: mit
 ---

app_minimal.py ADDED Viewed

	@@ -0,0 +1,61 @@

+import gradio as gr
+import numpy as np
+from kittentts import KittenTTS
+# Initialize the model
+model = KittenTTS("KittenML/kitten-tts-nano-0.1")
+# Available voices
+AVAILABLE_VOICES = [
+    'expr-voice-2-m', 'expr-voice-2-f', 'expr-voice-3-m', 'expr-voice-3-f',
+    'expr-voice-4-m', 'expr-voice-4-f', 'expr-voice-5-m', 'expr-voice-5-f'
+]
+def generate_speech(text, voice):
+    """Generate speech from text using KittenTTS"""
+    if not text.strip():
+        return None, "Please enter some text to generate speech."
+    try:
+        # Generate audio
+        audio = model.generate(text, voice=voice)
+        # Convert to the format expected by Gradio
+        if len(audio.shape) > 1:
+            audio = audio.mean(axis=1)  # Convert stereo to mono if needed
+        # Normalize audio
+        audio = audio / np.max(np.abs(audio)) if np.max(np.abs(audio)) > 0 else audio
+        return audio, f"✅ Successfully generated speech with voice: {voice}"
+    except Exception as e:
+        return None, f"❌ Error generating speech: {str(e)}"
+# Create the interface using Interface instead of Blocks
+demo = gr.Interface(
+    fn=generate_speech,
+    inputs=[
+        gr.Textbox(label="Enter your text", placeholder="Type your text here...", lines=3),
+        gr.Dropdown(choices=AVAILABLE_VOICES, value=AVAILABLE_VOICES[1], label="Select Voice")
+    ],
+    outputs=[
+        gr.Audio(label="Generated Audio"),
+        gr.Textbox(label="Status", interactive=False)
+    ],
+    title="🎤 KittenTTS - High Quality Text-to-Speech",
+    description="Generate natural-sounding speech from text using the KittenTTS model",
+    examples=[
+        ["Hello! This is a demonstration of the KittenTTS model.", "expr-voice-2-f"],
+        ["The quick brown fox jumps over the lazy dog.", "expr-voice-2-m"],
+        ["Welcome to our high-quality text-to-speech system.", "expr-voice-3-f"],
+    ]
+)
+# Launch the demo
+if __name__ == "__main__":
+    demo.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=True
+    )

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
-gradio==4.44.1
 https://github.com/KittenML/KittenTTS/releases/download/0.1/kittentts-0.1.0-py3-none-any.whl
 soundfile
 numpy

+gradio==4.35.2
 https://github.com/KittenML/KittenTTS/releases/download/0.1/kittentts-0.1.0-py3-none-any.whl
 soundfile
 numpy