elevenlabs / app.py
Nymbo's picture
Update app.py
157260f verified
raw
history blame
2.85 kB
import random
import gradio as gr
import numpy as np
import time
from elevenlabs import voices, generate, set_api_key, UnauthenticatedRateLimitError
def pad_buffer(audio, dtype=np.int16):
    """Pad a byte buffer with NUL bytes to a whole number of ``dtype`` elements.

    ``np.frombuffer`` rejects buffers whose length is not a multiple of the
    element size, so the tail is zero-filled up to the next boundary.

    Args:
        audio: Bytes-like buffer to pad.
        dtype: NumPy dtype whose item size defines the alignment. Defaults to
            ``np.int16`` (2 bytes).

    Returns:
        ``audio`` unchanged when it is already aligned, otherwise ``audio``
        with the missing number of ``b'\\0'`` bytes appended.
    """
    element_size = np.dtype(dtype).itemsize
    # -len % size is the distance to the next multiple (0 when aligned).
    missing = -len(audio) % element_size
    if missing:
        audio = audio + b'\0' * missing
    return audio
def generate_voice(text, voice_name, api_key):
    """Synthesize ``text`` with the selected ElevenLabs voice.

    Args:
        text: Text to speak; only the first 4000 characters are sent.
        voice_name: Name of the voice passed to ``generate``.
        api_key: ElevenLabs API key; may be empty.

    Returns:
        A ``(sample_rate, samples)`` tuple with ``sample_rate`` fixed at 44100
        and ``samples`` an ``int16`` NumPy array built from the returned bytes.

    Raises:
        gr.Error: If the text is empty, the unauthenticated rate limit is hit,
            or any other error occurs while generating audio.
    """
    # Reject empty input up front so the user gets a clear message.
    if not text or not text.strip():
        raise gr.Error("Please enter some text to generate speech.")

    # NOTE(review): set_api_key appears to set the key process-wide, so
    # concurrent requests may share it - confirm against the library.
    # Strip stray whitespace that often comes along with a pasted key.
    set_api_key((api_key or "").strip())

    try:
        audio = generate(
            text[:4000],  # Limit to 4000 characters
            voice=voice_name,
            model="eleven_multilingual_v2",
        )
        # NOTE(review): assumes the returned bytes are 16-bit PCM at 44.1 kHz -
        # confirm the output format produced by generate().
        return (44100, np.frombuffer(pad_buffer(audio), dtype=np.int16))
    except UnauthenticatedRateLimitError as e:
        raise gr.Error("Thanks for trying out ElevenLabs TTS! You've reached the free tier limit. Please provide an API key to continue.") from e
    except Exception as e:
        # gr.Error expects a message string, not the exception object itself.
        raise gr.Error(str(e)) from e
# description = """
# Eleven Multilingual V2 is the world's best Text-to-Speech model. Features 38 voices and supports 28 languages. Sign up on [ElevenLabs](https://elevenlabs.io/?from=partnerpierce7156) to get an API Key.
# """
# Build the UI: API key + voice selection, text input, and audio output.
with gr.Blocks(theme='Nymbo/Alyx_Theme') as block:
    #gr.Markdown('[ ![ElevenLabs](https://user-images.githubusercontent.com/12028621/262629275-4f85c9cf-85b6-435e-ab50-5b8c7c4e9dd2.png) ](https://elevenlabs.io)')
    #gr.Markdown("# <center> ElevenLabs </center>")
    #gr.Markdown(description)

    # NOTE(review): the original indentation was lost in this copy; the row is
    # assumed to hold the API key field and the voice selector - confirm.
    with gr.Row(variant='panel'):
        input_api_key = gr.Textbox(
            type='password',
            label='ElevenLabs API Key',
            placeholder='Enter your API key',
            elem_id="input_api_key"
        )

        # The voice list is fetched once, while the UI is being built.
        all_voices = voices()
        voice_names = [voice.name for voice in all_voices]
        # Prefer "Rachel", but fall back to the first available voice so the
        # dropdown never starts with a value that is not among its choices.
        if "Rachel" in voice_names:
            default_voice = "Rachel"
        else:
            default_voice = voice_names[0] if voice_names else None

        input_voice = gr.Dropdown(
            voice_names,
            value=default_voice,
            label="Voice",
            elem_id="input_voice"
        )

    input_text = gr.Textbox(
        label="Input Text (4000 characters max)",
        lines=1,
        value="Hello! 你好! Hola! नमस्ते! Bonjour! こんにちは! مرحبا! 안녕하세요! Ciao! Cześć! Привіт! Γειά σας! Здравей! வணக்கம்!",
        elem_id="input_text"
    )

    # The button label is set through `value`; `text`/`type` are not Button
    # parameters, so the intended label was never applied.
    run_button = gr.Button(
        value="Generate Voice",
        variant="primary"
    )

    out_audio = gr.Audio(
        label="Speech Output",
        type="numpy",
        elem_id="out_audio",
        format="mp3"
    )

    inputs = [input_text, input_voice, input_api_key]
    outputs = [out_audio]

    # Wire the button to the synthesis function.
    run_button.click(
        fn=generate_voice,
        inputs=inputs,
        outputs=outputs,
        queue=True
    )

block.queue(concurrency_count=5).launch(debug=True)