import random 
import gradio as gr 
import numpy as np 
import time
from elevenlabs import voices, generate, set_api_key, UnauthenticatedRateLimitError

def pad_buffer(audio):
    """Return ``audio`` zero-padded so its length is a multiple of the int16 size.

    ``np.frombuffer(..., dtype=np.int16)`` needs a byte count divisible by
    the int16 item size; any shortfall is filled with trailing NUL bytes.
    Input that is already aligned is returned unchanged.
    """
    sample_width = np.dtype(np.int16).itemsize
    leftover = len(audio) % sample_width
    if leftover == 0:
        return audio
    return audio + b'\0' * (sample_width - leftover)

def generate_voice(text, voice_name, api_key):
    """Synthesize ``text`` with ElevenLabs and return it in ``gr.Audio`` numpy form.

    Args:
        text: Text to speak; only the first 4000 characters are sent.
        voice_name: Voice passed to ``generate`` as ``voice``.
        api_key: ElevenLabs API key, handed to ``set_api_key`` before the call.

    Returns:
        A ``(44100, samples)`` tuple where ``samples`` is an int16 array built
        from the (zero-padded) bytes returned by ``generate``.

    Raises:
        gr.Error: When the unauthenticated rate limit is hit, or when any
            other exception occurs during generation (its message is shown
            to the user).
    """
    # NOTE(review): set_api_key presumably stores the key process-wide, so
    # concurrent requests with different keys could interfere -- confirm.
    set_api_key(api_key)
    try:
        audio = generate(
            text[:4000],  # Limit to 4000 characters
            voice=voice_name,
            model="eleven_multilingual_v2"
        )
        # NOTE(review): assumes the returned bytes are raw 16-bit samples at
        # 44.1 kHz -- confirm against the output format generate() produces.
        return (44100, np.frombuffer(pad_buffer(audio), dtype=np.int16))
    except UnauthenticatedRateLimitError as e:
        raise gr.Error("Thanks for trying out ElevenLabs TTS! You've reached the free tier limit. Please provide an API key to continue.") from e
    except Exception as e:
        # gr.Error expects a message string, not an exception object; fall
        # back to repr() so exceptions with an empty message stay readable.
        raise gr.Error(str(e) or repr(e)) from e
    
    # description = """
    # Eleven Multilingual V2 is the world's best Text-to-Speech model. Features 38 voices and supports 28 languages. Sign up on [ElevenLabs](https://elevenlabs.io/?from=partnerpierce7156) to get an API Key.
    # """

# Build the UI: API key and voice selection share one row, followed by the
# text input, the trigger button, and the audio player for the result.
with gr.Blocks(theme='Nymbo/Alyx_Theme') as block:
    #gr.Markdown('[ ![ElevenLabs](https://user-images.githubusercontent.com/12028621/262629275-4f85c9cf-85b6-435e-ab50-5b8c7c4e9dd2.png) ](https://elevenlabs.io)')
    #gr.Markdown("# <center> ElevenLabs </center>")
    #gr.Markdown(description)

    with gr.Row(variant='panel'):
        input_api_key = gr.Textbox(
            type='password',
            label='ElevenLabs API Key',
            placeholder='Enter your API key',
            elem_id="input_api_key"
        )

        # The voice list is fetched once, while the UI is being constructed.
        all_voices = voices()
        voice_names = [voice.name for voice in all_voices]
        # Prefer "Rachel" as the default, but do not preselect a voice that
        # is missing from the fetched list.
        if "Rachel" in voice_names:
            default_voice = "Rachel"
        else:
            default_voice = voice_names[0] if voice_names else None
        input_voice = gr.Dropdown(
            voice_names,
            value=default_voice,
            label="Voice",
            elem_id="input_voice"
        )

    input_text = gr.Textbox(
        label="Input Text (4000 characters max)",
        lines=1,
        value="Hello! 你好! Hola! नमस्ते! Bonjour! こんにちは! مرحبا! 안녕하세요! Ciao! Cześć! Привіт! Γειά σας! Здравей! வணக்கம்!",
        elem_id="input_text"
    )

    # The button caption is given through `value`; `text=` and `type=` are
    # not Button parameters, so the caption never reached the button.
    run_button = gr.Button(
        value="Generate Voice",
        variant="primary"
    )

    out_audio = gr.Audio(
        label="Speech Output",
        type="numpy",
        elem_id="out_audio",
        format="mp3"
    )

    # Order must match generate_voice(text, voice_name, api_key).
    inputs = [input_text, input_voice, input_api_key]
    outputs = [out_audio]

    run_button.click(
        fn=generate_voice,
        inputs=inputs,
        outputs=outputs,
        queue=True
    )

block.queue(concurrency_count=5).launch(debug=True)