# openvoice2 / openvoice_app.py
# CuddleBuddys's picture
# Update openvoice_app.py
# 002c88f verified
# raw
# history blame
# 8.17 kB
import argparse
import base64
import html
import os
import re
import time
import uuid

import gradio as gr
import torch
from dotenv import load_dotenv
from elevenlabs import play, save
from elevenlabs.client import ElevenLabs
from mailersend import emails
# Load environment variables before any of the os.environ lookups below.
load_dotenv()

# Command-line options; --share is forwarded to demo.launch(share=...).
parser = argparse.ArgumentParser()
parser.add_argument(
    "--share",
    action='store_true',
    default=False,
    help="make link public",
)
args = parser.parse_args()

# ElevenLabs client used by predict() for cloning and speech generation.
client = ElevenLabs(api_key=os.getenv("ELEVENLABS_API_KEY"))

if torch.cuda.is_available():
    device = 'cuda'
else:
    device = 'cpu'
supported_languages = ['zh', 'en']

# Directory that receives the generated audio files.
output_dir = 'outputs'
os.makedirs(output_dir, exist_ok=True)

# MailerSend settings.  The sender address is derived from the configured
# domain; if MAILERSEND_DOMAIN is unset it becomes "noreply@None".
MAILERSEND_API_KEY = os.environ.get("MAILERSEND_API_KEY")
MAILERSEND_DOMAIN = os.environ.get("MAILERSEND_DOMAIN")
MAILERSEND_SENDER_NAME = "Voice Clone App"
MAILERSEND_SENDER_EMAIL = f"noreply@{MAILERSEND_DOMAIN}"
# Words and phrases that are not allowed in a prompt.  Each entry is matched
# case-insensitively as a whole word/phrase (optionally followed by a common
# inflection suffix), never as a fragment inside a longer, unrelated word.
# 'punch'/'harm' and 'defraud'/'harass' used to be fused into single entries
# by missing commas, so they never matched on their own.
BLOCKED_WORDS = [
    'Kill', 'hurt', 'shoot', 'gun', 'rifle', 'AR', 'semi automatic', 'knife',
    'blade', 'sword', 'punch', 'harm', 'disrupt', 'blackmail', 'steal',
    'bitch', 'cunt', 'fuck', 'freaking', 'nigger', 'nigga', 'niggas',
    'cracker', 'jew', 'oriental', 'fag', 'faggot', 'account', 'money',
    'transfer', 'urgent', 'help', 'scared', 'policy', 'frightened',
    'accident', 'fear', 'scam', 'address', 'social security number',
    'assault', 'injure', 'maim', 'destroy', 'damage', 'threaten',
    'intimidate', 'bully', 'menace', 'extort', 'exploit', 'defame', 'rob',
    'embezzle', 'defraud', 'harass', 'jerk', 'idiot', 'stupid', 'moron',
    'asshole', 'con', 'trick', 'swindle', 'payment', 'credit card',
    'bank account', 'immediate', 'afraid', 'phone number', 'email',
    'password',
]  # Add more words as needed


def _compile_blocked_pattern(words):
    """Build one case-insensitive regex that matches any entry of *words*.

    Whitespace inside a phrase matches any run of whitespace, and a match may
    be followed by "s", "es", "ed" or "ing" so that simple inflections
    ("guns", "threatening") are still caught.  Returns None when *words*
    contains no usable entry.
    """
    alternatives = []
    for entry in words:
        parts = entry.split()
        if parts:
            alternatives.append(r"\s+".join(re.escape(part) for part in parts))
    if not alternatives:
        return None
    return re.compile(
        r"(?<!\w)(?:" + "|".join(alternatives) + r")(?:s|es|ed|ing)?(?!\w)",
        re.IGNORECASE,
    )


# Compiled once at import time; rebuild it if BLOCKED_WORDS is changed at runtime.
_BLOCKED_PATTERN = _compile_blocked_pattern(BLOCKED_WORDS)


def contains_blocked_words(text):
    """Return True if *text* contains any blocked word or phrase.

    Matching is on word boundaries, so "carrots" or "second" are not rejected
    just because they contain the letters of "AR" or "con".  Empty or missing
    text contains nothing and yields False.
    """
    if not text or _BLOCKED_PATTERN is None:
        return False
    return _BLOCKED_PATTERN.search(text) is not None
def _parse_mailersend_response(response):
    """Split a MailerSend ``send`` result into ``(status_code, detail)``.

    NOTE(review): the 0.5.x SDK appears to return a single
    "<status>\\n<body>" string rather than a (status, body) sequence -
    confirm against the installed version.  Both shapes are accepted here;
    ``status_code`` is None when it cannot be determined.
    """
    if isinstance(response, str):
        status_text, _, detail = response.partition("\n")
        status_text = status_text.strip()
        return (int(status_text) if status_text.isdigit() else None), detail
    try:
        status, detail = response[0], response[1]
    except (TypeError, IndexError, KeyError):
        return None, response
    try:
        return int(status), detail
    except (TypeError, ValueError):
        return None, detail


def send_email_with_file(recipient_email, file_path, subject, body):
    """Email *file_path* as an attachment to *recipient_email* via MailerSend.

    Args:
        recipient_email: Address the message is sent to.
        file_path: Path of the file to attach; it is sent base64-encoded.
        subject: Subject line of the message.
        body: Plain-text body; also used (HTML-escaped) as the HTML body.

    Returns:
        True if MailerSend accepted the message (HTTP 202), False otherwise.
        Failures are printed and never raised, so callers can treat the
        email as best-effort.
    """
    if not recipient_email or not file_path:
        print("An error occurred while sending email: missing recipient or attachment path")
        return False

    # Read the attachment first so a missing/unreadable file fails before any
    # request is built.
    try:
        with open(file_path, "rb") as attachment_file:
            attachment_content = base64.b64encode(attachment_file.read()).decode('utf-8')
    except OSError as e:
        print(f"An error occurred while sending email: {e}")
        return False

    try:
        mailer = emails.NewEmail(MAILERSEND_API_KEY)
        mail_body = {}
        mail_from = {
            "name": MAILERSEND_SENDER_NAME,
            "email": MAILERSEND_SENDER_EMAIL,
        }
        recipients = [
            {
                "name": "Recipient",
                "email": recipient_email,
            }
        ]
        attachments = [
            {
                "filename": os.path.basename(file_path),
                "content": attachment_content,
                "disposition": "attachment",
            }
        ]
        mailer.set_mail_from(mail_from, mail_body)
        mailer.set_mail_to(recipients, mail_body)
        mailer.set_subject(subject, mail_body)
        # Escape the body so characters such as "<" or "&" cannot break the markup.
        mailer.set_html_content(f"<p>{html.escape(body)}</p>", mail_body)
        mailer.set_plaintext_content(body, mail_body)
        mailer.set_attachments(attachments, mail_body)
        response = mailer.send(mail_body)
    except Exception as e:
        # Boundary with a third-party SDK/network call: report and carry on.
        print(f"An error occurred while sending email: {e}")
        return False

    status_code, detail = _parse_mailersend_response(response)
    if status_code == 202:
        print("Email sent successfully")
        return True
    print(f"Failed to send email. Status code: {status_code}")
    print(f"Response: {detail}")
    return False
def check_consent(agreement):
    """Toggle the two views according to the consent checkbox.

    Returns a pair of Gradio updates, in the order the change handler lists
    its outputs (main application row, consent row): the application is shown
    and the consent text hidden when *agreement* is truthy, and the reverse
    otherwise.
    """
    agreed = bool(agreement)
    main_app_update = gr.update(visible=agreed)
    consent_update = gr.update(visible=not agreed)
    return main_app_update, consent_update
def _purge_old_outputs(max_age_seconds=24 * 60 * 60):
    """Best-effort removal of generated clips older than *max_age_seconds*.

    Only files named ``output_*.wav`` inside ``output_dir`` are considered,
    which are the files predict() writes.
    """
    cutoff = time.time() - max_age_seconds
    try:
        entries = os.listdir(output_dir)
    except OSError:
        return
    for entry in entries:
        if not (entry.startswith("output_") and entry.endswith(".wav")):
            continue
        path = os.path.join(output_dir, entry)
        try:
            if os.path.getmtime(path) < cutoff:
                os.remove(path)
        except OSError:
            # The file may have been removed by a concurrent request.
            continue


def predict(agreement, prompt, style, audio_file_pth, voice_name, customer_email):
    """Clone the uploaded voice, speak *prompt* with it and email the result.

    Args:
        agreement: Whether the user ticked the consent checkbox.
        prompt: Text to synthesise (2 to 200 characters, no blocked words).
        style: Selected style; accepted for interface compatibility but not
            used by the generation call.
        audio_file_pth: Path of the uploaded reference recording.
        voice_name: Name entered by the user; part of the cloned voice's name.
        customer_email: Address the generated file is sent to.

    Returns:
        A tuple ``(status_text, generated_audio_path, reference_audio_path)``.
        Both paths are None whenever the request is rejected or generation
        fails; ``status_text`` then explains why.
    """
    if not agreement:
        return "You must agree to the terms before using this application.", None, None

    text_hint = 'Your file will only be saved for 24 hours.\n'

    prompt = prompt or ""
    if len(prompt) < 2:
        text_hint += "[ERROR] Please provide a longer prompt text.\n"
        return text_hint, None, None
    if len(prompt) > 200:
        text_hint += "[ERROR] Text length limited to 200 characters. Please try shorter text.\n"
        return text_hint, None, None
    if contains_blocked_words(prompt):
        text_hint += "[ERROR] Your text contains blocked words. Please remove them and try again.\n"
        return text_hint, None, None
    if not audio_file_pth:
        text_hint += "[ERROR] Please upload a reference audio file.\n"
        return text_hint, None, None
    customer_email = (customer_email or "").strip()
    if "@" not in customer_email:
        text_hint += "[ERROR] Please provide a valid email address.\n"
        return text_hint, None, None

    full_voice_name = f"{voice_name} - {customer_email}"
    print(audio_file_pth)

    # Every request gets its own file: with the queue enabled several
    # requests can be in flight, and a shared "output.wav" would let one
    # user's audio be overwritten by (or emailed to) another user.
    _purge_old_outputs()
    # NOTE(review): the ".wav" extension is kept from the original file name;
    # confirm it matches the audio format ElevenLabs actually returns.
    save_path = os.path.join(output_dir, f"output_{uuid.uuid4().hex}.wav")

    try:
        voice = client.clone(
            name=full_voice_name,
            description="A trial voice model for testing",
            files=[audio_file_pth],
        )
        audio = client.generate(text=prompt, voice=voice)
        save(audio, save_path)
    except Exception as e:
        # Boundary with the ElevenLabs API: report in the UI instead of
        # surfacing an opaque Gradio error.
        print(f"An error occurred while generating audio: {e}")
        text_hint += "[ERROR] Voice generation failed. Please try again later.\n"
        return text_hint, None, None

    subject = "Your Voice Clone File"
    body = "Thank you for using our Voice Clone service. Your file is attached."
    if send_email_with_file(customer_email, save_path, subject, body):
        text_hint += "Email sent successfully with the voice file.\n"
    else:
        text_hint += "Failed to send email with the voice file. Please try again later.\n"
    return text_hint, save_path, audio_file_pth
# Custom CSS: hides the page footer and the audio players' button container.
# It is handed to gr.Blocks at construction time.  Previously it was defined
# and attached only after demo.launch(debug=True), which blocks the main
# thread, so it was never applied.
# NOTE(review): `Blocks.add_css` does not appear to be part of the documented
# Gradio API - confirm before reintroducing it.
css = """
footer {visibility: hidden}
audio .btn-container {display: none}
"""

# Text of the consent screen shown before the application is unlocked.
CONSENT_MARKDOWN = """
# Consent Agreement
By using this application, you agree to the following terms:
1. This app will only be used for CuddleBuddy products.
2. CuddleBuddy and any of its partners are not responsible for any misuse of this application.
3. You understand that the voice cloning technology should be used responsibly and ethically.
Do you agree to these terms?
"""

# Gradio interface setup
with gr.Blocks(theme=gr.themes.Glass(), css=css) as demo:
    # Consent view: visible first, hidden once the checkbox is ticked.
    with gr.Row(visible=True) as consent_row:
        consent_text = gr.Markdown(CONSENT_MARKDOWN)
        consent_checkbox = gr.Checkbox(label="I agree to the terms")

    # Main application view: hidden until consent is given.
    with gr.Row(visible=False) as main_app:
        # Left column: inputs.
        with gr.Column():
            input_text_gr = gr.Textbox(
                label="Create This",
                info="One or two sentences at a time is better. Up to 200 text characters.",
                value="He hoped there would be stew for dinner, turnips and carrots and bruised potatoes and fat mutton pieces to be ladled out in thick, peppered, flour-fattened sauce.",
            )
            style_gr = gr.Dropdown(
                label="Style",
                choices=['default', 'whispering', 'cheerful', 'terrified', 'angry', 'sad', 'friendly'],
                info="Please upload a reference audio file that is at least 1 minute long. For best results, ensure the audio is clear. You can use Adobe Podcast Enhance(https://podcast.adobe.com/enhance) to improve the audio quality before uploading.",
                max_choices=1,
                value="default",
            )
            ref_gr = gr.Audio(
                label="Original Audio",
                type="filepath",
                sources=["upload"],
            )
            voice_name_gr = gr.Textbox(
                label="Your name and Product you bought",
                value="Sam",
            )
            customer_email_gr = gr.Textbox(
                label="Your Email",
                info="We'll send you a downloadable file to this email address.",
            )
            tts_button = gr.Button("Start", elem_id="send-btn", visible=True)

        # Right column: status text and audio players.
        with gr.Column():
            out_text_gr = gr.Text(label="Info")
            audio_gr = gr.Audio(label="Replicated Sound", autoplay=True)
            ref_audio_gr = gr.Audio(label="Original Audio Used ")

    # Ticking/unticking the checkbox swaps the consent view and the main view.
    consent_checkbox.change(
        check_consent,
        inputs=[consent_checkbox],
        outputs=[main_app, consent_row],
    )

    # The checkbox state is passed to predict() as well, so consent is
    # re-checked on every request.
    tts_button.click(
        predict,
        inputs=[consent_checkbox, input_text_gr, style_gr, ref_gr, voice_name_gr, customer_email_gr],
        outputs=[out_text_gr, audio_gr, ref_audio_gr],
    )

demo.queue()
demo.launch(debug=True, show_api=False, share=args.share)