Spaces:
Running
Running
import os | |
import torch | |
import argparse | |
import gradio as gr | |
import smtplib | |
from email.mime.text import MIMEText | |
from email.mime.multipart import MIMEMultipart | |
from email.mime.application import MIMEApplication | |
from openvoice import se_extractor | |
from openvoice.api import BaseSpeakerTTS, ToneColorConverter | |
from dotenv import load_dotenv | |
from openai import OpenAI | |
from elevenlabs.client import ElevenLabs | |
from elevenlabs import play, save | |
from flask import Flask | |
from flask_limiter import Limiter | |
from flask_limiter.util import get_remote_address | |
# Load environment variables | |
load_dotenv() | |
# Initialize Flask app | |
app = Flask(__name__) | |
# Setup Limiter for rate limiting and quota management based on IP address | |
limiter = Limiter(get_remote_address, app=app, default_limits=["5 per minute"]) | |
# Argument parsing | |
parser = argparse.ArgumentParser() | |
parser.add_argument("--share", action='store_true', default=False, help="make link public") | |
args = parser.parse_args() | |
# Initialize ElevenLabs client | |
client = ElevenLabs(api_key=os.environ.get("ELEVENLABS_API_KEY")) | |
device = 'cuda' if torch.cuda.is_available() else 'cpu' | |
output_dir = 'outputs' | |
os.makedirs(output_dir, exist_ok=True) | |
api_key = os.environ.get("ELEVENLABS_API_KEY") | |
supported_languages = ['zh', 'en'] | |
# Gmail configuration | |
GMAIL_USER = os.environ.get('GMAIL_USER') | |
GMAIL_PASSWORD = os.environ.get('GMAIL_PASSWORD') # This should be an app password, not your regular password | |
# Function to send email with downloadable file using Gmail SMTP | |
def send_email_with_file(recipient_email, file_path, subject, body): | |
try: | |
msg = MIMEMultipart() | |
msg['From'] = GMAIL_USER | |
msg['To'] = recipient_email | |
msg['Subject'] = subject | |
msg.attach(MIMEText(body, 'plain')) | |
with open(file_path, "rb") as file: | |
part = MIMEApplication(file.read(), Name=os.path.basename(file_path)) | |
part['Content-Disposition'] = f'attachment; filename="{os.path.basename(file_path)}"' | |
msg.attach(part) | |
server = smtplib.SMTP_SSL('smtp.gmail.com', 465) | |
server.ehlo() | |
server.login(GMAIL_USER, GMAIL_PASSWORD) | |
server.send_message(msg) | |
server.close() | |
return True | |
except Exception as e: | |
print(f"An error occurred while sending email: {e}") | |
return False | |
# Predict function with rate limiting based on IP address | |
def predict(prompt, style, audio_file_pth, voice_name, customer_email): | |
text_hint = 'Your file will only be saved for 24 hours.\n' | |
if len(prompt) < 2: | |
text_hint += "[ERROR] Please provide a longer prompt text.\n" | |
return text_hint, None, None | |
if len(prompt) > 200: | |
text_hint += "[ERROR] Text length limited to 200 characters. Please try shorter text.\n" | |
return text_hint, None, None | |
print(audio_file_pth) | |
voice = client.clone( | |
name=voice_name, | |
description="A trial voice model for testing", | |
files=[audio_file_pth], | |
) | |
# Generate audio from text | |
audio = client.generate(text=prompt, voice=voice) | |
save_path = f'{output_dir}/output.wav' | |
save(audio, save_path) | |
# Send email with downloadable file | |
subject = "Your Voice Clone File" | |
body = "Thank you for using our Voice Clone service. Your file is attached." | |
if send_email_with_file(customer_email, save_path, subject, body): | |
text_hint += "Email sent successfully with the voice file.\n" | |
else: | |
text_hint += "Failed to send email with the voice file. Please try again later.\n" | |
return text_hint, save_path, audio_file_pth | |
# Gradio interface setup | |
with gr.Blocks(gr.themes.Glass()) as demo: | |
with gr.Row(): | |
with gr.Column(): | |
input_text_gr = gr.Textbox( | |
label="Create This", | |
info="One or two sentences at a time is better. Up to 200 text characters.", | |
value="He hoped there would be stew for dinner, turnips and carrots and bruised potatoes and fat mutton pieces to be ladled out in thick, peppered, flour-fattened sauce.", | |
) | |
style_gr = gr.Dropdown( | |
label="Style", | |
choices=['default', 'whispering', 'cheerful', 'terrified', 'angry', 'sad', 'friendly'], | |
info="Please upload a reference audio file that is at least 1 minute long. For best results, ensure the audio is clear. You can use Adobe Podcast Enhance(https://podcast.adobe.com/enhance) to improve the audio quality before uploading.", | |
max_choices=1, | |
value="default", | |
) | |
ref_gr = gr.Audio( | |
label="Original Audio", | |
type="filepath", | |
sources=["upload"], # Allow only upload | |
) | |
voice_name_gr = gr.Textbox( | |
label="Your name and Product you bought", | |
value="Sam" | |
) | |
customer_email_gr = gr.Textbox( | |
label="Your Email", | |
info="We'll send you a downloadable file to this email address." | |
) | |
tts_button = gr.Button("Start", elem_id="send-btn", visible=True) | |
with gr.Column(): | |
out_text_gr = gr.Text(label="Info") | |
audio_gr = gr.Audio(label="Replicated Sound", autoplay=True) | |
ref_audio_gr = gr.Audio(label="Original Audio Used ") | |
tts_button.click(predict, [input_text_gr, style_gr, ref_gr, voice_name_gr, customer_email_gr], outputs=[out_text_gr, audio_gr, ref_audio_gr]) | |
demo.queue() | |
demo.launch(debug=True, show_api=False, share=args.share) | |
# Hide Gradio footer and record button | |
css = """ | |
footer {visibility: hidden} | |
audio .btn-container {display: none} | |
""" | |
demo.add_css(css) |