openvoice2

Running

App Files Files Community

openvoice2 / openvoice_app.py

poemsforaphrodite

Update openvoice_app.py

b4fcf8b verified 4 months ago

raw

history blame

5.77 kB

	import os
	import torch
	import argparse
	import gradio as gr
	import smtplib
	from email.mime.text import MIMEText
	from email.mime.multipart import MIMEMultipart
	from email.mime.application import MIMEApplication
	from openvoice import se_extractor
	from openvoice.api import BaseSpeakerTTS, ToneColorConverter
	from dotenv import load_dotenv
	from openai import OpenAI
	from elevenlabs.client import ElevenLabs
	from elevenlabs import play, save
	from flask import Flask
	from flask_limiter import Limiter
	from flask_limiter.util import get_remote_address

	# Load environment variables
	load_dotenv()

	# Initialize Flask app
	app = Flask(__name__)

	# Setup Limiter for rate limiting and quota management based on IP address
	limiter = Limiter(get_remote_address, app=app, default_limits=["5 per minute"])

	# Argument parsing
	parser = argparse.ArgumentParser()
	parser.add_argument("--share", action='store_true', default=False, help="make link public")
	args = parser.parse_args()

	# Initialize ElevenLabs client
	client = ElevenLabs(api_key=os.environ.get("ELEVENLABS_API_KEY"))
	device = 'cuda' if torch.cuda.is_available() else 'cpu'
	output_dir = 'outputs'
	os.makedirs(output_dir, exist_ok=True)

	api_key = os.environ.get("ELEVENLABS_API_KEY")
	supported_languages = ['zh', 'en']

	# Gmail configuration
	GMAIL_USER = os.environ.get('GMAIL_USER')
	GMAIL_PASSWORD = os.environ.get('GMAIL_PASSWORD') # This should be an app password, not your regular password

	# Function to send email with downloadable file using Gmail SMTP
	def send_email_with_file(recipient_email, file_path, subject, body):
	try:
	msg = MIMEMultipart()
	msg['From'] = GMAIL_USER
	msg['To'] = recipient_email
	msg['Subject'] = subject

	msg.attach(MIMEText(body, 'plain'))

	with open(file_path, "rb") as file:
	part = MIMEApplication(file.read(), Name=os.path.basename(file_path))
	part['Content-Disposition'] = f'attachment; filename="{os.path.basename(file_path)}"'
	msg.attach(part)

	server = smtplib.SMTP_SSL('smtp.gmail.com', 465)
	server.ehlo()
	server.login(GMAIL_USER, GMAIL_PASSWORD)
	server.send_message(msg)
	server.close()

	return True
	except Exception as e:
	print(f"An error occurred while sending email: {e}")
	return False

	# Predict function with rate limiting based on IP address
	@limiter.limit("100 per minute")
	def predict(prompt, style, audio_file_pth, voice_name, customer_email):
	text_hint = 'Your file will only be saved for 24 hours.\n'
	if len(prompt) < 2:
	text_hint += "[ERROR] Please provide a longer prompt text.\n"
	return text_hint, None, None
	if len(prompt) > 200:
	text_hint += "[ERROR] Text length limited to 200 characters. Please try shorter text.\n"
	return text_hint, None, None

	print(audio_file_pth)
	voice = client.clone(
	name=voice_name,
	description="A trial voice model for testing",
	files=[audio_file_pth],
	)
	# Generate audio from text
	audio = client.generate(text=prompt, voice=voice)
	save_path = f'{output_dir}/output.wav'
	save(audio, save_path)

	# Send email with downloadable file
	subject = "Your Voice Clone File"
	body = "Thank you for using our Voice Clone service. Your file is attached."
	if send_email_with_file(customer_email, save_path, subject, body):
	text_hint += "Email sent successfully with the voice file.\n"
	else:
	text_hint += "Failed to send email with the voice file. Please try again later.\n"

	return text_hint, save_path, audio_file_pth

	# Gradio interface setup
	with gr.Blocks(gr.themes.Glass()) as demo:
	with gr.Row():
	with gr.Column():
	input_text_gr = gr.Textbox(
	label="Create This",
	info="One or two sentences at a time is better. Up to 200 text characters.",
	value="He hoped there would be stew for dinner, turnips and carrots and bruised potatoes and fat mutton pieces to be ladled out in thick, peppered, flour-fattened sauce.",
	)
	style_gr = gr.Dropdown(
	label="Style",
	choices=['default', 'whispering', 'cheerful', 'terrified', 'angry', 'sad', 'friendly'],
	info="Please upload a reference audio file that is at least 1 minute long. For best results, ensure the audio is clear. You can use Adobe Podcast Enhance(https://podcast.adobe.com/enhance) to improve the audio quality before uploading.",
	max_choices=1,
	value="default",
	)
	ref_gr = gr.Audio(
	label="Original Audio",
	type="filepath",
	sources=["upload"], # Allow only upload
	)
	voice_name_gr = gr.Textbox(
	label="Your name and Product you bought",
	value="Sam"
	)
	customer_email_gr = gr.Textbox(
	label="Your Email",
	info="We'll send you a downloadable file to this email address."
	)
	tts_button = gr.Button("Start", elem_id="send-btn", visible=True)

	with gr.Column():
	out_text_gr = gr.Text(label="Info")
	audio_gr = gr.Audio(label="Replicated Sound", autoplay=True)
	ref_audio_gr = gr.Audio(label="Original Audio Used ")

	tts_button.click(predict, [input_text_gr, style_gr, ref_gr, voice_name_gr, customer_email_gr], outputs=[out_text_gr, audio_gr, ref_audio_gr])

	demo.queue()
	demo.launch(debug=True, show_api=False, share=args.share)

	# Hide Gradio footer and record button
	css = """
	footer {visibility: hidden}
	audio .btn-container {display: none}
	"""

	demo.add_css(css)