Spaces:

Risdom
/

english2

Sleeping

App Files Files Community

english2 / voice_create.py

yosuke-i

Update voice_create.py

ccc5133 verified 4 months ago

raw

history blame contribute delete

8.28 kB

	import pandas as pd
	import zipfile
	import base64
	import os
	import requests
	import re
	from pydub import AudioSegment
	import json

	def remove_quotes(text):
	# ダブルクォートを空文字に置き換え
	return text.replace('"', '')

	def text_to_speech(input_file, selected_option):
	# APIキーを直接コードに埋め込む（実際の運用では推奨されません）
	api_key = 'AIzaSyBqvy0wRyZVapYyZ_GfTlRpQwrwj9YqYaw' # ここを実際のAPIキーに置き換えてください
	data = pd.read_csv(input_file)
	zip_path = 'output_audio_files.zip'
	error_log = [] # エラーログを格納するリスト

	with zipfile.ZipFile(zip_path, 'w') as z:
	for idx, row in data.iterrows():
	try:
	# script列が文字列か確認し、文字列でない場合は空文字に置き換える
	script = row.get('script', '')
	print("原稿", script)
	if pd.isna(script):
	error_log.append(f"行 {idx+1}: スクリプトが空です")
	continue
	if not isinstance(script, str):
	script = str(script)

	# テキストをA:やB:で分割
	parts = re.split(r'(A:\|B:)', script)
	ssml_parts = []

	# 交互に発言するAとBの内容を順に処理
	for i in range(1, len(parts), 2):
	if parts[i] == "A:":
	voice_name = row["voiceA"]
	elif parts[i] == "B:":
	voice_name = row["voiceB"]
	else:
	continue # A:またはB:で始まらない行は無視

	text = parts[i + 1].strip()
	text = remove_quotes(text)

	# 1sに変換する前に除外するコード
	text = text.replace("a.m.", 'AM')
	text = text.replace("p.m.", 'PM')
	text = text.replace("U.S.", 'US')
	text = text.replace("U.K.", 'UK')
	text = text.replace("Mr.", 'Mister')
	text = text.replace("Ms.", 'MIZ')
	text = text.replace("Mrs.", 'Misiz')
	text = text.replace("Dr.", 'Doctor')
	text = text.replace("Mt.", 'Mount')
	text = text.replace("Prof.", 'Professor')

	# テキスト内の改行を1sの間に変換
	text = text.replace("\n", '<break time="1s"/>')
	text = text.replace(".", '.<break time="500ms"/>')

	if selected_option == "ブレイクタイム有":
	# 「,」で時間を空ける
	if row["eikenn"] in ["5級", "4級", "3級", "準2級", "2級", "準1級"]:
	text = text.replace(",", '<break time="50ms"/>')

	ssml_parts.append(f'<voice name="{voice_name}"><prosody rate="{row["speed"]}"><p>{text}</p></prosody></voice>')

	ssml = '<speak>' + ''.join(ssml_parts)

	if pd.notna(row.get('question')) and row['question'] != '':
	ssml += f'<break time="1s"/><voice name="{row["voiceQuestion"]}"><prosody rate="{row["speed"]}"><p>Question</p><break time="1s"/><p>{row["question"]}</p></prosody></voice>'
	if pd.notna(row.get('choices')) and row['choices'] != '':
	choices_list = row['choices'].split('/')
	choices_ssml = '<break time="1s"/>'.join(choices_list)
	ssml += f'<break time="1s"/><voice name="{row["voiceB"]}"><prosody rate="{row["speed"]}"><p>{choices_ssml}</p></prosody></voice>'
	ssml += '</speak>'

	# APIリクエスト用のボディ
	body = {
	"input": {"ssml": ssml},
	"voice": {"languageCode": "en-US"}, # 基本的な言語設定（必要に応じて行ごとに変更可能）
	"audioConfig": {"audioEncoding": "MP3"}
	}
	headers = {
	"X-Goog-Api-Key": api_key,
	"Content-Type": "application/json"
	}
	url = "https://texttospeech.googleapis.com/v1/text:synthesize"

	# APIリクエスト送信とレスポンスの確認
	try:
	response = requests.post(url, headers=headers, json=body)

	# ステータスコードの確認
	if response.status_code != 200:
	error_message = f"行 {idx+1}: APIエラー - HTTP {response.status_code}"
	try:
	error_data = response.json()
	if 'error' in error_data and 'message' in error_data['error']:
	error_message += f" - {error_data['error']['message']}"
	except:
	error_message += f" - レスポンス: {response.text}"

	print(error_message)
	error_log.append(error_message)
	continue

	response_data = response.json()

	# 音声コンテンツが存在するか確認
	if 'audioContent' not in response_data:
	error_message = f"行 {idx+1}: 音声データがレスポンスに含まれていません"
	print(error_message)
	error_log.append(error_message)
	continue

	# 音声コンテンツの取得とファイル保存
	audio_content = base64.b64decode(response_data['audioContent'])
	temp_file_name = f"{row['id']}_temp.mp3"
	final_file_name = f"{row['id']}.mp3"

	# 一時ファイルに保存
	with open(temp_file_name, "wb") as out:
	out.write(audio_content)

	# pydubを使用して128kbpsで再保存
	audio = AudioSegment.from_file(temp_file_name, format="mp3")
	audio.export(final_file_name, format="mp3", bitrate="128k")

	# ZIPファイルに追加
	z.write(final_file_name)

	# 一時ファイルを削除
	os.remove(temp_file_name)
	os.remove(final_file_name)

	print(f"行 {idx+1}: 処理成功 - ファイルID: {row['id']}")

	except requests.exceptions.RequestException as e:
	error_message = f"行 {idx+1}: API接続エラー - {str(e)}"
	print(error_message)
	error_log.append(error_message)

	except Exception as e:
	error_message = f"行 {idx+1}: 予期せぬエラー - {str(e)}"
	print(error_message)
	error_log.append(error_message)

	# エラーログのサマリーを出力
	if error_log:
	print("\n===== エラーログ =====")
	for error in error_log:
	print(error)
	print(f"合計 {len(error_log)} 件のエラーが発生しました。")

	# エラーログをファイルに保存
	with open('tts_error_log.txt', 'w', encoding='utf-8') as log_file:
	log_file.write("===== Google Text-to-Speech API エラーログ =====\n")
	log_file.write(f"処理日時: {pd.Timestamp.now()}\n\n")
	for error in error_log:
	log_file.write(f"{error}\n")
	print("エラーログは 'tts_error_log.txt' に保存されました。")
	else:
	print("すべての行が正常に処理されました。")

	return zip_path