Spaces:

Mahiruoshi
/

Lovelive-Nijigasaku-Chat-iSTFT-GPT3

Running

App Files Files Community

Mahiruoshi committed on Apr 12, 2023

Commit

9c49b65

•

1 Parent(s): 37eb9e1

Upload 90 files

Browse files

Files changed (46) hide show

app.py +282 -160
checkpoints/Nijigaku/config.json +70 -0
checkpoints/Nijigaku/model.pth +3 -0
checkpoints/info.json +72 -0
image//343/201/202/343/202/213/343/202/213.png +0 -0
image//343/201/204/343/201/241/343/201/210.png +0 -0
image//343/201/213/343/201/231/343/201/277.png +0 -0
image//343/201/227/343/201/232/343/201/217.png +0 -0
image//343/201/233/343/201/244/350/217/234.png +0 -0
image//343/201/252/343/201/252.png +0 -0
image//343/201/262/343/201/213/343/202/212.png +0 -0
image//343/201/276/343/201/262/343/202/213.png +0 -0
image//343/202/204/343/201/241/343/202/210.png +0 -0
image//343/202/206/343/202/206/345/255/220.png +0 -0
image//343/202/250/343/203/236.png +0 -0
image//343/202/257/343/203/255/343/203/207/343/202/243/343/203/274/343/203/214.png +0 -0
image//343/203/237/343/202/242.png +0 -0
image//343/203/237/343/203/201/343/203/253.png +0 -0
image//343/203/241/343/202/244/343/203/225/343/202/241/343/203/263.png +0 -0
image//343/203/251/343/203/251/343/203/225/343/202/243/343/203/263.png +0 -0
image//343/203/251/343/203/263/343/202/270/343/203/245.png +0 -0
image//345/217/214/350/221/211.png +0 -0
image//345/241/201.png +0 -0
image//345/275/274/346/226/271.png +0 -0
image//346/204/233.png +0 -0
image//346/231/266.png +0 -0
image//346/236/234/346/236/227.png +0 -0
image//346/240/236/345/255/220.png +0 -0
image//346/255/251/345/244/242.png +0 -0
image//347/217/240/347/267/222.png +0 -0
image//347/222/203/345/245/210.png +0 -0
image//347/234/237/347/237/242.png +0 -0
image//347/264/224/351/202/243.png +0 -0
image//347/276/216/347/251/272.png +0 -0
image//350/217/257/346/201/213.png +0 -0
image//351/235/231/347/276/275.png +0 -0
image//351/246/231/345/255/220.png +0 -0
image//351/253/230/345/222/262/344/276/221.png +0 -0
monotonic_align/__pycache__/__init__.cpython-39.pyc +0 -0
monotonic_align/__pycache__/core.cpython-39.pyc +0 -0
subtitles.srt +4 -0
text/__pycache__/__init__.cpython-39.pyc +0 -0
text/__pycache__/cleaners.cpython-39.pyc +0 -0
text/__pycache__/japanese.cpython-39.pyc +0 -0
text/__pycache__/mandarin.cpython-39.pyc +0 -0
text/__pycache__/symbols.cpython-39.pyc +0 -0

app.py CHANGED Viewed

@@ -1,178 +1,300 @@
-import time
-import matplotlib.pyplot as plt
-import IPython.display as ipd
-import re
-import os
 import json
-import math
 import torch
-from torch import nn
-from torch.nn import functional as F
-from torch.utils.data import DataLoader
-import gradio as gr
 import commons
 import utils
-from data_utils import TextAudioLoader, TextAudioCollate, TextAudioSpeakerLoader, TextAudioSpeakerCollate
 from models import SynthesizerTrn
 from text.symbols import symbols
 from text import text_to_sequence
-import unicodedata
-from scipy.io.wavfile import write
 import openai
-def get_text(text, hps):
-    text_norm = text_to_sequence(text, hps.data.text_cleaners)
-    if hps.data.add_blank:
-        text_norm = commons.intersperse(text_norm, 0)
-    text_norm = torch.LongTensor(text_norm)
-    return text_norm
-def get_label(text, label):
-    if f'[{label}]' in text:
-        return True, text.replace(f'[{label}]', '')
-    else:
-        return False, text
-def selection(speaker):
-    if speaker == "高咲侑（误）":
-        spk = 0
-        return spk
-    elif speaker == "歩夢":
-        spk = 1
-        return spk
-    elif speaker == "かすみ":
-        spk = 2
-        return spk
-    elif speaker == "しずく":
-        spk = 3
-        return spk
-    elif speaker == "果林":
-        spk = 4
-        return spk
-    elif speaker == "愛":
-        spk = 5
-        return spk
-    elif speaker == "彼方":
-        spk = 6
-        return spk
-    elif speaker == "せつ菜":
-        spk = 7
-        return spk
-    elif speaker == "エマ":
-        spk = 8
-        return spk
-    elif speaker == "璃奈":
-        spk = 9
-        return spk
-    elif speaker == "栞子":
-        spk = 10
-        return spk
-    elif speaker == "ランジュ":
-        spk = 11
-        return spk
-    elif speaker == "ミア":
-        spk = 12
-        return spk
-    elif speaker == "三色绘恋1":
-        spk = 13
-        return spk
-    elif speaker == "三色绘恋2":
-        spk = 15
-        return spk
-    elif speaker == "派蒙":
-        spk = 16
-        return spk
-def friend_chat(text,key,call_name,tts_input3):
-  call_name = call_name
-  openai.api_key = key
-  identity = tts_input3
-  start_sequence = '\n'+str(call_name)+':'
-  restart_sequence = "\nYou: "
-  if 1 == 1:
-     prompt0 = text #当期prompt
-  if text == 'quit':
-     return prompt0
-  prompt = identity + prompt0 + start_sequence
-  response = openai.Completion.create(
-    model="text-davinci-003",
-    prompt=prompt,
-    temperature=0.5,
-    max_tokens=1000,
-    top_p=1.0,
-    frequency_penalty=0.5,
-    presence_penalty=0.0,
-    stop=["\nYou:"]
-  )
-  return response['choices'][0]['text'].strip()
-def is_japanese(string):
-        for ch in string:
-            if ord(ch) > 0x3040 and ord(ch) < 0x30FF:
-                return True
-        return False
-def sle(language,text,tts_input2,call_name,tts_input3):
-    if language == "中文":
-        tts_input1 = "[ZH]" + text.replace('\n','。').replace(' ',',') + "[ZH]"
-        return tts_input1
-    if language == "对话":
-        text = friend_chat(text,tts_input2,call_name,tts_input3).replace('\n','。').replace(' ',',')
-        text = f"[JA]{text}[JA]" if is_japanese(text) else f"[ZH]{text}[ZH]"
-        return text
-    elif language == "日文":
-        tts_input1 = "[JA]" + text.replace('\n','。').replace(' ',',') + "[JA]"
-        return tts_input1
-def infer(text,tts_input2,tts_input3,language, speaker_id,n_scale= 0.667,n_scale_w = 0.8, l_scale = 1):
-    speaker_name = speaker_id
-    speaker_id = int(selection(speaker_id))
-    text = sle(language,text,tts_input2,speaker_name,tts_input3)
-    response = text.replace("[ZH]","").replace("[JA]","")
-    stn_tst = get_text(text, hps_ms)
-    with torch.no_grad():
-        x_tst = stn_tst.unsqueeze(0).to(dev)
-        x_tst_lengths = torch.LongTensor([stn_tst.size(0)]).to(dev)
-        sid = torch.LongTensor([speaker_id]).to(dev)
-        t1 = time.time()
-        audio = net_g_ms.infer(x_tst, x_tst_lengths, sid=sid, noise_scale=n_scale, noise_scale_w=n_scale_w, length_scale=l_scale)[0][0,0].data.cpu().float().numpy()
-        t2 = time.time()
-        spending_time = "推理时间："+str(t2-t1)+"s"
-        print(spending_time)
-    return response,(hps_ms.data.sampling_rate, audio)
-lan = ["中文","日文","对话"]
-idols = ["高咲侑（误）","歩夢","かすみ","しずく","果林","愛","彼方","せつ菜","璃奈","栞子","エマ","ランジュ","ミア","派蒙"]
-dev = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
-hps_ms = utils.get_hparams_from_file("config.json")
-net_g_ms = SynthesizerTrn(
-    len(symbols),
-    hps_ms.data.filter_length // 2 + 1,
-    hps_ms.train.segment_size // hps_ms.data.hop_length,
-    n_speakers=hps_ms.data.n_speakers,
-    **hps_ms.model).to(dev)
-_ = net_g_ms.eval()
-_ = utils.load_checkpoint("G_1415000.pth", net_g_ms, None)
-inputs = [gr.TextArea(label="输入你的文本，支持vits版在另一个仓库", value="一次審査、二次審査、それぞれの欄に記入をお願いします。"),
-           gr.TextArea(label="如需使用openai，输入你的openai-key,合成方式选择对话", value="官网"),
-           gr.TextArea(label="写上你给她的设定", value=""),
-           gr.Dropdown(label="选择合成方式",choices=lan, value="日文", interactive=True),
-           gr.Dropdown(label="选择说话人",choices=idols, value="かすみ", interactive=True),
-           gr.Slider(minimum= 0.01,maximum=1.0,label="更改噪声比例", value=0.127),
-           gr.Slider(minimum= 0.01,maximum=1.0,label="更改噪声偏差", value=0.8),
-           gr.Slider(minimum= 0.1,maximum=10,label="更改时间比例", value=1)]
-outputs=[ gr.Textbox(label="回复"),gr.Audio(type="numpy", label="Output audio")]
-iface = gr.Interface(
-    fn=infer,
-    inputs=inputs,
-    outputs=outputs,
-    title="轻量化vits",
-    description="虹团12人模型",
-)
-iface.launch()

+import logging
+logging.getLogger('numba').setLevel(logging.WARNING)
+logging.getLogger('matplotlib').setLevel(logging.WARNING)
+logging.getLogger('urllib3').setLevel(logging.WARNING)
 import json
+import re
+import numpy as np
+import IPython.display as ipd
 import torch
 import commons
 import utils
 from models import SynthesizerTrn
 from text.symbols import symbols
 from text import text_to_sequence
+import gradio as gr
+import time
+import datetime
+import os
+import pickle
 import openai
+from scipy.io.wavfile import write
+def is_japanese(string):
+    """Report whether ``string`` contains at least one kana character.
+
+    A character qualifies when its code point lies strictly between
+    0x3040 and 0x30FF. An empty string yields ``False``.
+    """
+    return any(0x3040 < ord(symbol) < 0x30FF for symbol in string)
+def is_english(string):
+    """Return ``True`` when ``string`` is non-empty and every character is an
+    ASCII letter, a digit, a space, or one of ``.,:;!?()_*"'``."""
+    import re
+    allowed = re.compile('^[A-Za-z0-9.,:;!?()_*"\' ]+$')
+    return allowed.fullmatch(string) is not None
+def to_html(chat_history):
+    """Render a chat transcript as an HTML fragment of speech bubbles.
+
+    Args:
+        chat_history: iterable of dicts with a ``'role'`` and a ``'content'``
+            key. Entries whose role is ``'user'`` are drawn right-aligned on a
+            green bubble; every other role is drawn left-aligned on white.
+
+    Returns:
+        A string holding one scrollable ``<div>`` that wraps all bubbles.
+    """
+    import html
+    chat_html = ""
+    for item in chat_history:
+        if item['role'] == 'user':
+            side, bubble_color = 'right', '#4CAF50'
+        else:
+            side, bubble_color = 'left', 'white'
+        # The content is typed by the user or produced by the model, so it is
+        # escaped to stop it from being interpreted as markup.
+        content = html.escape(str(item['content']))
+        chat_html += f"""
+                <div style="margin-bottom: 20px;">
+                    <div style="text-align: {side}; margin-{side}: 20px;">
+                        <span style="background-color: {bubble_color}; color: black; padding: 10px; border-radius: 10px; display: inline-block; max-width: 80%; word-wrap: break-word;">
+                            {content}
+                        </span>
+                    </div>
+                </div>
+            """
+    output_html = f"""
+        <div style="height: 400px; overflow-y: scroll; padding: 10px;">
+            {chat_html}
+        </div>
+    """
+    return output_html
+def extrac(text, max_len=20):
+    """Split raw text into short sentences for one-by-one synthesis.
+
+    Anything between ``<`` and ``>`` is removed first. The text is then split
+    on newlines; lines that ``is_english`` accepts are converted to katakana
+    when the optional ``romajitable`` package is available, and all spaces
+    are removed. Lines of one character or less are dropped. Lines longer
+    than ``max_len`` are split again on ``。`` / ``！`` and every kept piece
+    gets a trailing ``。``.
+
+    Args:
+        text: the raw input text.
+        max_len: longest line that is kept as a single sentence.
+
+    Returns:
+        The list of sentences, in reading order.
+    """
+    text = re.sub("<[^>]*>", "", text)
+    final_list = []
+    for line in text.split('\n'):
+        if is_english(line):
+            # romajitable is not imported at module level in this file, so it
+            # is loaded lazily; without it the English line is kept as typed
+            # instead of failing with a NameError.
+            try:
+                import romajitable
+            except ImportError:
+                pass
+            else:
+                line = romajitable.to_kana(line).katakana
+        line = line.replace('\n', '').replace(' ', '')
+        if len(line) <= 1:
+            continue
+        if len(line) > max_len:
+            final_list.extend(
+                piece + '。' for piece in re.split(r'。|！', line) if len(piece) > 1
+            )
+        else:
+            final_list.append(line)
+    print(final_list)
+    return final_list
+def to_numpy(tensor: torch.Tensor):
+    """Return the contents of ``tensor`` as a NumPy array.
+
+    The tensor is detached from the autograd graph and moved to host memory
+    before conversion. The move is done unconditionally: ``Tensor.numpy()``
+    only works on CPU tensors, regardless of ``requires_grad``.
+    """
+    return tensor.detach().cpu().numpy()
+def chatgpt(text):
+    """Send ``text`` to gpt-3.5-turbo together with the saved conversation.
+
+    The conversation is kept in ``log.pickle`` in the working directory. A
+    missing or unreadable log starts a fresh conversation. After the reply is
+    appended, the updated history is written back so the next call sees it.
+
+    Args:
+        text: the new user message.
+
+    Returns:
+        ``(reply, messages)``: the assistant's reply text and the full list
+        of ``{"role", "content"}`` dicts including the new exchange.
+
+    Raises:
+        Whatever ``openai.ChatCompletion.create`` raises; the request is not
+        retried.
+    """
+    # NOTE(review): pickle.load runs arbitrary code from a tampered file.
+    # log.pickle must only ever be written by this app; JSON would be safer.
+    try:
+        with open('log.pickle', 'rb') as f:
+            messages = pickle.load(f)
+    except (OSError, EOFError, pickle.UnpicklingError):
+        messages = []
+    messages.append({"role": "user", "content": text})
+    chat = openai.ChatCompletion.create(model="gpt-3.5-turbo", messages=messages)
+    reply = chat.choices[0].message.content
+    messages.append({"role": "assistant", "content": reply})
+    print(messages[-1])
+    if len(messages) >= 12:
+        # Keep the first six entries and drop the two that follow them, so
+        # the history stops growing once it reaches twelve entries.
+        del messages[6:8]
+    with open('log.pickle', 'wb') as f:
+        pickle.dump(messages, f)
+    return reply, messages
+def get_symbols_from_json(path):
+    """Load the ``"symbols"`` entry from the JSON file at ``path``.
+
+    The file is read as UTF-8 so that non-ASCII symbols load the same way on
+    every platform, whatever the locale's default encoding is.
+
+    Raises:
+        AssertionError: if ``path`` is not an existing file.
+        KeyError: if the JSON object has no ``"symbols"`` key.
+    """
+    assert os.path.isfile(path), f"symbol file not found: {path}"
+    with open(path, 'r', encoding='utf-8') as f:
+        data = json.load(f)
+    return data['symbols']
+def sle(language,text):
+    """Strip whitespace from ``text`` and wrap it in the language tag that
+    matches ``language``.
+
+    Newlines, carriage returns and spaces are removed. "中文", "日文" and
+    "英文" wrap the text in ``[ZH]``, ``[JA]`` and ``[EN]``; "自动" picks
+    ``[JA]`` when ``is_japanese`` accepts the text and ``[ZH]`` otherwise;
+    "手动" returns the stripped text untagged. Any other value gives ``None``.
+    """
+    stripped = text.translate(str.maketrans('', '', '\n\r '))
+    if language == "手动":
+        return stripped
+    if language == "自动":
+        tag = "JA" if is_japanese(stripped) else "ZH"
+        return f"[{tag}]{stripped}[{tag}]"
+    for label, tag in (("中文", "ZH"), ("日文", "JA"), ("英文", "EN")):
+        if language == label:
+            return "[" + tag + "]" + stripped + "[" + tag + "]"
+    return None
+def get_text(text,hps_ms):
+    """Turn tagged text into a ``torch.LongTensor`` of symbol ids.
+
+    The text is passed through ``text_to_sequence`` with the cleaners listed
+    in ``hps_ms.data.text_cleaners``. When ``hps_ms.data.add_blank`` is set,
+    ``commons.intersperse`` is applied to the ids with the value 0.
+    """
+    sequence = text_to_sequence(text, hps_ms.data.text_cleaners)
+    if hps_ms.data.add_blank:
+        sequence = commons.intersperse(sequence, 0)
+    return torch.LongTensor(sequence)
+def _srt_timestamp(delta):
+    """Format a ``datetime.timedelta`` as an SRT ``HH:MM:SS,mmm`` timestamp."""
+    total_ms = int(round(delta.total_seconds() * 1000))
+    hours, rest = divmod(total_ms, 3600000)
+    minutes, rest = divmod(rest, 60000)
+    seconds, millis = divmod(rest, 1000)
+    return f"{hours:02d}:{minutes:02d}:{seconds:02d},{millis:03d}"
+def _synthesize(net_g, hps, speaker_id, tagged_text, n_scale, n_scale_w, l_scale):
+    """Run one inference pass on ``tagged_text`` and return the waveform as a NumPy float array."""
+    stn_tst = get_text(tagged_text, hps)
+    with torch.no_grad():
+        x_tst = stn_tst.unsqueeze(0).to(dev)
+        x_tst_lengths = torch.LongTensor([stn_tst.size(0)]).to(dev)
+        sid = torch.LongTensor([speaker_id]).to(dev)
+        return net_g.infer(x_tst, x_tst_lengths, sid=sid, noise_scale=n_scale, noise_scale_w=n_scale_w, length_scale=l_scale)[0][0,0].data.cpu().float().numpy()
+def _export_wav(audiopath, sampling_rate, audio, is_audio, repeat_time):
+    """Best-effort export: write ``audiopath + '.wav'`` and, when ``is_audio`` is set, make ``repeat_time`` 44.1 kHz copies with ffmpeg."""
+    import subprocess
+    source = audiopath + '.wav'
+    try:
+        write(source, sampling_rate, audio)
+        if is_audio:
+            for i in range(repeat_time):
+                target = audiopath.replace('temp', 'temp' + str(i))
+                # audiopath comes from a text box, so the command is passed as
+                # an argument list and never goes through a shell.
+                subprocess.run(['ffmpeg', '-y', '-i', source, '-ar', '44100', target], check=False)
+    except Exception as err:
+        # The export is optional; a bad path or missing ffmpeg must not stop
+        # the audio from being returned to the UI.
+        logging.warning("audio export to %r failed: %s", source, err)
+def create_tts_fn(net_g,hps,speaker_id):
+    """Build the Gradio callback that synthesizes speech for one speaker.
+
+    Args:
+        net_g: the loaded synthesizer; its ``infer`` method is called.
+        hps: hyper-parameters; ``hps.data.sampling_rate`` is used for the
+            returned audio, the exported wav and the subtitle timing.
+        speaker_id: speaker index, converted with ``int``.
+
+    Returns:
+        ``tts_fn``, which returns ``((sampling_rate, audio), srt_path, html)``.
+    """
+    speaker_id = int(speaker_id)
+    def tts_fn(is_gpt,api_key,is_audio,audiopath,repeat_time,text, language, extract, n_scale= 0.667,n_scale_w = 0.8, l_scale = 1 ):
+        """Synthesize ``text`` (or the ChatGPT reply to it) and return audio, subtitle path and chat HTML."""
+        # The dropdown delivers its value as a string (or nothing at all).
+        repeat_time = int(repeat_time or 0)
+        sampling_rate = hps.data.sampling_rate
+        file_path = "subtitles.srt"
+        if is_gpt:
+            openai.api_key = api_key
+            text,messages = chatgpt(text)
+            htm = to_html(messages)
+        else:
+            htm = ''
+        if not extract:
+            t1 = time.time()
+            audio = _synthesize(net_g, hps, speaker_id, sle(language,text), n_scale, n_scale_w, l_scale)
+            print("推理时间为："+str(time.time()-t1)+"s")
+            _export_wav(audiopath, sampling_rate, audio, is_audio, repeat_time)
+            return (sampling_rate, audio),file_path,htm
+        # Long-text mode: every kind of bracket is turned into <...> before
+        # the text is handed to extrac for sentence splitting.
+        for opener in ('【','[','(','（'):
+            text = text.replace(opener,'<')
+        for closer in ('】',']',')','）'):
+            text = text.replace(closer,'>')
+        final_list = extrac(text.replace('“','').replace('”',''))
+        audio_fin = []
+        t = datetime.timedelta(seconds=0)
+        # Opened once for the whole run so that every cue is kept and the
+        # handle is closed when the loop ends.
+        with open(file_path,'w',encoding='utf-8') as srt:
+            for sentence in final_list:
+                try:
+                    t1 = time.time()
+                    audio = _synthesize(net_g, hps, speaker_id, sle(language,sentence), n_scale, n_scale_w, l_scale)
+                    print("第"+str(len(audio_fin)+1)+"句的推理时间为："+str(time.time()-t1)+"s")
+                except Exception as err:
+                    # One sentence that cannot be synthesized is skipped.
+                    logging.warning("skipping sentence %r: %s", sentence, err)
+                    continue
+                time_start = _srt_timestamp(t)
+                t += datetime.timedelta(seconds=len(audio)/float(sampling_rate))
+                time_end = _srt_timestamp(t)
+                srt.write(str(len(audio_fin))+'\n'+time_start+' --> '+time_end+'\n'+sentence+'\n\n')
+                audio_fin.append(audio)
+        # np.concatenate rejects an empty list, so fall back to silence.
+        joined = np.concatenate(audio_fin) if audio_fin else np.zeros(0, dtype=np.float32)
+        _export_wav(audiopath, sampling_rate, joined, is_audio, repeat_time)
+        return (sampling_rate, joined),file_path,htm
+    return tts_fn
+# Script entry point: load the model, build one TTS callback per speaker
+# listed in checkpoints/info.json, then assemble and launch the Gradio UI.
+if __name__ == '__main__':
+    hps = utils.get_hparams_from_file('checkpoints/Nijigaku/config.json')
+    # `dev` is read as a module-level global by the callbacks made in create_tts_fn.
+    dev = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+    models = []
+    schools = ["Nijigasaki High School"]
+    # NOTE(review): sle() also accepts "英文", which is not offered here.
+    lan = ["中文","日文","自动","手动"]
+    with open("checkpoints/info.json", "r", encoding="utf-8") as f:
+        models_info = json.load(f)
+    net_g = SynthesizerTrn(
+            len(symbols),
+            hps.data.filter_length // 2 + 1,
+            hps.train.segment_size // hps.data.hop_length,
+            n_speakers=hps.data.n_speakers,
+            **hps.model).to(dev)
+    _ = net_g.eval()
+    _ = utils.load_checkpoint("checkpoints/Nijigaku/model.pth" , net_g)
+    # One `content` list per top-level entry of info.json, appended in file order.
+    for i in models_info:
+        school = models_info[i]
+        speakers = school["speakers"]
+        # NOTE(review): phone_dict is built but never read in this block.
+        phone_dict = {
+            symbol: i for i, symbol in enumerate(symbols)
+        }
+        content = []
+        for j in speakers:
+            sid = int(speakers[j]['sid'])
+            # NOTE(review): `title` is the whole school dict, not a string; it is not used in the UI below.
+            title = school
+            example = speakers[j]['speech']
+            name = speakers[j]["name"]
+            content.append((sid, name, title, example, create_tts_fn(net_g,hps,sid)))
+        models.append(content)
+    with gr.Blocks() as app:
+        with gr.Tabs():
+            # NOTE(review): models[] is indexed by position in `schools`, so this
+            # assumes `schools` lists the info.json entries in the same order.
+            for i in schools:
+                with gr.TabItem(i):
+                    for (sid, name,  title, example, tts_fn) in models[schools.index(i)]:
+                        with gr.TabItem(name):
+                            with gr.Column():
+                                with gr.Row():
+                                    with gr.Row():
+                                        # Portrait is looked up by speaker name under image/.
+                                        gr.Markdown(
+                                            '<div align="center">'
+                                            f'<img style="width:auto;height:400px;" src="file/image/{name}.png">'
+                                            '</div>'
+                                        )
+                                    output_UI = gr.outputs.HTML()
+                                with gr.Row():
+                                    with gr.Column(scale=0.85):
+                                        input1 = gr.TextArea(label="Text", value=example,lines = 1)
+                                    with gr.Column(scale=0.15, min_width=0):
+                                        btnVC = gr.Button("Send")
+                                output1 = gr.Audio(label="采样率22050")
+                                with gr.Accordion(label="Setting(TTS)", open=False):
+                                    input2 = gr.Dropdown(label="Language", choices=lan, value="自动", interactive=True)
+                                    input4 = gr.Slider(minimum=0, maximum=1.0, label="更改噪声比例(noise scale)，以控制情感", value=0.6)
+                                    input5 = gr.Slider(minimum=0, maximum=1.0, label="更改噪声偏差(noise scale w)，以控制音素长短", value=0.668)
+                                    input6 = gr.Slider(minimum=0.1, maximum=10, label="duration", value=1)
+                                with gr.Accordion(label="Advanced Setting(GPT3.5接口+长句子合成，建议克隆本仓库后运行main.py)", open=False):
+                                    input3 = gr.Checkbox(value=False, label="长句切割(小说合成)")
+                                    output2 = gr.outputs.File(label="字幕文件：subtitles.srt")
+                                    api_input1 = gr.Checkbox(value=False, label="接入chatgpt")
+                                    api_input2 = gr.TextArea(label="api-key",lines=1,value = '见 https://openai.com/blog/openai-api')
+                                    audio_input1 = gr.Checkbox(value=False, label="修改音频路径(live2d)")
+                                    audio_input2 = gr.TextArea(label="音频路径",lines=1,value = '#参考 D:/app_develop/live2d_whole/2010002/sounds/temp.wav')
+                                    # NOTE(review): the choices are ints but the default value is the string '0'.
+                                    audio_input3 = gr.Dropdown(label="重复生成次数", choices=list(range(101)), value='0', interactive=True)
+                        # The inputs are listed in the positional order of tts_fn's parameters.
+                        btnVC.click(tts_fn, inputs=[api_input1,api_input2,audio_input1,audio_input2,audio_input3,input1,input2,input3,input4,input5,input6], outputs=[output1,output2,output_UI])
+    app.launch()

checkpoints/Nijigaku/config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "train": {
+    "log_interval": 200,
+    "eval_interval": 5000,
+    "seed": 1234,
+    "epochs": 20000,
+    "learning_rate": 2e-4,
+    "betas": [ 0.8, 0.99 ],
+    "eps": 1e-9,
+    "batch_size": 12,
+    "fp16_run": false,
+    "lr_decay": 0.999875,
+    "segment_size": 8192,
+    "init_lr_ratio": 1,
+    "warmup_epochs": 0,
+    "c_mel": 45,
+    "c_kl": 1.0,
+    "fft_sizes": [ 384, 683, 171 ],
+    "hop_sizes": [ 30, 60, 10 ],
+    "win_lengths": [ 150, 300, 60 ],
+    "window": "hann_window"
+  },
+  "data": {
+    "training_files": "E:/filelist/train_with_paimeng.txt",
+    "validation_files": "E:/filelist/val_filelist.txt",
+    "text_cleaners": [ "cjke_cleaners" ],
+    "max_wav_value": 32768.0,
+    "sampling_rate": 22050,
+    "filter_length": 1024,
+    "hop_length": 256,
+    "win_length": 1024,
+    "n_mel_channels": 80,
+    "mel_fmin": 0.0,
+    "mel_fmax": null,
+    "add_blank": true,
+    "n_speakers": 18,
+    "cleaned_text": true
+  },
+  "model": {
+    "ms_istft_vits": true,
+    "mb_istft_vits": false,
+    "istft_vits": false,
+    "subbands": 4,
+    "gen_istft_n_fft": 16,
+    "gen_istft_hop_size": 4,
+    "inter_channels": 192,
+    "hidden_channels": 192,
+    "filter_channels": 768,
+    "n_heads": 2,
+    "n_layers": 6,
+    "kernel_size": 3,
+    "p_dropout": 0.1,
+    "resblock": "1",
+    "resblock_kernel_sizes": [ 3, 7, 11 ],
+    "resblock_dilation_sizes": [
+      [ 1, 3, 5 ],
+      [ 1, 3, 5 ],
+      [ 1, 3, 5 ]
+    ],
+    "upsample_rates": [ 4, 4 ],
+    "upsample_initial_channel": 512,
+    "upsample_kernel_sizes": [ 16, 16 ],
+    "n_layers_q": 3,
+    "use_spectral_norm": false,
+    "gin_channels": 256,
+    "use_sdp": false
+  }
+}

checkpoints/Nijigaku/model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62dae224dce4ae492158dc675b96d3aaa45335a69f4118870d645c3fb718df63
+size 455712599

checkpoints/info.json ADDED Viewed

	@@ -0,0 +1,72 @@

+{
+    "Nijigasaki High School":{
+        "speakers":{
+            "歩夢":{
+                "sid": 1,
+                "speech": "みなさん、はじめまして。上原歩夢です。",
+                "name": "歩夢"
+            },
+            "かすみ":{
+                "sid": 2,
+                "speech": "みんなのアイドルかすみんだよー。",
+                "name": "かすみ"
+            },
+            "しずく":{
+                "sid": 3,
+                "speech": "みなさん、こんにちは。しずくです。",
+                "name": "しずく"
+            },
+            "果林":{
+                "sid": 4,
+                "speech": "ハーイ。　朝香果林よ。よろしくね",
+                "name": "果林"
+            },
+            "愛":{
+                "sid": 5,
+                "speech": "ちっすー。アタシは愛。",
+                "name": "愛"
+            },
+            "彼方":{
+                "sid": 6,
+                "speech": "ちっすー。アタシは愛。",
+                "name": "彼方"
+            },
+            "せつ菜":{
+                "sid": 7,
+                "speech": "絶えぬ命は，常世に在らず。終わらぬ芝居も，夢幻のごとく。儚く燃えゆく，さだめであれば。舞台に刻まん，刹那の瞬き。",
+                "name": "せつ菜"
+            },
+            "エマ":{
+                "sid": 8,
+                "speech": "こんにちは、エマです。自然溢れるスイスからやってきましたっ。",
+                "name": "エマ"
+            },
+            "璃奈":{
+                "sid": 9,
+                "speech": "私、天王寺璃奈。とってもきゅーとな女の子。ホントだよ？",
+                "name": "璃奈"
+            },
+            "栞子":{
+                "sid": 10,
+                "speech": "みなさん、初めまして。三船栞子と申します。",
+                "name": "栞子"
+            },
+            "ランジュ":{
+                "sid": 11,
+                "speech": "你好啊，我是钟岚珠。",
+                "name": "ランジュ"
+            },
+            "ミア":{
+                "sid": 12,
+                "speech": "ボクはミア・テイラー。",
+                "name": "ミア"
+            },
+            "高咲侑":{
+                "sid": 0,
+                "speech": "只选一个做不到啊",
+                "name": "高咲侑"
+            }
+        },
+        "checkpoint":  "checkpoints/Nijigaku/model.pth"
+    }
+}

image//343/201/202/343/202/213/343/202/213.png ADDED Viewed

image//343/201/204/343/201/241/343/201/210.png ADDED Viewed

image//343/201/213/343/201/231/343/201/277.png ADDED Viewed

image//343/201/227/343/201/232/343/201/217.png ADDED Viewed

image//343/201/233/343/201/244/350/217/234.png ADDED Viewed

image//343/201/252/343/201/252.png ADDED Viewed

image//343/201/262/343/201/213/343/202/212.png ADDED Viewed

image//343/201/276/343/201/262/343/202/213.png ADDED Viewed

image//343/202/204/343/201/241/343/202/210.png ADDED Viewed

image//343/202/206/343/202/206/345/255/220.png ADDED Viewed

image//343/202/250/343/203/236.png ADDED Viewed

image//343/202/257/343/203/255/343/203/207/343/202/243/343/203/274/343/203/214.png ADDED Viewed

image//343/203/237/343/202/242.png ADDED Viewed

image//343/203/237/343/203/201/343/203/253.png ADDED Viewed

image//343/203/241/343/202/244/343/203/225/343/202/241/343/203/263.png ADDED Viewed

image//343/203/251/343/203/251/343/203/225/343/202/243/343/203/263.png ADDED Viewed

image//343/203/251/343/203/263/343/202/270/343/203/245.png ADDED Viewed

image//345/217/214/350/221/211.png ADDED Viewed

image//345/241/201.png ADDED Viewed

image//345/275/274/346/226/271.png ADDED Viewed

image//346/204/233.png ADDED Viewed

image//346/231/266.png ADDED Viewed

image//346/236/234/346/236/227.png ADDED Viewed

image//346/240/236/345/255/220.png ADDED Viewed

image//346/255/251/345/244/242.png ADDED Viewed

image//347/217/240/347/267/222.png ADDED Viewed

image//347/222/203/345/245/210.png ADDED Viewed

image//347/234/237/347/237/242.png ADDED Viewed

image//347/264/224/351/202/243.png ADDED Viewed

image//347/276/216/347/251/272.png ADDED Viewed

image//350/217/257/346/201/213.png ADDED Viewed

image//351/235/231/347/276/275.png ADDED Viewed

image//351/246/231/345/255/220.png ADDED Viewed

image//351/253/230/345/222/262/344/276/221.png ADDED Viewed

monotonic_align/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (842 Bytes). View file

monotonic_align/__pycache__/core.cpython-39.pyc ADDED Viewed

Binary file (993 Bytes). View file

subtitles.srt ADDED Viewed

	@@ -0,0 +1,4 @@

+0
+0:00:00,0 --> 0:00:02,333
+ちっすー。アタシは愛。

text/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (2.14 kB). View file

text/__pycache__/cleaners.cpython-39.pyc ADDED Viewed

Binary file (6.31 kB). View file

text/__pycache__/japanese.cpython-39.pyc ADDED Viewed

Binary file (4.44 kB). View file

text/__pycache__/mandarin.cpython-39.pyc ADDED Viewed

Binary file (6.41 kB). View file

text/__pycache__/symbols.cpython-39.pyc ADDED Viewed

Binary file (438 Bytes). View file