jiedi-so-vits-svc

Sleeping

App Files Files Community

aoxiang1221 committed on Oct 5, 2023

Commit

9912004

1 Parent(s): 85ce65e

update

Browse files

Files changed (47) hide show

__pycache__/compress_model.cpython-310.pyc +0 -0
__pycache__/models.cpython-310.pyc +0 -0
__pycache__/utils.cpython-310.pyc +0 -0
cluster/__pycache__/__init__.cpython-310.pyc +0 -0
configs/config.json +0 -0
dataset_raw/wav_structure.txt +20 -0
diffusion/__pycache__/__init__.cpython-310.pyc +0 -0
diffusion/__pycache__/diffusion.cpython-310.pyc +0 -0
diffusion/__pycache__/unit2mel.cpython-310.pyc +0 -0
diffusion/__pycache__/vocoder.cpython-310.pyc +0 -0
diffusion/__pycache__/wavenet.cpython-310.pyc +0 -0
edgetts/__pycache__/tts_voices.cpython-310.pyc +0 -0
filelists/test.txt +4 -0
filelists/train.txt +15 -0
filelists/val.txt +4 -0
inference/__pycache__/__init__.cpython-310.pyc +0 -0
inference/__pycache__/infer_tool.cpython-310.pyc +0 -0
inference/__pycache__/slicer.cpython-310.pyc +0 -0
logs/44k/diffusion/put_diffusion_pretrained_model_here +0 -0
logs/44k/put_pretrained_model_here +0 -0
modules/F0Predictor/__pycache__/F0Predictor.cpython-310.pyc +0 -0
modules/F0Predictor/__pycache__/HarvestF0Predictor.cpython-310.pyc +0 -0
modules/F0Predictor/__pycache__/__init__.cpython-310.pyc +0 -0
modules/__pycache__/DSConv.cpython-310.pyc +0 -0
modules/__pycache__/__init__.cpython-310.pyc +0 -0
modules/__pycache__/attentions.cpython-310.pyc +0 -0
modules/__pycache__/commons.cpython-310.pyc +0 -0
modules/__pycache__/modules.cpython-310.pyc +0 -0
pretrain/__init__.py +0 -0
pretrain/checkpoint_best_legacy_500.pt +3 -0
pretrain/meta.py +39 -0
pretrain/nsf_hifigan/put_nsf_hifigan_ckpt_here +0 -0
pretrain/put_hubert_ckpt_here +0 -0
raw/put_raw_wav_here +0 -0
trained/nahida/nahida.json +96 -0
trained/nahida/nahida_G_40000.pth +3 -0
vdecoder/__pycache__/__init__.cpython-310.pyc +0 -0
vdecoder/hifigan/__pycache__/env.cpython-310.pyc +0 -0
vdecoder/hifigan/__pycache__/models.cpython-310.pyc +0 -0
vdecoder/hifigan/__pycache__/utils.cpython-310.pyc +0 -0
vdecoder/nsf_hifigan/__pycache__/env.cpython-310.pyc +0 -0
vdecoder/nsf_hifigan/__pycache__/models.cpython-310.pyc +0 -0
vdecoder/nsf_hifigan/__pycache__/nvSTFT.cpython-310.pyc +0 -0
vdecoder/nsf_hifigan/__pycache__/utils.cpython-310.pyc +0 -0
vencoder/__pycache__/ContentVec256L9.cpython-310.pyc +0 -0
vencoder/__pycache__/__init__.cpython-310.pyc +0 -0
vencoder/__pycache__/encoder.cpython-310.pyc +0 -0

__pycache__/compress_model.cpython-310.pyc ADDED Viewed

Binary file (2.22 kB). View file

__pycache__/models.cpython-310.pyc ADDED Viewed

Binary file (14.7 kB). View file

__pycache__/utils.cpython-310.pyc ADDED Viewed

Binary file (20.5 kB). View file

cluster/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (1.06 kB). View file

configs/config.json ADDED Viewed

File without changes

dataset_raw/wav_structure.txt ADDED Viewed

	@@ -0,0 +1,20 @@

+数据集准备
+raw
+├───speaker0
+│   ├───xxx1-xxx1.wav
+│   ├───...
+│   └───Lxx-0xx8.wav
+└───speaker1
+    ├───xx2-0xxx2.wav
+    ├───...
+    └───xxx7-xxx007.wav
+此外还需要编辑config.json
+"n_speakers": 10
+"spk":{
+    "speaker0": 0,
+    "speaker1": 1,
+}

diffusion/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (132 Bytes). View file

diffusion/__pycache__/diffusion.cpython-310.pyc ADDED Viewed

Binary file (11.3 kB). View file

diffusion/__pycache__/unit2mel.cpython-310.pyc ADDED Viewed

Binary file (4.9 kB). View file

diffusion/__pycache__/vocoder.cpython-310.pyc ADDED Viewed

Binary file (3.52 kB). View file

diffusion/__pycache__/wavenet.cpython-310.pyc ADDED Viewed

Binary file (3.83 kB). View file

edgetts/__pycache__/tts_voices.cpython-310.pyc ADDED Viewed

Binary file (11.3 kB). View file

filelists/test.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+./dataset/44k/taffy/000562.wav
+./dataset/44k/nyaru/000011.wav
+./dataset/44k/nyaru/000008.wav
+./dataset/44k/taffy/000563.wav

filelists/train.txt ADDED Viewed

	@@ -0,0 +1,15 @@

+./dataset/44k/taffy/000549.wav
+./dataset/44k/nyaru/000004.wav
+./dataset/44k/nyaru/000006.wav
+./dataset/44k/taffy/000551.wav
+./dataset/44k/nyaru/000009.wav
+./dataset/44k/taffy/000561.wav
+./dataset/44k/nyaru/000001.wav
+./dataset/44k/taffy/000553.wav
+./dataset/44k/nyaru/000002.wav
+./dataset/44k/taffy/000560.wav
+./dataset/44k/taffy/000557.wav
+./dataset/44k/nyaru/000005.wav
+./dataset/44k/taffy/000554.wav
+./dataset/44k/taffy/000550.wav
+./dataset/44k/taffy/000559.wav

filelists/val.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+./dataset/44k/nyaru/000003.wav
+./dataset/44k/nyaru/000007.wav
+./dataset/44k/taffy/000558.wav
+./dataset/44k/taffy/000556.wav

inference/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (132 Bytes). View file

inference/__pycache__/infer_tool.cpython-310.pyc ADDED Viewed

Binary file (15.4 kB). View file

inference/__pycache__/slicer.cpython-310.pyc ADDED Viewed

Binary file (3.85 kB). View file

logs/44k/diffusion/put_diffusion_pretrained_model_here ADDED Viewed

File without changes

logs/44k/put_pretrained_model_here ADDED Viewed

File without changes

modules/F0Predictor/__pycache__/F0Predictor.cpython-310.pyc ADDED Viewed

Binary file (838 Bytes). View file

modules/F0Predictor/__pycache__/HarvestF0Predictor.cpython-310.pyc ADDED Viewed

Binary file (2.46 kB). View file

modules/F0Predictor/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (142 Bytes). View file

modules/__pycache__/DSConv.cpython-310.pyc ADDED Viewed

Binary file (2.98 kB). View file

modules/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (130 Bytes). View file

modules/__pycache__/attentions.cpython-310.pyc ADDED Viewed

Binary file (11.1 kB). View file

modules/__pycache__/commons.cpython-310.pyc ADDED Viewed

Binary file (6.39 kB). View file

modules/__pycache__/modules.cpython-310.pyc ADDED Viewed

Binary file (9.9 kB). View file

pretrain/__init__.py ADDED Viewed

File without changes

pretrain/checkpoint_best_legacy_500.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f54b40fd2802423a5643779c4861af1e9ee9c1564dc9d32f54f20b5ffba7db96
+size 189507909

pretrain/meta.py ADDED Viewed

	@@ -0,0 +1,39 @@

+def download_dict():  # Return a mapping from speech-encoder name to its download "url" and local "output" path.
+    return {  # every entry has exactly two string fields: "url" and "output"
+        "vec768l12": {  # same url/output pair as "vec256l9" below
+            "url": "https://ibm.ent.box.com/shared/static/z1wgl1stco8ffooyatzdwsqn2psd9lrr",
+            "output": "./pretrain/checkpoint_best_legacy_500.pt"
+        },
+        "vec256l9": {  # same url/output pair as "vec768l12" above
+            "url": "https://ibm.ent.box.com/shared/static/z1wgl1stco8ffooyatzdwsqn2psd9lrr",
+            "output": "./pretrain/checkpoint_best_legacy_500.pt"
+        },
+        "hubertsoft": {
+            "url": "https://github.com/bshall/hubert/releases/download/v0.1/hubert-soft-0d54a1f4.pt",
+            "output": "./pretrain/hubert-soft-0d54a1f4.pt"
+        },
+        "whisper-ppg-small": {
+            "url": "https://openaipublic.azureedge.net/main/whisper/models/9ecf779972d90ba49c06d968637d720dd632c55bbf19d441fb42bf17a411e794/small.pt",
+            "output": "./pretrain/small.pt"
+        },
+        "whisper-ppg": {
+            "url": "https://openaipublic.azureedge.net/main/whisper/models/345ae4da62f9b3d59415adc60127b97c714f32e89e936602e85993674d08dcb1/medium.pt",
+            "output": "./pretrain/medium.pt"
+        },
+        "whisper-ppg-large": {
+            "url": "https://openaipublic.azureedge.net/main/whisper/models/81f7c96c852ee8fc832187b0132e569d6c3065a3252ed18e56effd0b6a73e524/large-v2.pt",
+            "output": "./pretrain/large-v2.pt"
+        }
+    }
+def get_speech_encoder(config_path="configs/config.json"):  # Return the (url, output) pair for the speech encoder named in the JSON config at config_path.
+    import json  # imported at function scope, only needed here
+    with open(config_path, "r") as f:  # NOTE(review): no explicit encoding, so the platform default is used
+        data = f.read()
+        config = json.loads(data)
+        speech_encoder = config["model"]["speech_encoder"]  # KeyError if "model" or "speech_encoder" is missing
+        dict = download_dict()  # NOTE(review): this local name shadows the builtin dict inside the function
+        return dict[speech_encoder]["url"], dict[speech_encoder]["output"]  # KeyError if the name has no entry in download_dict()

pretrain/nsf_hifigan/put_nsf_hifigan_ckpt_here ADDED Viewed

File without changes

pretrain/put_hubert_ckpt_here ADDED Viewed

File without changes

raw/put_raw_wav_here ADDED Viewed

File without changes

trained/nahida/nahida.json ADDED Viewed

	@@ -0,0 +1,96 @@

+{
+  "train": {
+    "log_interval": 200,
+    "eval_interval": 800,
+    "seed": 1234,
+    "epochs": 10000,
+    "learning_rate": 0.00015,
+    "betas": [
+      0.8,
+      0.99
+    ],
+    "eps": 1e-09,
+    "batch_size": 12,
+    "fp16_run": false,
+    "lr_decay": 0.999875,
+    "segment_size": 10240,
+    "init_lr_ratio": 1,
+    "warmup_epochs": 0,
+    "c_mel": 45,
+    "c_kl": 1.0,
+    "use_sr": true,
+    "max_speclen": 512,
+    "port": "8001",
+    "keep_ckpts": 3,
+    "all_in_mem": false
+  },
+  "data": {
+    "training_files": "filelists/train.txt",
+    "validation_files": "filelists/val.txt",
+    "max_wav_value": 32768.0,
+    "sampling_rate": 44100,
+    "filter_length": 2048,
+    "hop_length": 512,
+    "win_length": 2048,
+    "n_mel_channels": 80,
+    "mel_fmin": 0.0,
+    "mel_fmax": 22050
+  },
+  "model": {
+    "inter_channels": 192,
+    "hidden_channels": 192,
+    "filter_channels": 768,
+    "n_heads": 2,
+    "n_layers": 6,
+    "kernel_size": 3,
+    "p_dropout": 0.1,
+    "resblock": "1",
+    "resblock_kernel_sizes": [
+      3,
+      7,
+      11
+    ],
+    "resblock_dilation_sizes": [
+      [
+        1,
+        3,
+        5
+      ],
+      [
+        1,
+        3,
+        5
+      ],
+      [
+        1,
+        3,
+        5
+      ]
+    ],
+    "upsample_rates": [
+      8,
+      8,
+      2,
+      2,
+      2
+    ],
+    "upsample_initial_channel": 512,
+    "upsample_kernel_sizes": [
+      16,
+      16,
+      4,
+      4,
+      4
+    ],
+    "n_layers_q": 3,
+    "use_spectral_norm": false,
+    "gin_channels": 256,
+    "ssl_dim": 256,
+    "n_speakers": 1,
+    "speech_encoder": "vec256l9",
+    "speaker_embedding": false
+  },
+  "spk": {
+    "nahida": 0
+  }
+}

trained/nahida/nahida_G_40000.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fec9506f8a762516e5321bcaedc72b6891d61a631e82ac596fe4e16e45b4652a
+size 542178077

vdecoder/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (131 Bytes). View file

vdecoder/hifigan/__pycache__/env.cpython-310.pyc ADDED Viewed

Binary file (804 Bytes). View file

vdecoder/hifigan/__pycache__/models.cpython-310.pyc ADDED Viewed

Binary file (16.3 kB). View file

vdecoder/hifigan/__pycache__/utils.cpython-310.pyc ADDED Viewed

Binary file (2.3 kB). View file

vdecoder/nsf_hifigan/__pycache__/env.cpython-310.pyc ADDED Viewed

Binary file (808 Bytes). View file

vdecoder/nsf_hifigan/__pycache__/models.cpython-310.pyc ADDED Viewed

Binary file (14.2 kB). View file

vdecoder/nsf_hifigan/__pycache__/nvSTFT.cpython-310.pyc ADDED Viewed

Binary file (4.26 kB). View file

vdecoder/nsf_hifigan/__pycache__/utils.cpython-310.pyc ADDED Viewed

Binary file (2.35 kB). View file

vencoder/__pycache__/ContentVec256L9.cpython-310.pyc ADDED Viewed

Binary file (1.55 kB). View file

vencoder/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (131 Bytes). View file

vencoder/__pycache__/encoder.cpython-310.pyc ADDED Viewed

Binary file (757 Bytes). View file