zdxiaoda committed on
Commit
f3367c4
·
1 Parent(s): ff55c95

Add application file

Browse files
Dockerfile DELETED
@@ -1,34 +0,0 @@
1
- FROM python:3.8
2
-
3
- RUN apt update
4
- RUN apt install -y git libsndfile1-dev python3 python3-dev python3-pip ffmpeg
5
- RUN python3 -m pip install --no-cache-dir --upgrade pip
6
-
7
- # Set up a new user named "user" with user ID 1000
8
- RUN useradd -m -u 1000 user
9
-
10
- # Switch to the "user" user
11
- USER user
12
-
13
- # Set home to the user's home directory
14
- ENV HOME=/home/user \
15
- PATH=/home/user/.local/bin:$PATH
16
-
17
- # Set the working directory to the user's home directory
18
- WORKDIR $HOME/
19
-
20
- # Copy the current directory contents into the container at $HOME/app setting the owner to the user
21
- COPY --chown=user . .
22
-
23
- RUN cd $HOME/so-vits-svc/pretrain && \
24
- wget -c https://github.com/openvpi/vocoders/releases/download/nsf-hifigan-v1/nsf_hifigan_20221211.zip && \
25
- unzip -q nsf_hifigan_20221211.zip
26
-
27
- RUN pip install --no-cache-dir --upgrade -r $HOME/so-vits-svc/requirements.txt
28
-
29
- ENV SERVER_NAME="0.0.0.0"
30
- ENV SERVER_PORT=7860
31
-
32
- WORKDIR $HOME/so-vits-svc
33
-
34
- CMD ["python3", "webUI.py"]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
models/sora_mix/config.json CHANGED
@@ -5,11 +5,8 @@
5
  "seed": 1234,
6
  "epochs": 10000,
7
  "learning_rate": 0.00005,
8
- "betas": [
9
- 0.8,
10
- 0.99
11
- ],
12
- "eps": 1e-09,
13
  "batch_size": 20,
14
  "fp16_run": false,
15
  "lr_decay": 0.999875,
@@ -45,43 +42,15 @@
45
  "kernel_size": 3,
46
  "p_dropout": 0.1,
47
  "resblock": "1",
48
- "resblock_kernel_sizes": [
49
- 3,
50
- 7,
51
- 11
52
- ],
53
  "resblock_dilation_sizes": [
54
- [
55
- 1,
56
- 3,
57
- 5
58
- ],
59
- [
60
- 1,
61
- 3,
62
- 5
63
- ],
64
- [
65
- 1,
66
- 3,
67
- 5
68
- ]
69
- ],
70
- "upsample_rates": [
71
- 8,
72
- 8,
73
- 2,
74
- 2,
75
- 2
76
  ],
 
77
  "upsample_initial_channel": 512,
78
- "upsample_kernel_sizes": [
79
- 16,
80
- 16,
81
- 4,
82
- 4,
83
- 4
84
- ],
85
  "n_layers_q": 3,
86
  "use_spectral_norm": false,
87
  "gin_channels": 256,
@@ -89,6 +58,6 @@
89
  "n_speakers": 1
90
  },
91
  "spk": {
92
- "kasugano_sora_mix": 0
93
  }
94
  }
 
5
  "seed": 1234,
6
  "epochs": 10000,
7
  "learning_rate": 0.00005,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
 
 
 
10
  "batch_size": 20,
11
  "fp16_run": false,
12
  "lr_decay": 0.999875,
 
42
  "kernel_size": 3,
43
  "p_dropout": 0.1,
44
  "resblock": "1",
45
+ "resblock_kernel_sizes": [3, 7, 11],
 
 
 
 
46
  "resblock_dilation_sizes": [
47
+ [1, 3, 5],
48
+ [1, 3, 5],
49
+ [1, 3, 5]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  ],
51
+ "upsample_rates": [8, 8, 2, 2, 2],
52
  "upsample_initial_channel": 512,
53
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
 
 
 
 
 
 
54
  "n_layers_q": 3,
55
  "use_spectral_norm": false,
56
  "gin_channels": 256,
 
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
+ "春日野穹_mix": 0
62
  }
63
  }
models/sora_speak/config.json CHANGED
@@ -5,11 +5,8 @@
5
  "seed": 1234,
6
  "epochs": 100000,
7
  "learning_rate": 0.0002,
8
- "betas": [
9
- 0.8,
10
- 0.99
11
- ],
12
- "eps": 1e-09,
13
  "batch_size": 20,
14
  "fp16_run": false,
15
  "lr_decay": 0.999875,
@@ -45,43 +42,15 @@
45
  "kernel_size": 3,
46
  "p_dropout": 0.1,
47
  "resblock": "1",
48
- "resblock_kernel_sizes": [
49
- 3,
50
- 7,
51
- 11
52
- ],
53
  "resblock_dilation_sizes": [
54
- [
55
- 1,
56
- 3,
57
- 5
58
- ],
59
- [
60
- 1,
61
- 3,
62
- 5
63
- ],
64
- [
65
- 1,
66
- 3,
67
- 5
68
- ]
69
- ],
70
- "upsample_rates": [
71
- 8,
72
- 8,
73
- 2,
74
- 2,
75
- 2
76
  ],
 
77
  "upsample_initial_channel": 512,
78
- "upsample_kernel_sizes": [
79
- 16,
80
- 16,
81
- 4,
82
- 4,
83
- 4
84
- ],
85
  "n_layers_q": 3,
86
  "use_spectral_norm": false,
87
  "gin_channels": 256,
@@ -89,6 +58,6 @@
89
  "n_speakers": 1
90
  },
91
  "spk": {
92
- "kasugano_sora_speak": 0
93
  }
94
  }
 
5
  "seed": 1234,
6
  "epochs": 100000,
7
  "learning_rate": 0.0002,
8
+ "betas": [0.8, 0.99],
9
+ "eps": 1e-9,
 
 
 
10
  "batch_size": 20,
11
  "fp16_run": false,
12
  "lr_decay": 0.999875,
 
42
  "kernel_size": 3,
43
  "p_dropout": 0.1,
44
  "resblock": "1",
45
+ "resblock_kernel_sizes": [3, 7, 11],
 
 
 
 
46
  "resblock_dilation_sizes": [
47
+ [1, 3, 5],
48
+ [1, 3, 5],
49
+ [1, 3, 5]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  ],
51
+ "upsample_rates": [8, 8, 2, 2, 2],
52
  "upsample_initial_channel": 512,
53
+ "upsample_kernel_sizes": [16, 16, 4, 4, 4],
 
 
 
 
 
 
54
  "n_layers_q": 3,
55
  "use_spectral_norm": false,
56
  "gin_channels": 256,
 
58
  "n_speakers": 1
59
  },
60
  "spk": {
61
+ "春日野穹_speak": 0
62
  }
63
  }
so-vits-svc/__pycache__/models.cpython-38.pyc ADDED
Binary file (12.4 kB). View file
 
so-vits-svc/__pycache__/utils.cpython-38.pyc ADDED
Binary file (17.8 kB). View file
 
so-vits-svc/cluster/__pycache__/__init__.cpython-38.pyc ADDED
Binary file (1.12 kB). View file
 
so-vits-svc/hubert/__pycache__/__init__.cpython-38.pyc ADDED
Binary file (167 Bytes). View file
 
so-vits-svc/hubert/__pycache__/hubert_model.cpython-38.pyc ADDED
Binary file (7.61 kB). View file
 
so-vits-svc/hubert/checkpoint_best_legacy_500.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60d936ec5a566776fc392e69ad8b630d14eb588111233fe313436e200a7b187b
3
+ size 1330114945
so-vits-svc/inference/__pycache__/__init__.cpython-38.pyc ADDED
Binary file (170 Bytes). View file
 
so-vits-svc/inference/__pycache__/infer_tool.cpython-38.pyc ADDED
Binary file (10.6 kB). View file
 
so-vits-svc/inference/__pycache__/slicer.cpython-38.pyc ADDED
Binary file (3.87 kB). View file
 
so-vits-svc/modules/__pycache__/__init__.cpython-38.pyc ADDED
Binary file (168 Bytes). View file
 
so-vits-svc/modules/__pycache__/attentions.cpython-38.pyc ADDED
Binary file (10.7 kB). View file
 
so-vits-svc/modules/__pycache__/commons.cpython-38.pyc ADDED
Binary file (6.66 kB). View file
 
so-vits-svc/modules/__pycache__/crepe.cpython-38.pyc ADDED
Binary file (8.83 kB). View file
 
so-vits-svc/modules/__pycache__/modules.cpython-38.pyc ADDED
Binary file (10.1 kB). View file
 
so-vits-svc/pretrain/nsf_hifigan/NOTICE.txt ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ --- DiffSinger Community Vocoder ---
2
+
3
+ ARCHITECTURE: NSF-HiFiGAN
4
+ RELEASE DATE: 2022-12-11
5
+
6
+ HYPER PARAMETERS:
7
+ - 44100 sample rate
8
+ - 128 mel bins
9
+ - 512 hop size
10
+ - 2048 window size
11
+ - fmin at 40Hz
12
+ - fmax at 16000Hz
13
+
14
+
15
+ NOTICE:
16
+
17
+ All model weights in the [DiffSinger Community Vocoder Project](https://openvpi.github.io/vocoders/), including
18
+ model weights in this directory, are provided by the [OpenVPI Team](https://github.com/openvpi/), under the
19
+ [Attribution-NonCommercial-ShareAlike 4.0 International](https://creativecommons.org/licenses/by-nc-sa/4.0/) license.
20
+
21
+
22
+ ACKNOWLEDGEMENTS:
23
+
24
+ Training data of this vocoder is provided and permitted by the following organizations, societies and individuals:
25
+
26
+ 孙飒 https://www.qfssr.cn
27
+ 赤松_Akamatsu https://www.zhibin.club
28
+ 乐威 https://www.zhibin.club
29
+ 伯添 https://space.bilibili.com/24087011
30
+ 雲宇光 https://space.bilibili.com/660675050
31
+ 橙子言 https://space.bilibili.com/318486464
32
+ 人衣大人 https://space.bilibili.com/2270344
33
+ 玖蝶 https://space.bilibili.com/676771003
34
+ Yuuko
35
+ 白夜零BYL https://space.bilibili.com/1605040503
36
+ 嗷天 https://space.bilibili.com/5675252
37
+ 洛泠羽 https://space.bilibili.com/347373318
38
+ 灰条纹的灰猫君 https://space.bilibili.com/2083633
39
+ 幽寂 https://space.bilibili.com/478860
40
+ 恶魔王女 https://space.bilibili.com/2475098
41
+ AlexYHX 芮晴
42
+ 绮萱 https://y.qq.com/n/ryqq/singer/003HjD6H4aZn1K
43
+ 诗芸 https://y.qq.com/n/ryqq/singer/0005NInj142zm0
44
+ 汐蕾 https://y.qq.com/n/ryqq/singer/0023cWMH1Bq1PJ
45
+ 1262917464
46
+ 炜阳
47
+ 叶卡yolka
48
+ 幸の夏 https://space.bilibili.com/1017297686
49
+ 暮色未量 https://space.bilibili.com/272904686
50
+ 晓寞sama https://space.bilibili.com/3463394
51
+ 没头绪的节操君
52
+ 串串BunC https://space.bilibili.com/95817834
53
+ 落雨 https://space.bilibili.com/1292427
54
+ 长尾巴的翎艾 https://space.bilibili.com/1638666
55
+ 声闻计划 https://space.bilibili.com/392812269
56
+ 唐家大小姐 http://5sing.kugou.com/palmusic/default.html
57
+ 不伊子
58
+
59
+ Training machines are provided by:
60
+
61
+ 花儿不哭 https://space.bilibili.com/5760446
62
+
63
+
64
+ TERMS OF REDISTRIBUTIONS:
65
+
66
+ 1. Do not sell this vocoder, or charge any fees from redistributing it, as prohibited by
67
+ the license.
68
+ 2. Include a copy of the CC BY-NC-SA 4.0 license, or a link referring to it.
69
+ 3. Include a copy of this notice, or any other notices informing that this vocoder is
70
+ provided by the OpenVPI Team, that this vocoder is licensed under CC BY-NC-SA 4.0, and
71
+ with a complete acknowledgement list as shown above.
72
+ 4. If you fine-tuned or modified the weights, leave a notice about what has been changed.
73
+ 5. (Optional) Leave a link to the official release page of the vocoder, and tell users
74
+ that other versions and future updates of this vocoder can be obtained from the website.
so-vits-svc/pretrain/nsf_hifigan/NOTICE.zh-CN.txt ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ --- DiffSinger 社区声码器 ---
2
+
3
+ 架构:NSF-HiFiGAN
4
+ 发布日期:2022-12-11
5
+
6
+ 超参数:
7
+ - 44100 sample rate
8
+ - 128 mel bins
9
+ - 512 hop size
10
+ - 2048 window size
11
+ - fmin at 40Hz
12
+ - fmax at 16000Hz
13
+
14
+
15
+ 注意事项:
16
+
17
+ [DiffSinger 社区声码器企划](https://openvpi.github.io/vocoders/) 中的所有模型权重,
18
+ 包括此目录下的模型权重,均由 [OpenVPI Team](https://github.com/openvpi/) 提供,并基于
19
+ [Attribution-NonCommercial-ShareAlike 4.0 International](https://creativecommons.org/licenses/by-nc-sa/4.0/)
20
+ 进行许可。
21
+
22
+
23
+ 致谢:
24
+
25
+ 此声码器的训练数据由以下组织、社团和个人提供并许可:
26
+
27
+ 孙飒 https://www.qfssr.cn
28
+ 赤松_Akamatsu https://www.zhibin.club
29
+ 乐威 https://www.zhibin.club
30
+ 伯添 https://space.bilibili.com/24087011
31
+ 雲宇光 https://space.bilibili.com/660675050
32
+ 橙子言 https://space.bilibili.com/318486464
33
+ 人衣大人 https://space.bilibili.com/2270344
34
+ 玖蝶 https://space.bilibili.com/676771003
35
+ Yuuko
36
+ 白夜零BYL https://space.bilibili.com/1605040503
37
+ 嗷天 https://space.bilibili.com/5675252
38
+ 洛泠羽 https://space.bilibili.com/347373318
39
+ 灰条纹的灰猫君 https://space.bilibili.com/2083633
40
+ 幽寂 https://space.bilibili.com/478860
41
+ 恶魔王女 https://space.bilibili.com/2475098
42
+ AlexYHX 芮晴
43
+ 绮萱 https://y.qq.com/n/ryqq/singer/003HjD6H4aZn1K
44
+ 诗芸 https://y.qq.com/n/ryqq/singer/0005NInj142zm0
45
+ 汐蕾 https://y.qq.com/n/ryqq/singer/0023cWMH1Bq1PJ
46
+ 1262917464
47
+ 炜阳
48
+ 叶卡yolka
49
+ 幸の夏 https://space.bilibili.com/1017297686
50
+ 暮色未量 https://space.bilibili.com/272904686
51
+ 晓寞sama https://space.bilibili.com/3463394
52
+ 没头绪的节操君
53
+ 串串BunC https://space.bilibili.com/95817834
54
+ 落雨 https://space.bilibili.com/1292427
55
+ 长尾巴的翎艾 https://space.bilibili.com/1638666
56
+ 声闻计划 https://space.bilibili.com/392812269
57
+ 唐家大小姐 http://5sing.kugou.com/palmusic/default.html
58
+ 不伊子
59
+
60
+ 训练算力的提供者如下:
61
+
62
+ 花儿不哭 https://space.bilibili.com/5760446
63
+
64
+
65
+ 二次分发条款:
66
+
67
+ 1. 请勿售卖此声码器或从其二次分发过程中收取任何费用,因为此类行为受到许可证的禁止。
68
+ 2. 请在二次分发文件中包含一份 CC BY-NC-SA 4.0 许可证的副本或指向该许可证的链接。
69
+ 3. 请在二次分发文件中包含这份声明,或以其他形式声明此声码器由 OpenVPI Team 提供并基于 CC BY-NC-SA 4.0 许可,
70
+ 并附带上述完整的致谢名单。
71
+ 4. 如果您微调或修改了权重,请留下一份关于其受到了何种修改的说明。
72
+ 5.(可选)留下一份指向此声码器的官方发布页面的链接,并告知使用者可从该网站获取此声码器的其他版本和未来的更新。
so-vits-svc/pretrain/nsf_hifigan/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "resblock": "1",
3
+ "num_gpus": 4,
4
+ "batch_size": 10,
5
+ "learning_rate": 0.0002,
6
+ "adam_b1": 0.8,
7
+ "adam_b2": 0.99,
8
+ "lr_decay": 0.999,
9
+ "seed": 1234,
10
+
11
+ "upsample_rates": [ 8, 8, 2, 2, 2],
12
+ "upsample_kernel_sizes": [16,16, 4, 4, 4],
13
+ "upsample_initial_channel": 512,
14
+ "resblock_kernel_sizes": [3,7,11],
15
+ "resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5]],
16
+ "discriminator_periods": [3, 5, 7, 11, 17, 23, 37],
17
+
18
+ "segment_size": 16384,
19
+ "num_mels": 128,
20
+ "num_freq": 1025,
21
+ "n_fft" : 2048,
22
+ "hop_size": 512,
23
+ "win_size": 2048,
24
+
25
+ "sampling_rate": 44100,
26
+
27
+ "fmin": 40,
28
+ "fmax": 16000,
29
+ "fmax_for_loss": null,
30
+
31
+ "num_workers": 16,
32
+
33
+ "dist_config": {
34
+ "dist_backend": "nccl",
35
+ "dist_url": "tcp://localhost:54321",
36
+ "world_size": 1
37
+ }
38
+ }
so-vits-svc/vdecoder/__pycache__/__init__.cpython-38.pyc ADDED
Binary file (169 Bytes). View file
 
so-vits-svc/vdecoder/hifigan/__pycache__/env.cpython-38.pyc CHANGED
Binary files a/so-vits-svc/vdecoder/hifigan/__pycache__/env.cpython-38.pyc and b/so-vits-svc/vdecoder/hifigan/__pycache__/env.cpython-38.pyc differ
 
so-vits-svc/vdecoder/hifigan/__pycache__/models.cpython-38.pyc CHANGED
Binary files a/so-vits-svc/vdecoder/hifigan/__pycache__/models.cpython-38.pyc and b/so-vits-svc/vdecoder/hifigan/__pycache__/models.cpython-38.pyc differ
 
so-vits-svc/vdecoder/hifigan/__pycache__/utils.cpython-38.pyc CHANGED
Binary files a/so-vits-svc/vdecoder/hifigan/__pycache__/utils.cpython-38.pyc and b/so-vits-svc/vdecoder/hifigan/__pycache__/utils.cpython-38.pyc differ
 
so-vits-svc/webUI.py CHANGED
@@ -313,7 +313,7 @@ with gr.Blocks(
313
  model_load_button.click(modelAnalysis,[model_path,config_path,cluster_model_path,device,enhance],[sid,sid_output])
314
  model_unload_button.click(modelUnload,[],[sid,sid_output])
315
  app.launch(
316
- server_name=os.environ.get("SERVER_NAME", "0.0.0.0"),
317
  server_port=int(os.environ.get("SERVER_PORT", 7860))
318
  )
319
 
 
313
  model_load_button.click(modelAnalysis,[model_path,config_path,cluster_model_path,device,enhance],[sid,sid_output])
314
  model_unload_button.click(modelUnload,[],[sid,sid_output])
315
  app.launch(
316
+ server_name=os.environ.get("SERVER_NAME", "127.0.0.1"),
317
  server_port=int(os.environ.get("SERVER_PORT", 7860))
318
  )
319