Upload 23 files
Browse files- .cardboardlint.yml +5 -0
- .dockerignore +9 -0
- .gitignore +171 -0
- .pre-commit-config.yaml +27 -0
- .pylintrc +599 -0
- .readthedocs.yml +23 -0
- CITATION.cff +20 -0
- CODE_OF_CONDUCT.md +133 -0
- CODE_OWNERS.rst +75 -0
- CONTRIBUTING.md +136 -0
- Dockerfile +13 -0
- LICENSE.txt +373 -0
- MANIFEST.in +15 -0
- Makefile +72 -0
- README.md +373 -3
- hubconf.py +46 -0
- pyproject.toml +33 -0
- requirements.dev.txt +5 -0
- requirements.notebooks.txt +1 -0
- requirements.txt +53 -0
- run_bash_tests.sh +7 -0
- setup.cfg +8 -0
- setup.py +138 -0
.cardboardlint.yml
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
linters:
|
2 |
+
- pylint:
|
3 |
+
# pylintrc: pylintrc
|
4 |
+
filefilter: ['- test_*.py', '+ *.py', '- *.npy']
|
5 |
+
# exclude:
|
.dockerignore
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
.git/
|
2 |
+
Dockerfile
|
3 |
+
build/
|
4 |
+
dist/
|
5 |
+
TTS.egg-info/
|
6 |
+
tests/outputs/*
|
7 |
+
tests/train_outputs/*
|
8 |
+
__pycache__/
|
9 |
+
*.pyc
|
.gitignore
ADDED
@@ -0,0 +1,171 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
WadaSNR/
|
2 |
+
.idea/
|
3 |
+
*.pyc
|
4 |
+
.DS_Store
|
5 |
+
./__init__.py
|
6 |
+
# Byte-compiled / optimized / DLL files
|
7 |
+
__pycache__/
|
8 |
+
*.py[cod]
|
9 |
+
*$py.class
|
10 |
+
|
11 |
+
# C extensions
|
12 |
+
*.so
|
13 |
+
|
14 |
+
# Distribution / packaging
|
15 |
+
.Python
|
16 |
+
build/
|
17 |
+
develop-eggs/
|
18 |
+
dist/
|
19 |
+
downloads/
|
20 |
+
eggs/
|
21 |
+
.eggs/
|
22 |
+
lib/
|
23 |
+
lib64/
|
24 |
+
parts/
|
25 |
+
sdist/
|
26 |
+
var/
|
27 |
+
wheels/
|
28 |
+
*.egg-info/
|
29 |
+
.installed.cfg
|
30 |
+
*.egg
|
31 |
+
MANIFEST
|
32 |
+
|
33 |
+
# PyInstaller
|
34 |
+
# Usually these files are written by a python script from a template
|
35 |
+
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
36 |
+
*.manifest
|
37 |
+
*.spec
|
38 |
+
|
39 |
+
# Installer logs
|
40 |
+
pip-log.txt
|
41 |
+
pip-delete-this-directory.txt
|
42 |
+
|
43 |
+
# Unit test / coverage reports
|
44 |
+
htmlcov/
|
45 |
+
.tox/
|
46 |
+
.coverage
|
47 |
+
.coverage.*
|
48 |
+
.cache
|
49 |
+
nosetests.xml
|
50 |
+
coverage.xml
|
51 |
+
*.cover
|
52 |
+
.hypothesis/
|
53 |
+
|
54 |
+
# Translations
|
55 |
+
*.mo
|
56 |
+
*.pot
|
57 |
+
|
58 |
+
# Django stuff:
|
59 |
+
*.log
|
60 |
+
.static_storage/
|
61 |
+
.media/
|
62 |
+
local_settings.py
|
63 |
+
|
64 |
+
# Flask stuff:
|
65 |
+
instance/
|
66 |
+
.webassets-cache
|
67 |
+
|
68 |
+
# Scrapy stuff:
|
69 |
+
.scrapy
|
70 |
+
|
71 |
+
# Sphinx documentation
|
72 |
+
docs/_build/
|
73 |
+
|
74 |
+
# PyBuilder
|
75 |
+
target/
|
76 |
+
|
77 |
+
# Jupyter Notebook
|
78 |
+
.ipynb_checkpoints
|
79 |
+
|
80 |
+
# pyenv
|
81 |
+
.python-version
|
82 |
+
|
83 |
+
# celery beat schedule file
|
84 |
+
celerybeat-schedule
|
85 |
+
|
86 |
+
# SageMath parsed files
|
87 |
+
*.sage.py
|
88 |
+
|
89 |
+
# Environments
|
90 |
+
.env
|
91 |
+
.venv
|
92 |
+
env/
|
93 |
+
venv/
|
94 |
+
ENV/
|
95 |
+
env.bak/
|
96 |
+
venv.bak/
|
97 |
+
|
98 |
+
# Spyder project settings
|
99 |
+
.spyderproject
|
100 |
+
.spyproject
|
101 |
+
|
102 |
+
# Rope project settings
|
103 |
+
.ropeproject
|
104 |
+
|
105 |
+
# mkdocs documentation
|
106 |
+
/site
|
107 |
+
|
108 |
+
# mypy
|
109 |
+
.mypy_cache/
|
110 |
+
|
111 |
+
# vim
|
112 |
+
*.swp
|
113 |
+
*.swm
|
114 |
+
*.swn
|
115 |
+
*.swo
|
116 |
+
|
117 |
+
# pytorch models
|
118 |
+
*.pth
|
119 |
+
*.pth.tar
|
120 |
+
!dummy_speakers.pth
|
121 |
+
result/
|
122 |
+
|
123 |
+
# setup.py
|
124 |
+
version.py
|
125 |
+
|
126 |
+
# jupyter dummy files
|
127 |
+
core
|
128 |
+
|
129 |
+
# ignore local datasets
|
130 |
+
recipes/WIP/*
|
131 |
+
recipes/ljspeech/LJSpeech-1.1/*
|
132 |
+
recipes/vctk/VCTK/*
|
133 |
+
recipes/**/*.npy
|
134 |
+
recipes/**/*.json
|
135 |
+
VCTK-Corpus-removed-silence/*
|
136 |
+
|
137 |
+
# ignore training logs
|
138 |
+
trainer_*_log.txt
|
139 |
+
|
140 |
+
# files used internally for dev, test etc.
|
141 |
+
tests/outputs/*
|
142 |
+
tests/train_outputs/*
|
143 |
+
TODO.txt
|
144 |
+
.vscode/*
|
145 |
+
data/*
|
146 |
+
notebooks/data/*
|
147 |
+
TTS/tts/utils/monotonic_align/core.c
|
148 |
+
.vscode-upload.json
|
149 |
+
temp_build/*
|
150 |
+
events.out*
|
151 |
+
old_configs/*
|
152 |
+
model_importers/*
|
153 |
+
model_profiling/*
|
154 |
+
docs/source/TODO/*
|
155 |
+
.noseids
|
156 |
+
.dccache
|
157 |
+
log.txt
|
158 |
+
umap.png
|
159 |
+
*.out
|
160 |
+
SocialMedia.txt
|
161 |
+
output.wav
|
162 |
+
tts_output.wav
|
163 |
+
deps.json
|
164 |
+
speakers.json
|
165 |
+
internal/*
|
166 |
+
*_pitch.npy
|
167 |
+
*_phoneme.npy
|
168 |
+
wandb
|
169 |
+
depot/*
|
170 |
+
coqui_recipes/*
|
171 |
+
local_scripts/*
|
.pre-commit-config.yaml
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
repos:
|
2 |
+
- repo: 'https://github.com/pre-commit/pre-commit-hooks'
|
3 |
+
rev: v2.3.0
|
4 |
+
hooks:
|
5 |
+
- id: check-yaml
|
6 |
+
- id: end-of-file-fixer
|
7 |
+
- id: trailing-whitespace
|
8 |
+
- repo: 'https://github.com/psf/black'
|
9 |
+
rev: 22.3.0
|
10 |
+
hooks:
|
11 |
+
- id: black
|
12 |
+
language_version: python3
|
13 |
+
- repo: https://github.com/pycqa/isort
|
14 |
+
rev: 5.8.0
|
15 |
+
hooks:
|
16 |
+
- id: isort
|
17 |
+
name: isort (python)
|
18 |
+
- id: isort
|
19 |
+
name: isort (cython)
|
20 |
+
types: [cython]
|
21 |
+
- id: isort
|
22 |
+
name: isort (pyi)
|
23 |
+
types: [pyi]
|
24 |
+
- repo: https://github.com/pycqa/pylint
|
25 |
+
rev: v2.8.2
|
26 |
+
hooks:
|
27 |
+
- id: pylint
|
.pylintrc
ADDED
@@ -0,0 +1,599 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[MASTER]
|
2 |
+
|
3 |
+
# A comma-separated list of package or module names from where C extensions may
|
4 |
+
# be loaded. Extensions are loaded into the active Python interpreter and may
|
5 |
+
# run arbitrary code.
|
6 |
+
extension-pkg-whitelist=
|
7 |
+
|
8 |
+
# Add files or directories to the blacklist. They should be base names, not
|
9 |
+
# paths.
|
10 |
+
ignore=CVS
|
11 |
+
|
12 |
+
# Add files or directories matching the regex patterns to the blacklist. The
|
13 |
+
# regex matches against base names, not paths.
|
14 |
+
ignore-patterns=
|
15 |
+
|
16 |
+
# Python code to execute, usually for sys.path manipulation such as
|
17 |
+
# pygtk.require().
|
18 |
+
#init-hook=
|
19 |
+
|
20 |
+
# Use multiple processes to speed up Pylint. Specifying 0 will auto-detect the
|
21 |
+
# number of processors available to use.
|
22 |
+
jobs=1
|
23 |
+
|
24 |
+
# Control the amount of potential inferred values when inferring a single
|
25 |
+
# object. This can help the performance when dealing with large functions or
|
26 |
+
# complex, nested conditions.
|
27 |
+
limit-inference-results=100
|
28 |
+
|
29 |
+
# List of plugins (as comma separated values of python modules names) to load,
|
30 |
+
# usually to register additional checkers.
|
31 |
+
load-plugins=
|
32 |
+
|
33 |
+
# Pickle collected data for later comparisons.
|
34 |
+
persistent=yes
|
35 |
+
|
36 |
+
# Specify a configuration file.
|
37 |
+
#rcfile=
|
38 |
+
|
39 |
+
# When enabled, pylint would attempt to guess common misconfiguration and emit
|
40 |
+
# user-friendly hints instead of false-positive error messages.
|
41 |
+
suggestion-mode=yes
|
42 |
+
|
43 |
+
# Allow loading of arbitrary C extensions. Extensions are imported into the
|
44 |
+
# active Python interpreter and may run arbitrary code.
|
45 |
+
unsafe-load-any-extension=no
|
46 |
+
|
47 |
+
|
48 |
+
[MESSAGES CONTROL]
|
49 |
+
|
50 |
+
# Only show warnings with the listed confidence levels. Leave empty to show
|
51 |
+
# all. Valid levels: HIGH, INFERENCE, INFERENCE_FAILURE, UNDEFINED.
|
52 |
+
confidence=
|
53 |
+
|
54 |
+
# Disable the message, report, category or checker with the given id(s). You
|
55 |
+
# can either give multiple identifiers separated by comma (,) or put this
|
56 |
+
# option multiple times (only on the command line, not in the configuration
|
57 |
+
# file where it should appear only once). You can also use "--disable=all" to
|
58 |
+
# disable everything first and then reenable specific checks. For example, if
|
59 |
+
# you want to run only the similarities checker, you can use "--disable=all
|
60 |
+
# --enable=similarities". If you want to run only the classes checker, but have
|
61 |
+
# no Warning level messages displayed, use "--disable=all --enable=classes
|
62 |
+
# --disable=W".
|
63 |
+
disable=missing-docstring,
|
64 |
+
too-many-public-methods,
|
65 |
+
too-many-lines,
|
66 |
+
bare-except,
|
67 |
+
## for avoiding weird p3.6 CI linter error
|
68 |
+
## TODO: see later if we can remove this
|
69 |
+
assigning-non-slot,
|
70 |
+
unsupported-assignment-operation,
|
71 |
+
## end
|
72 |
+
line-too-long,
|
73 |
+
fixme,
|
74 |
+
wrong-import-order,
|
75 |
+
ungrouped-imports,
|
76 |
+
wrong-import-position,
|
77 |
+
import-error,
|
78 |
+
invalid-name,
|
79 |
+
too-many-instance-attributes,
|
80 |
+
arguments-differ,
|
81 |
+
arguments-renamed,
|
82 |
+
no-name-in-module,
|
83 |
+
no-member,
|
84 |
+
unsubscriptable-object,
|
85 |
+
print-statement,
|
86 |
+
parameter-unpacking,
|
87 |
+
unpacking-in-except,
|
88 |
+
old-raise-syntax,
|
89 |
+
backtick,
|
90 |
+
long-suffix,
|
91 |
+
old-ne-operator,
|
92 |
+
old-octal-literal,
|
93 |
+
import-star-module-level,
|
94 |
+
non-ascii-bytes-literal,
|
95 |
+
raw-checker-failed,
|
96 |
+
bad-inline-option,
|
97 |
+
locally-disabled,
|
98 |
+
file-ignored,
|
99 |
+
suppressed-message,
|
100 |
+
useless-suppression,
|
101 |
+
deprecated-pragma,
|
102 |
+
use-symbolic-message-instead,
|
103 |
+
useless-object-inheritance,
|
104 |
+
too-few-public-methods,
|
105 |
+
too-many-branches,
|
106 |
+
too-many-arguments,
|
107 |
+
too-many-locals,
|
108 |
+
too-many-statements,
|
109 |
+
apply-builtin,
|
110 |
+
basestring-builtin,
|
111 |
+
buffer-builtin,
|
112 |
+
cmp-builtin,
|
113 |
+
coerce-builtin,
|
114 |
+
execfile-builtin,
|
115 |
+
file-builtin,
|
116 |
+
long-builtin,
|
117 |
+
raw_input-builtin,
|
118 |
+
reduce-builtin,
|
119 |
+
standarderror-builtin,
|
120 |
+
unicode-builtin,
|
121 |
+
xrange-builtin,
|
122 |
+
coerce-method,
|
123 |
+
delslice-method,
|
124 |
+
getslice-method,
|
125 |
+
setslice-method,
|
126 |
+
no-absolute-import,
|
127 |
+
old-division,
|
128 |
+
dict-iter-method,
|
129 |
+
dict-view-method,
|
130 |
+
next-method-called,
|
131 |
+
metaclass-assignment,
|
132 |
+
indexing-exception,
|
133 |
+
raising-string,
|
134 |
+
reload-builtin,
|
135 |
+
oct-method,
|
136 |
+
hex-method,
|
137 |
+
nonzero-method,
|
138 |
+
cmp-method,
|
139 |
+
input-builtin,
|
140 |
+
round-builtin,
|
141 |
+
intern-builtin,
|
142 |
+
unichr-builtin,
|
143 |
+
map-builtin-not-iterating,
|
144 |
+
zip-builtin-not-iterating,
|
145 |
+
range-builtin-not-iterating,
|
146 |
+
filter-builtin-not-iterating,
|
147 |
+
using-cmp-argument,
|
148 |
+
eq-without-hash,
|
149 |
+
div-method,
|
150 |
+
idiv-method,
|
151 |
+
rdiv-method,
|
152 |
+
exception-message-attribute,
|
153 |
+
invalid-str-codec,
|
154 |
+
sys-max-int,
|
155 |
+
bad-python3-import,
|
156 |
+
deprecated-string-function,
|
157 |
+
deprecated-str-translate-call,
|
158 |
+
deprecated-itertools-function,
|
159 |
+
deprecated-types-field,
|
160 |
+
next-method-defined,
|
161 |
+
dict-items-not-iterating,
|
162 |
+
dict-keys-not-iterating,
|
163 |
+
dict-values-not-iterating,
|
164 |
+
deprecated-operator-function,
|
165 |
+
deprecated-urllib-function,
|
166 |
+
xreadlines-attribute,
|
167 |
+
deprecated-sys-function,
|
168 |
+
exception-escape,
|
169 |
+
comprehension-escape,
|
170 |
+
duplicate-code,
|
171 |
+
not-callable,
|
172 |
+
import-outside-toplevel,
|
173 |
+
logging-fstring-interpolation,
|
174 |
+
logging-not-lazy
|
175 |
+
|
176 |
+
# Enable the message, report, category or checker with the given id(s). You can
|
177 |
+
# either give multiple identifiers separated by comma (,) or put this option
|
178 |
+
# multiple times (only on the command line, not in the configuration file where
|
179 |
+
# it should appear only once). See also the "--disable" option for examples.
|
180 |
+
enable=c-extension-no-member
|
181 |
+
|
182 |
+
|
183 |
+
[REPORTS]
|
184 |
+
|
185 |
+
# Python expression which should return a note less than 10 (10 is the highest
|
186 |
+
# note). You have access to the variables error, warning, statement which
|
187 |
+
# respectively contain the number of errors / warnings messages and the total
|
188 |
+
# number of statements analyzed. This is used by the global evaluation report
|
189 |
+
# (RP0004).
|
190 |
+
evaluation=10.0 - ((float(5 * error + warning + refactor + convention) / statement) * 10)
|
191 |
+
|
192 |
+
# Template used to display messages. This is a python new-style format string
|
193 |
+
# used to format the message information. See doc for all details.
|
194 |
+
#msg-template=
|
195 |
+
|
196 |
+
# Set the output format. Available formats are text, parseable, colorized, json
|
197 |
+
# and msvs (visual studio). You can also give a reporter class, e.g.
|
198 |
+
# mypackage.mymodule.MyReporterClass.
|
199 |
+
output-format=text
|
200 |
+
|
201 |
+
# Tells whether to display a full report or only the messages.
|
202 |
+
reports=no
|
203 |
+
|
204 |
+
# Activate the evaluation score.
|
205 |
+
score=yes
|
206 |
+
|
207 |
+
|
208 |
+
[REFACTORING]
|
209 |
+
|
210 |
+
# Maximum number of nested blocks for function / method body
|
211 |
+
max-nested-blocks=5
|
212 |
+
|
213 |
+
# Complete names of functions that never return. When checking for
|
214 |
+
# inconsistent-return-statements if a never returning function is called then
|
215 |
+
# it will be considered as an explicit return statement and no message will be
|
216 |
+
# printed.
|
217 |
+
never-returning-functions=sys.exit
|
218 |
+
|
219 |
+
|
220 |
+
[LOGGING]
|
221 |
+
|
222 |
+
# Format style used to check logging format string. `old` means using %
|
223 |
+
# formatting, while `new` is for `{}` formatting.
|
224 |
+
logging-format-style=old
|
225 |
+
|
226 |
+
# Logging modules to check that the string format arguments are in logging
|
227 |
+
# function parameter format.
|
228 |
+
logging-modules=logging
|
229 |
+
|
230 |
+
|
231 |
+
[SPELLING]
|
232 |
+
|
233 |
+
# Limits count of emitted suggestions for spelling mistakes.
|
234 |
+
max-spelling-suggestions=4
|
235 |
+
|
236 |
+
# Spelling dictionary name. Available dictionaries: none. To make it work,
|
237 |
+
# install the python-enchant package.
|
238 |
+
spelling-dict=
|
239 |
+
|
240 |
+
# List of comma separated words that should not be checked.
|
241 |
+
spelling-ignore-words=
|
242 |
+
|
243 |
+
# A path to a file that contains private dictionary; one word per line.
|
244 |
+
spelling-private-dict-file=
|
245 |
+
|
246 |
+
# Tells whether to store unknown words to indicated private dictionary in
|
247 |
+
# --spelling-private-dict-file option instead of raising a message.
|
248 |
+
spelling-store-unknown-words=no
|
249 |
+
|
250 |
+
|
251 |
+
[MISCELLANEOUS]
|
252 |
+
|
253 |
+
# List of note tags to take into consideration, separated by a comma.
|
254 |
+
notes=FIXME,
|
255 |
+
XXX,
|
256 |
+
TODO
|
257 |
+
|
258 |
+
|
259 |
+
[TYPECHECK]
|
260 |
+
|
261 |
+
# List of decorators that produce context managers, such as
|
262 |
+
# contextlib.contextmanager. Add to this list to register other decorators that
|
263 |
+
# produce valid context managers.
|
264 |
+
contextmanager-decorators=contextlib.contextmanager
|
265 |
+
|
266 |
+
# List of members which are set dynamically and missed by pylint inference
|
267 |
+
# system, and so shouldn't trigger E1101 when accessed. Python regular
|
268 |
+
# expressions are accepted.
|
269 |
+
generated-members=numpy.*,torch.*
|
270 |
+
|
271 |
+
# Tells whether missing members accessed in mixin class should be ignored. A
|
272 |
+
# mixin class is detected if its name ends with "mixin" (case insensitive).
|
273 |
+
ignore-mixin-members=yes
|
274 |
+
|
275 |
+
# Tells whether to warn about missing members when the owner of the attribute
|
276 |
+
# is inferred to be None.
|
277 |
+
ignore-none=yes
|
278 |
+
|
279 |
+
# This flag controls whether pylint should warn about no-member and similar
|
280 |
+
# checks whenever an opaque object is returned when inferring. The inference
|
281 |
+
# can return multiple potential results while evaluating a Python object, but
|
282 |
+
# some branches might not be evaluated, which results in partial inference. In
|
283 |
+
# that case, it might be useful to still emit no-member and other checks for
|
284 |
+
# the rest of the inferred objects.
|
285 |
+
ignore-on-opaque-inference=yes
|
286 |
+
|
287 |
+
# List of class names for which member attributes should not be checked (useful
|
288 |
+
# for classes with dynamically set attributes). This supports the use of
|
289 |
+
# qualified names.
|
290 |
+
ignored-classes=optparse.Values,thread._local,_thread._local
|
291 |
+
|
292 |
+
# List of module names for which member attributes should not be checked
|
293 |
+
# (useful for modules/projects where namespaces are manipulated during runtime
|
294 |
+
# and thus existing member attributes cannot be deduced by static analysis. It
|
295 |
+
# supports qualified module names, as well as Unix pattern matching.
|
296 |
+
ignored-modules=
|
297 |
+
|
298 |
+
# Show a hint with possible names when a member name was not found. The aspect
|
299 |
+
# of finding the hint is based on edit distance.
|
300 |
+
missing-member-hint=yes
|
301 |
+
|
302 |
+
# The minimum edit distance a name should have in order to be considered a
|
303 |
+
# similar match for a missing member name.
|
304 |
+
missing-member-hint-distance=1
|
305 |
+
|
306 |
+
# The total number of similar names that should be taken into consideration when
|
307 |
+
# showing a hint for a missing member.
|
308 |
+
missing-member-max-choices=1
|
309 |
+
|
310 |
+
|
311 |
+
[VARIABLES]
|
312 |
+
|
313 |
+
# List of additional names supposed to be defined in builtins. Remember that
|
314 |
+
# you should avoid defining new builtins when possible.
|
315 |
+
additional-builtins=
|
316 |
+
|
317 |
+
# Tells whether unused global variables should be treated as a violation.
|
318 |
+
allow-global-unused-variables=yes
|
319 |
+
|
320 |
+
# List of strings which can identify a callback function by name. A callback
|
321 |
+
# name must start or end with one of those strings.
|
322 |
+
callbacks=cb_,
|
323 |
+
_cb
|
324 |
+
|
325 |
+
# A regular expression matching the name of dummy variables (i.e. expected to
|
326 |
+
# not be used).
|
327 |
+
dummy-variables-rgx=_+$|(_[a-zA-Z0-9_]*[a-zA-Z0-9]+?$)|dummy|^ignored_|^unused_
|
328 |
+
|
329 |
+
# Argument names that match this expression will be ignored. Default to name
|
330 |
+
# with leading underscore.
|
331 |
+
ignored-argument-names=_.*|^ignored_|^unused_
|
332 |
+
|
333 |
+
# Tells whether we should check for unused import in __init__ files.
|
334 |
+
init-import=no
|
335 |
+
|
336 |
+
# List of qualified module names which can have objects that can redefine
|
337 |
+
# builtins.
|
338 |
+
redefining-builtins-modules=six.moves,past.builtins,future.builtins,builtins,io
|
339 |
+
|
340 |
+
|
341 |
+
[FORMAT]
|
342 |
+
|
343 |
+
# Expected format of line ending, e.g. empty (any line ending), LF or CRLF.
|
344 |
+
expected-line-ending-format=
|
345 |
+
|
346 |
+
# Regexp for a line that is allowed to be longer than the limit.
|
347 |
+
ignore-long-lines=^\s*(# )?<?https?://\S+>?$
|
348 |
+
|
349 |
+
# Number of spaces of indent required inside a hanging or continued line.
|
350 |
+
indent-after-paren=4
|
351 |
+
|
352 |
+
# String used as indentation unit. This is usually "    " (4 spaces) or "\t" (1
|
353 |
+
# tab).
|
354 |
+
indent-string=' '
|
355 |
+
|
356 |
+
# Maximum number of characters on a single line.
|
357 |
+
max-line-length=120
|
358 |
+
|
359 |
+
# Maximum number of lines in a module.
|
360 |
+
max-module-lines=1000
|
361 |
+
|
362 |
+
# List of optional constructs for which whitespace checking is disabled. `dict-
|
363 |
+
# separator` is used to allow tabulation in dicts, etc.: {1 : 1,\n222: 2}.
|
364 |
+
# `trailing-comma` allows a space between comma and closing bracket: (a, ).
|
365 |
+
# `empty-line` allows space-only lines.
|
366 |
+
no-space-check=trailing-comma,
|
367 |
+
dict-separator
|
368 |
+
|
369 |
+
# Allow the body of a class to be on the same line as the declaration if body
|
370 |
+
# contains single statement.
|
371 |
+
single-line-class-stmt=no
|
372 |
+
|
373 |
+
# Allow the body of an if to be on the same line as the test if there is no
|
374 |
+
# else.
|
375 |
+
single-line-if-stmt=no
|
376 |
+
|
377 |
+
|
378 |
+
[SIMILARITIES]
|
379 |
+
|
380 |
+
# Ignore comments when computing similarities.
|
381 |
+
ignore-comments=yes
|
382 |
+
|
383 |
+
# Ignore docstrings when computing similarities.
|
384 |
+
ignore-docstrings=yes
|
385 |
+
|
386 |
+
# Ignore imports when computing similarities.
|
387 |
+
ignore-imports=no
|
388 |
+
|
389 |
+
# Minimum number of lines of a similarity.
|
390 |
+
min-similarity-lines=4
|
391 |
+
|
392 |
+
|
393 |
+
[BASIC]
|
394 |
+
|
395 |
+
# Naming style matching correct argument names.
|
396 |
+
argument-naming-style=snake_case
|
397 |
+
|
398 |
+
# Regular expression matching correct argument names. Overrides argument-
|
399 |
+
# naming-style.
|
400 |
+
argument-rgx=[a-z_][a-z0-9_]{0,30}$
|
401 |
+
|
402 |
+
# Naming style matching correct attribute names.
|
403 |
+
attr-naming-style=snake_case
|
404 |
+
|
405 |
+
# Regular expression matching correct attribute names. Overrides attr-naming-
|
406 |
+
# style.
|
407 |
+
#attr-rgx=
|
408 |
+
|
409 |
+
# Bad variable names which should always be refused, separated by a comma.
|
410 |
+
bad-names=
|
411 |
+
|
412 |
+
# Naming style matching correct class attribute names.
|
413 |
+
class-attribute-naming-style=any
|
414 |
+
|
415 |
+
# Regular expression matching correct class attribute names. Overrides class-
|
416 |
+
# attribute-naming-style.
|
417 |
+
#class-attribute-rgx=
|
418 |
+
|
419 |
+
# Naming style matching correct class names.
|
420 |
+
class-naming-style=PascalCase
|
421 |
+
|
422 |
+
# Regular expression matching correct class names. Overrides class-naming-
|
423 |
+
# style.
|
424 |
+
#class-rgx=
|
425 |
+
|
426 |
+
# Naming style matching correct constant names.
|
427 |
+
const-naming-style=UPPER_CASE
|
428 |
+
|
429 |
+
# Regular expression matching correct constant names. Overrides const-naming-
|
430 |
+
# style.
|
431 |
+
#const-rgx=
|
432 |
+
|
433 |
+
# Minimum line length for functions/classes that require docstrings, shorter
|
434 |
+
# ones are exempt.
|
435 |
+
docstring-min-length=-1
|
436 |
+
|
437 |
+
# Naming style matching correct function names.
|
438 |
+
function-naming-style=snake_case
|
439 |
+
|
440 |
+
# Regular expression matching correct function names. Overrides function-
|
441 |
+
# naming-style.
|
442 |
+
#function-rgx=
|
443 |
+
|
444 |
+
# Good variable names which should always be accepted, separated by a comma.
|
445 |
+
good-names=i,
|
446 |
+
j,
|
447 |
+
k,
|
448 |
+
x,
|
449 |
+
ex,
|
450 |
+
Run,
|
451 |
+
_
|
452 |
+
|
453 |
+
# Include a hint for the correct naming format with invalid-name.
|
454 |
+
include-naming-hint=no
|
455 |
+
|
456 |
+
# Naming style matching correct inline iteration names.
|
457 |
+
inlinevar-naming-style=any
|
458 |
+
|
459 |
+
# Regular expression matching correct inline iteration names. Overrides
|
460 |
+
# inlinevar-naming-style.
|
461 |
+
#inlinevar-rgx=
|
462 |
+
|
463 |
+
# Naming style matching correct method names.
|
464 |
+
method-naming-style=snake_case
|
465 |
+
|
466 |
+
# Regular expression matching correct method names. Overrides method-naming-
|
467 |
+
# style.
|
468 |
+
#method-rgx=
|
469 |
+
|
470 |
+
# Naming style matching correct module names.
|
471 |
+
module-naming-style=snake_case
|
472 |
+
|
473 |
+
# Regular expression matching correct module names. Overrides module-naming-
|
474 |
+
# style.
|
475 |
+
#module-rgx=
|
476 |
+
|
477 |
+
# Colon-delimited sets of names that determine each other's naming style when
|
478 |
+
# the name regexes allow several styles.
|
479 |
+
name-group=
|
480 |
+
|
481 |
+
# Regular expression which should only match function or class names that do
|
482 |
+
# not require a docstring.
|
483 |
+
no-docstring-rgx=^_
|
484 |
+
|
485 |
+
# List of decorators that produce properties, such as abc.abstractproperty. Add
|
486 |
+
# to this list to register other decorators that produce valid properties.
|
487 |
+
# These decorators are taken into consideration only for invalid-name.
|
488 |
+
property-classes=abc.abstractproperty
|
489 |
+
|
490 |
+
# Naming style matching correct variable names.
|
491 |
+
variable-naming-style=snake_case
|
492 |
+
|
493 |
+
# Regular expression matching correct variable names. Overrides variable-
|
494 |
+
# naming-style.
|
495 |
+
variable-rgx=[a-z_][a-z0-9_]{0,30}$
|
496 |
+
|
497 |
+
|
498 |
+
[STRING]
|
499 |
+
|
500 |
+
# This flag controls whether the implicit-str-concat-in-sequence should
|
501 |
+
# generate a warning on implicit string concatenation in sequences defined over
|
502 |
+
# several lines.
|
503 |
+
check-str-concat-over-line-jumps=no
|
504 |
+
|
505 |
+
|
506 |
+
[IMPORTS]
|
507 |
+
|
508 |
+
# Allow wildcard imports from modules that define __all__.
|
509 |
+
allow-wildcard-with-all=no
|
510 |
+
|
511 |
+
# Analyse import fallback blocks. This can be used to support both Python 2 and
|
512 |
+
# 3 compatible code, which means that the block might have code that exists
|
513 |
+
# only in one or another interpreter, leading to false positives when analysed.
|
514 |
+
analyse-fallback-blocks=no
|
515 |
+
|
516 |
+
# Deprecated modules which should not be used, separated by a comma.
|
517 |
+
deprecated-modules=optparse,tkinter.tix
|
518 |
+
|
519 |
+
# Create a graph of external dependencies in the given file (report RP0402 must
|
520 |
+
# not be disabled).
|
521 |
+
ext-import-graph=
|
522 |
+
|
523 |
+
# Create a graph of all (i.e. internal and external) dependencies in the
|
524 |
+
# given file (report RP0402 must not be disabled).
|
525 |
+
import-graph=
|
526 |
+
|
527 |
+
# Create a graph of internal dependencies in the given file (report RP0402 must
|
528 |
+
# not be disabled).
|
529 |
+
int-import-graph=
|
530 |
+
|
531 |
+
# Force import order to recognize a module as part of the standard
|
532 |
+
# compatibility libraries.
|
533 |
+
known-standard-library=
|
534 |
+
|
535 |
+
# Force import order to recognize a module as part of a third party library.
|
536 |
+
known-third-party=enchant
|
537 |
+
|
538 |
+
|
539 |
+
[CLASSES]
|
540 |
+
|
541 |
+
# List of method names used to declare (i.e. assign) instance attributes.
|
542 |
+
defining-attr-methods=__init__,
|
543 |
+
__new__,
|
544 |
+
setUp
|
545 |
+
|
546 |
+
# List of member names, which should be excluded from the protected access
|
547 |
+
# warning.
|
548 |
+
exclude-protected=_asdict,
|
549 |
+
_fields,
|
550 |
+
_replace,
|
551 |
+
_source,
|
552 |
+
_make
|
553 |
+
|
554 |
+
# List of valid names for the first argument in a class method.
|
555 |
+
valid-classmethod-first-arg=cls
|
556 |
+
|
557 |
+
# List of valid names for the first argument in a metaclass class method.
|
558 |
+
valid-metaclass-classmethod-first-arg=cls
|
559 |
+
|
560 |
+
|
561 |
+
[DESIGN]
|
562 |
+
|
563 |
+
# Maximum number of arguments for function / method.
|
564 |
+
max-args=5
|
565 |
+
|
566 |
+
# Maximum number of attributes for a class (see R0902).
|
567 |
+
max-attributes=7
|
568 |
+
|
569 |
+
# Maximum number of boolean expressions in an if statement.
|
570 |
+
max-bool-expr=5
|
571 |
+
|
572 |
+
# Maximum number of branches for function / method body.
|
573 |
+
max-branches=12
|
574 |
+
|
575 |
+
# Maximum number of locals for function / method body.
|
576 |
+
max-locals=15
|
577 |
+
|
578 |
+
# Maximum number of parents for a class (see R0901).
|
579 |
+
max-parents=15
|
580 |
+
|
581 |
+
# Maximum number of public methods for a class (see R0904).
|
582 |
+
max-public-methods=20
|
583 |
+
|
584 |
+
# Maximum number of return / yield for function / method body.
|
585 |
+
max-returns=6
|
586 |
+
|
587 |
+
# Maximum number of statements in function / method body.
|
588 |
+
max-statements=50
|
589 |
+
|
590 |
+
# Minimum number of public methods for a class (see R0903).
|
591 |
+
min-public-methods=2
|
592 |
+
|
593 |
+
|
594 |
+
[EXCEPTIONS]
|
595 |
+
|
596 |
+
# Exceptions that will emit a warning when being caught. Defaults to
|
597 |
+
# "BaseException, Exception".
|
598 |
+
overgeneral-exceptions=BaseException,
|
599 |
+
Exception
|
.readthedocs.yml
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# .readthedocs.yml
|
2 |
+
# Read the Docs configuration file
|
3 |
+
# See https://docs.readthedocs.io/en/stable/config-file/v2.html for details
|
4 |
+
|
5 |
+
# Required
|
6 |
+
version: 2
|
7 |
+
|
8 |
+
# Set the version of Python and other tools you might need
|
9 |
+
build:
|
10 |
+
os: ubuntu-22.04
|
11 |
+
tools:
|
12 |
+
python: "3.11"
|
13 |
+
|
14 |
+
# Optionally set the version of Python and requirements required to build your docs
|
15 |
+
python:
|
16 |
+
install:
|
17 |
+
- requirements: docs/requirements.txt
|
18 |
+
- requirements: requirements.txt
|
19 |
+
|
20 |
+
# Build documentation in the docs/ directory with Sphinx
|
21 |
+
sphinx:
|
22 |
+
builder: html
|
23 |
+
configuration: docs/source/conf.py
|
CITATION.cff
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
cff-version: 1.2.0
|
2 |
+
message: "If you want to cite 🐸💬, feel free to use this (but only if you loved it 😊)"
|
3 |
+
title: "Coqui TTS"
|
4 |
+
abstract: "A deep learning toolkit for Text-to-Speech, battle-tested in research and production"
|
5 |
+
date-released: 2021-01-01
|
6 |
+
authors:
|
7 |
+
- family-names: "Eren"
|
8 |
+
given-names: "Gölge"
|
9 |
+
- name: "The Coqui TTS Team"
|
10 |
+
version: 1.4
|
11 |
+
doi: 10.5281/zenodo.6334862
|
12 |
+
license: "MPL-2.0"
|
13 |
+
url: "https://www.coqui.ai"
|
14 |
+
repository-code: "https://github.com/coqui-ai/TTS"
|
15 |
+
keywords:
|
16 |
+
- machine learning
|
17 |
+
- deep learning
|
18 |
+
- artificial intelligence
|
19 |
+
- text to speech
|
20 |
+
- TTS
|
CODE_OF_CONDUCT.md
ADDED
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
# Contributor Covenant Code of Conduct
|
3 |
+
|
4 |
+
## Our Pledge
|
5 |
+
|
6 |
+
We as members, contributors, and leaders pledge to make participation in our
|
7 |
+
community a harassment-free experience for everyone, regardless of age, body
|
8 |
+
size, visible or invisible disability, ethnicity, sex characteristics, gender
|
9 |
+
identity and expression, level of experience, education, socio-economic status,
|
10 |
+
nationality, personal appearance, race, caste, color, religion, or sexual identity
|
11 |
+
and orientation.
|
12 |
+
|
13 |
+
We pledge to act and interact in ways that contribute to an open, welcoming,
|
14 |
+
diverse, inclusive, and healthy community.
|
15 |
+
|
16 |
+
## Our Standards
|
17 |
+
|
18 |
+
Examples of behavior that contributes to a positive environment for our
|
19 |
+
community include:
|
20 |
+
|
21 |
+
* Demonstrating empathy and kindness toward other people
|
22 |
+
* Being respectful of differing opinions, viewpoints, and experiences
|
23 |
+
* Giving and gracefully accepting constructive feedback
|
24 |
+
* Accepting responsibility and apologizing to those affected by our mistakes,
|
25 |
+
and learning from the experience
|
26 |
+
* Focusing on what is best not just for us as individuals, but for the
|
27 |
+
overall community
|
28 |
+
|
29 |
+
Examples of unacceptable behavior include:
|
30 |
+
|
31 |
+
* The use of sexualized language or imagery, and sexual attention or
|
32 |
+
advances of any kind
|
33 |
+
* Trolling, insulting or derogatory comments, and personal or political attacks
|
34 |
+
* Public or private harassment
|
35 |
+
* Publishing others' private information, such as a physical or email
|
36 |
+
address, without their explicit permission
|
37 |
+
* Other conduct which could reasonably be considered inappropriate in a
|
38 |
+
professional setting
|
39 |
+
|
40 |
+
## Enforcement Responsibilities
|
41 |
+
|
42 |
+
Community leaders are responsible for clarifying and enforcing our standards of
|
43 |
+
acceptable behavior and will take appropriate and fair corrective action in
|
44 |
+
response to any behavior that they deem inappropriate, threatening, offensive,
|
45 |
+
or harmful.
|
46 |
+
|
47 |
+
Community leaders have the right and responsibility to remove, edit, or reject
|
48 |
+
comments, commits, code, wiki edits, issues, and other contributions that are
|
49 |
+
not aligned to this Code of Conduct, and will communicate reasons for moderation
|
50 |
+
decisions when appropriate.
|
51 |
+
|
52 |
+
## Scope
|
53 |
+
|
54 |
+
This Code of Conduct applies within all community spaces, and also applies when
|
55 |
+
an individual is officially representing the community in public spaces.
|
56 |
+
Examples of representing our community include using an official e-mail address,
|
57 |
+
posting via an official social media account, or acting as an appointed
|
58 |
+
representative at an online or offline event.
|
59 |
+
|
60 |
+
## Enforcement
|
61 |
+
|
62 |
+
Instances of abusive, harassing, or otherwise unacceptable behavior may be
|
63 |
+
reported to the community leaders responsible for enforcement at
|
64 |
+
coc-report@coqui.ai.
|
65 |
+
All complaints will be reviewed and investigated promptly and fairly.
|
66 |
+
|
67 |
+
All community leaders are obligated to respect the privacy and security of the
|
68 |
+
reporter of any incident.
|
69 |
+
|
70 |
+
## Enforcement Guidelines
|
71 |
+
|
72 |
+
Community leaders will follow these Community Impact Guidelines in determining
|
73 |
+
the consequences for any action they deem in violation of this Code of Conduct:
|
74 |
+
|
75 |
+
### 1. Correction
|
76 |
+
|
77 |
+
**Community Impact**: Use of inappropriate language or other behavior deemed
|
78 |
+
unprofessional or unwelcome in the community.
|
79 |
+
|
80 |
+
**Consequence**: A private, written warning from community leaders, providing
|
81 |
+
clarity around the nature of the violation and an explanation of why the
|
82 |
+
behavior was inappropriate. A public apology may be requested.
|
83 |
+
|
84 |
+
### 2. Warning
|
85 |
+
|
86 |
+
**Community Impact**: A violation through a single incident or series
|
87 |
+
of actions.
|
88 |
+
|
89 |
+
**Consequence**: A warning with consequences for continued behavior. No
|
90 |
+
interaction with the people involved, including unsolicited interaction with
|
91 |
+
those enforcing the Code of Conduct, for a specified period of time. This
|
92 |
+
includes avoiding interactions in community spaces as well as external channels
|
93 |
+
like social media. Violating these terms may lead to a temporary or
|
94 |
+
permanent ban.
|
95 |
+
|
96 |
+
### 3. Temporary Ban
|
97 |
+
|
98 |
+
**Community Impact**: A serious violation of community standards, including
|
99 |
+
sustained inappropriate behavior.
|
100 |
+
|
101 |
+
**Consequence**: A temporary ban from any sort of interaction or public
|
102 |
+
communication with the community for a specified period of time. No public or
|
103 |
+
private interaction with the people involved, including unsolicited interaction
|
104 |
+
with those enforcing the Code of Conduct, is allowed during this period.
|
105 |
+
Violating these terms may lead to a permanent ban.
|
106 |
+
|
107 |
+
### 4. Permanent Ban
|
108 |
+
|
109 |
+
**Community Impact**: Demonstrating a pattern of violation of community
|
110 |
+
standards, including sustained inappropriate behavior, harassment of an
|
111 |
+
individual, or aggression toward or disparagement of classes of individuals.
|
112 |
+
|
113 |
+
**Consequence**: A permanent ban from any sort of public interaction within
|
114 |
+
the community.
|
115 |
+
|
116 |
+
## Attribution
|
117 |
+
|
118 |
+
This Code of Conduct is adapted from the [Contributor Covenant][homepage],
|
119 |
+
version 2.0, available at
|
120 |
+
[https://www.contributor-covenant.org/version/2/0/code_of_conduct.html][v2.0].
|
121 |
+
|
122 |
+
Community Impact Guidelines were inspired by
|
123 |
+
[Mozilla's code of conduct enforcement ladder][Mozilla CoC].
|
124 |
+
|
125 |
+
For answers to common questions about this code of conduct, see the FAQ at
|
126 |
+
[https://www.contributor-covenant.org/faq][FAQ]. Translations are available
|
127 |
+
at [https://www.contributor-covenant.org/translations][translations].
|
128 |
+
|
129 |
+
[homepage]: https://www.contributor-covenant.org
|
130 |
+
[v2.0]: https://www.contributor-covenant.org/version/2/0/code_of_conduct.html
|
131 |
+
[Mozilla CoC]: https://github.com/mozilla/diversity
|
132 |
+
[FAQ]: https://www.contributor-covenant.org/faq
|
133 |
+
[translations]: https://www.contributor-covenant.org/translations
|
CODE_OWNERS.rst
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
TTS code owners / governance system
|
2 |
+
==========================================
|
3 |
+
|
4 |
+
TTS is run under a governance system inspired by (and partially copied from) the `Mozilla module ownership system <https://www.mozilla.org/about/governance/policies/module-ownership/>`_. The project is roughly divided into modules, and each module has its owners, who are responsible for reviewing pull requests and deciding on technical direction for their modules. Module ownership authority is given to people who have worked extensively on areas of the project.
|
5 |
+
|
6 |
+
Module owners also have the authority of naming other module owners or appointing module peers, which are people with authority to review pull requests in that module. They can also sub-divide their module into sub-modules with their owners.
|
7 |
+
|
8 |
+
Module owners are not tyrants. They are chartered to make decisions with input from the community and in the best interest of the community. Module owners are not required to make code changes or additions solely because the community wants them to do so. (Like anyone else, the module owners may write code because they want to, because their employers want them to, because the community wants them to, or for some other reason.) Module owners do need to pay attention to patches submitted to that module. However, “pay attention” does not mean agreeing to every patch. Some patches may not make sense for the TTS project; some may be poorly implemented. Module owners have the authority to decline a patch; this is a necessary part of the role. We ask the module owners to describe in the relevant issue their reasons for wanting changes to a patch, for declining it altogether, or for postponing review for some period. We don’t ask or expect them to rewrite patches to make them acceptable. Similarly, module owners may need to delay review of a promising patch due to an upcoming deadline. For example, a patch may be of interest, but not for the next milestone. In such a case it may make sense for the module owner to postpone review of a patch until after matters needed for a milestone have been finalized. Again, we expect this to be described in the relevant issue. And of course, it shouldn’t go on very often or for very long or escalation and review is likely.
|
9 |
+
|
10 |
+
The work of the various module owners and peers is overseen by the global owners, who are responsible for making final decisions in case of conflict between owners, as well as for setting the direction of the project as a whole.
|
11 |
+
|
12 |
+
This file describes module owners who are active on the project and which parts of the code they have expertise on (and interest in). If you're making changes to the code and are wondering who's an appropriate person to talk to, this list will tell you who to ping.
|
13 |
+
|
14 |
+
There's overlap in the areas of expertise of each owner, and in particular when looking at which files are covered by each area, there is a lot of overlap. Don't worry about getting it exactly right when requesting review, any code owner will be happy to redirect the request to a more appropriate person.
|
15 |
+
|
16 |
+
Global owners
|
17 |
+
----------------
|
18 |
+
|
19 |
+
These are people who have worked on the project extensively and are familiar with all or most parts of it. Their expertise and review guidance is trusted by other code owners to cover their own areas of expertise. In case of conflicting opinions from other owners, global owners will make a final decision.
|
20 |
+
|
21 |
+
- Eren Gölge (@erogol)
|
22 |
+
- Reuben Morais (@reuben)
|
23 |
+
|
24 |
+
Training, feeding
|
25 |
+
-----------------
|
26 |
+
|
27 |
+
- Eren Gölge (@erogol)
|
28 |
+
|
29 |
+
Model exporting
|
30 |
+
---------------
|
31 |
+
|
32 |
+
- Eren Gölge (@erogol)
|
33 |
+
|
34 |
+
Multi-Speaker TTS
|
35 |
+
-----------------
|
36 |
+
|
37 |
+
- Eren Gölge (@erogol)
|
38 |
+
- Edresson Casanova (@edresson)
|
39 |
+
|
40 |
+
TTS
|
41 |
+
---
|
42 |
+
|
43 |
+
- Eren Gölge (@erogol)
|
44 |
+
|
45 |
+
Vocoders
|
46 |
+
--------
|
47 |
+
|
48 |
+
- Eren Gölge (@erogol)
|
49 |
+
|
50 |
+
Speaker Encoder
|
51 |
+
---------------
|
52 |
+
|
53 |
+
- Eren Gölge (@erogol)
|
54 |
+
|
55 |
+
Testing & CI
|
56 |
+
------------
|
57 |
+
|
58 |
+
- Eren Gölge (@erogol)
|
59 |
+
- Reuben Morais (@reuben)
|
60 |
+
|
61 |
+
Python bindings
|
62 |
+
---------------
|
63 |
+
|
64 |
+
- Eren Gölge (@erogol)
|
65 |
+
- Reuben Morais (@reuben)
|
66 |
+
|
67 |
+
Documentation
|
68 |
+
-------------
|
69 |
+
|
70 |
+
- Eren Gölge (@erogol)
|
71 |
+
|
72 |
+
Third party bindings
|
73 |
+
--------------------
|
74 |
+
|
75 |
+
Owned by the author.
|
CONTRIBUTING.md
ADDED
@@ -0,0 +1,136 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Contribution guidelines
|
2 |
+
|
3 |
+
Welcome to 🐸TTS!
|
4 |
+
|
5 |
+
This repository is governed by [the Contributor Covenant Code of Conduct](https://github.com/coqui-ai/TTS/blob/main/CODE_OF_CONDUCT.md).
|
6 |
+
|
7 |
+
## Where to start.
|
8 |
+
We welcome everyone who likes to contribute to 🐸TTS.
|
9 |
+
|
10 |
+
You can contribute not only with code but with bug reports, comments, questions, answers, or just a simple tweet to spread the word.
|
11 |
+
|
12 |
+
If you would like to contribute code or squash a bug but don't know where to start, here are some pointers.
|
13 |
+
|
14 |
+
- [Development Road Map](https://github.com/coqui-ai/TTS/issues/378)
|
15 |
+
|
16 |
+
You can pick something out of our road map. We keep the progress of the project in this simple issue thread. It has new model proposals, developmental updates, etc.
|
17 |
+
|
18 |
+
- [Github Issues Tracker](https://github.com/coqui-ai/TTS/issues)
|
19 |
+
|
20 |
+
This is the place to find feature requests and bug reports.
|
21 |
+
|
22 |
+
Issues with the ```good first issue``` tag are a good place for beginners to start.
|
23 |
+
|
24 |
+
- ✨**PR**✨ [pages](https://github.com/coqui-ai/TTS/pulls) with the ```🚀new version``` tag.
|
25 |
+
|
26 |
+
We list all the target improvements for the next version. You can pick one of them and start contributing.
|
27 |
+
|
28 |
+
- Also feel free to suggest new features, ideas and models. We're always open for new things.
|
29 |
+
|
30 |
+
## Call for sharing language models
|
31 |
+
If possible, please consider sharing your pre-trained models in any language (if the licences allow for you to do so). We will include them in our model catalogue for public use and give the proper attribution, whether it be your name, company, website or any other source specified.
|
32 |
+
|
33 |
+
Models can be shared in two ways:
|
34 |
+
1. Share the model files with us and we serve them with the next 🐸 TTS release.
|
35 |
+
2. Upload your models on GDrive and share the link.
|
36 |
+
|
37 |
+
Models are listed in the `.models.json` file, and every listed model is available through the TTS CLI and the server endpoints.
|
38 |
+
|
39 |
+
Either way you choose, please make sure you send the models [here](https://github.com/coqui-ai/TTS/issues/380).
|
40 |
+
|
41 |
+
## Sending a ✨**PR**✨
|
42 |
+
|
43 |
+
If you have a new feature, a model to implement, or a bug to squash, go ahead and send a ✨**PR**✨.
|
44 |
+
Please use the following steps to send a ✨**PR**✨.
|
45 |
+
Let us know if you encounter a problem along the way.
|
46 |
+
|
47 |
+
The following steps are tested on an Ubuntu system.
|
48 |
+
|
49 |
+
1. Fork [🐸TTS](https://github.com/coqui-ai/TTS) by clicking the fork button at the top right corner of the project page.
|
50 |
+
|
51 |
+
2. Clone 🐸TTS and add the main repo as a new remote named ```upstream```.
|
52 |
+
|
53 |
+
```bash
|
54 |
+
$ git clone git@github.com:<your Github name>/TTS.git
|
55 |
+
$ cd TTS
|
56 |
+
$ git remote add upstream https://github.com/coqui-ai/TTS.git
|
57 |
+
```
|
58 |
+
|
59 |
+
3. Install 🐸TTS for development.
|
60 |
+
|
61 |
+
```bash
|
62 |
+
$ make system-deps # intended to be used on Ubuntu (Debian). Let us know if you have a different OS.
|
63 |
+
$ make install
|
64 |
+
```
|
65 |
+
|
66 |
+
4. Create a new branch with an informative name for your goal.
|
67 |
+
|
68 |
+
```bash
|
69 |
+
$ git checkout -b an_informative_name_for_my_branch
|
70 |
+
```
|
71 |
+
|
72 |
+
5. Implement your changes on your new branch.
|
73 |
+
|
74 |
+
6. Explain your code using [Google Style](https://google.github.io/styleguide/pyguide.html#381-docstrings) docstrings.
|
75 |
+
|
76 |
+
7. Add your tests to our test suite under ```tests``` folder. It is important to show that your code works, edge cases are considered, and inform others about the intended use.
|
77 |
+
|
78 |
+
8. Run the tests to see how your updates work with the rest of the project. You can repeat this step multiple times as you implement your changes to make sure you are on the right track.
|
79 |
+
|
80 |
+
```bash
|
81 |
+
$ make test # stop at the first error
|
82 |
+
$ make test_all # run all the tests, report all the errors
|
83 |
+
```
|
84 |
+
|
85 |
+
9. Format your code. We use ```black``` for code and ```isort``` for ```import``` formatting.
|
86 |
+
|
87 |
+
```bash
|
88 |
+
$ make style
|
89 |
+
```
|
90 |
+
|
91 |
+
10. Run the linter and correct the issues raised. We use ```pylint``` for linting. It helps to enforce a coding standard and offers simple refactoring suggestions.
|
92 |
+
|
93 |
+
```bash
|
94 |
+
$ make lint
|
95 |
+
```
|
96 |
+
|
97 |
+
11. When things are good, add new files and commit your changes.
|
98 |
+
|
99 |
+
```bash
|
100 |
+
$ git add my_file1.py my_file2.py ...
|
101 |
+
$ git commit
|
102 |
+
```
|
103 |
+
|
104 |
+
It's a good practice to regularly sync your local copy of the project with the upstream code to keep up with the recent updates.
|
105 |
+
|
106 |
+
```bash
|
107 |
+
$ git fetch upstream
|
108 |
+
$ git rebase upstream/master
|
109 |
+
# or for the development version
|
110 |
+
$ git rebase upstream/dev
|
111 |
+
```
|
112 |
+
|
113 |
+
12. Send a PR to ```dev``` branch.
|
114 |
+
|
115 |
+
Push your branch to your fork.
|
116 |
+
|
117 |
+
```bash
|
118 |
+
$ git push -u origin an_informative_name_for_my_branch
|
119 |
+
```
|
120 |
+
|
121 |
+
Then go to your fork's Github page and click on 'Pull request' to send your ✨**PR**✨.
|
122 |
+
|
123 |
+
Please set ✨**PR**✨'s target branch to ```dev``` as we use ```dev``` to work on the next version.
|
124 |
+
|
125 |
+
13. Let's discuss until it is perfect. 💪
|
126 |
+
|
127 |
+
We might ask you for certain changes that would appear in the ✨**PR**✨'s page under [🐸TTS](https://github.com/coqui-ai/TTS/pulls).
|
128 |
+
|
129 |
+
14. Once things look perfect, we merge it to the ```dev``` branch and make it ready for the next version.
|
130 |
+
|
131 |
+
Feel free to ping us at any step you need help using our communication channels.
|
132 |
+
|
133 |
+
If you are new to Github or open-source contribution, these are good resources.
|
134 |
+
|
135 |
+
- [Github Docs](https://docs.github.com/en/github/collaborating-with-issues-and-pull-requests/proposing-changes-to-your-work-with-pull-requests)
|
136 |
+
- [First-Contribution](https://github.com/firstcontributions/first-contributions)
|
Dockerfile
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
ARG BASE=nvidia/cuda:11.8.0-base-ubuntu22.04
|
2 |
+
FROM ${BASE}
|
3 |
+
RUN apt-get update && apt-get upgrade -y
|
4 |
+
RUN apt-get install -y --no-install-recommends gcc g++ make python3 python3-dev python3-pip python3-venv python3-wheel espeak-ng libsndfile1-dev && rm -rf /var/lib/apt/lists/*
|
5 |
+
RUN pip3 install llvmlite --ignore-installed
|
6 |
+
|
7 |
+
WORKDIR /root
|
8 |
+
COPY . /root
|
9 |
+
RUN pip3 install torch torchaudio --extra-index-url https://download.pytorch.org/whl/cu118
|
10 |
+
RUN rm -rf /root/.cache/pip
|
11 |
+
RUN make install
|
12 |
+
ENTRYPOINT ["tts"]
|
13 |
+
CMD ["--help"]
|
LICENSE.txt
ADDED
@@ -0,0 +1,373 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Mozilla Public License Version 2.0
|
2 |
+
==================================
|
3 |
+
|
4 |
+
1. Definitions
|
5 |
+
--------------
|
6 |
+
|
7 |
+
1.1. "Contributor"
|
8 |
+
means each individual or legal entity that creates, contributes to
|
9 |
+
the creation of, or owns Covered Software.
|
10 |
+
|
11 |
+
1.2. "Contributor Version"
|
12 |
+
means the combination of the Contributions of others (if any) used
|
13 |
+
by a Contributor and that particular Contributor's Contribution.
|
14 |
+
|
15 |
+
1.3. "Contribution"
|
16 |
+
means Covered Software of a particular Contributor.
|
17 |
+
|
18 |
+
1.4. "Covered Software"
|
19 |
+
means Source Code Form to which the initial Contributor has attached
|
20 |
+
the notice in Exhibit A, the Executable Form of such Source Code
|
21 |
+
Form, and Modifications of such Source Code Form, in each case
|
22 |
+
including portions thereof.
|
23 |
+
|
24 |
+
1.5. "Incompatible With Secondary Licenses"
|
25 |
+
means
|
26 |
+
|
27 |
+
(a) that the initial Contributor has attached the notice described
|
28 |
+
in Exhibit B to the Covered Software; or
|
29 |
+
|
30 |
+
(b) that the Covered Software was made available under the terms of
|
31 |
+
version 1.1 or earlier of the License, but not also under the
|
32 |
+
terms of a Secondary License.
|
33 |
+
|
34 |
+
1.6. "Executable Form"
|
35 |
+
means any form of the work other than Source Code Form.
|
36 |
+
|
37 |
+
1.7. "Larger Work"
|
38 |
+
means a work that combines Covered Software with other material, in
|
39 |
+
a separate file or files, that is not Covered Software.
|
40 |
+
|
41 |
+
1.8. "License"
|
42 |
+
means this document.
|
43 |
+
|
44 |
+
1.9. "Licensable"
|
45 |
+
means having the right to grant, to the maximum extent possible,
|
46 |
+
whether at the time of the initial grant or subsequently, any and
|
47 |
+
all of the rights conveyed by this License.
|
48 |
+
|
49 |
+
1.10. "Modifications"
|
50 |
+
means any of the following:
|
51 |
+
|
52 |
+
(a) any file in Source Code Form that results from an addition to,
|
53 |
+
deletion from, or modification of the contents of Covered
|
54 |
+
Software; or
|
55 |
+
|
56 |
+
(b) any new file in Source Code Form that contains any Covered
|
57 |
+
Software.
|
58 |
+
|
59 |
+
1.11. "Patent Claims" of a Contributor
|
60 |
+
means any patent claim(s), including without limitation, method,
|
61 |
+
process, and apparatus claims, in any patent Licensable by such
|
62 |
+
Contributor that would be infringed, but for the grant of the
|
63 |
+
License, by the making, using, selling, offering for sale, having
|
64 |
+
made, import, or transfer of either its Contributions or its
|
65 |
+
Contributor Version.
|
66 |
+
|
67 |
+
1.12. "Secondary License"
|
68 |
+
means either the GNU General Public License, Version 2.0, the GNU
|
69 |
+
Lesser General Public License, Version 2.1, the GNU Affero General
|
70 |
+
Public License, Version 3.0, or any later versions of those
|
71 |
+
licenses.
|
72 |
+
|
73 |
+
1.13. "Source Code Form"
|
74 |
+
means the form of the work preferred for making modifications.
|
75 |
+
|
76 |
+
1.14. "You" (or "Your")
|
77 |
+
means an individual or a legal entity exercising rights under this
|
78 |
+
License. For legal entities, "You" includes any entity that
|
79 |
+
controls, is controlled by, or is under common control with You. For
|
80 |
+
purposes of this definition, "control" means (a) the power, direct
|
81 |
+
or indirect, to cause the direction or management of such entity,
|
82 |
+
whether by contract or otherwise, or (b) ownership of more than
|
83 |
+
fifty percent (50%) of the outstanding shares or beneficial
|
84 |
+
ownership of such entity.
|
85 |
+
|
86 |
+
2. License Grants and Conditions
|
87 |
+
--------------------------------
|
88 |
+
|
89 |
+
2.1. Grants
|
90 |
+
|
91 |
+
Each Contributor hereby grants You a world-wide, royalty-free,
|
92 |
+
non-exclusive license:
|
93 |
+
|
94 |
+
(a) under intellectual property rights (other than patent or trademark)
|
95 |
+
Licensable by such Contributor to use, reproduce, make available,
|
96 |
+
modify, display, perform, distribute, and otherwise exploit its
|
97 |
+
Contributions, either on an unmodified basis, with Modifications, or
|
98 |
+
as part of a Larger Work; and
|
99 |
+
|
100 |
+
(b) under Patent Claims of such Contributor to make, use, sell, offer
|
101 |
+
for sale, have made, import, and otherwise transfer either its
|
102 |
+
Contributions or its Contributor Version.
|
103 |
+
|
104 |
+
2.2. Effective Date
|
105 |
+
|
106 |
+
The licenses granted in Section 2.1 with respect to any Contribution
|
107 |
+
become effective for each Contribution on the date the Contributor first
|
108 |
+
distributes such Contribution.
|
109 |
+
|
110 |
+
2.3. Limitations on Grant Scope
|
111 |
+
|
112 |
+
The licenses granted in this Section 2 are the only rights granted under
|
113 |
+
this License. No additional rights or licenses will be implied from the
|
114 |
+
distribution or licensing of Covered Software under this License.
|
115 |
+
Notwithstanding Section 2.1(b) above, no patent license is granted by a
|
116 |
+
Contributor:
|
117 |
+
|
118 |
+
(a) for any code that a Contributor has removed from Covered Software;
|
119 |
+
or
|
120 |
+
|
121 |
+
(b) for infringements caused by: (i) Your and any other third party's
|
122 |
+
modifications of Covered Software, or (ii) the combination of its
|
123 |
+
Contributions with other software (except as part of its Contributor
|
124 |
+
Version); or
|
125 |
+
|
126 |
+
(c) under Patent Claims infringed by Covered Software in the absence of
|
127 |
+
its Contributions.
|
128 |
+
|
129 |
+
This License does not grant any rights in the trademarks, service marks,
|
130 |
+
or logos of any Contributor (except as may be necessary to comply with
|
131 |
+
the notice requirements in Section 3.4).
|
132 |
+
|
133 |
+
2.4. Subsequent Licenses
|
134 |
+
|
135 |
+
No Contributor makes additional grants as a result of Your choice to
|
136 |
+
distribute the Covered Software under a subsequent version of this
|
137 |
+
License (see Section 10.2) or under the terms of a Secondary License (if
|
138 |
+
permitted under the terms of Section 3.3).
|
139 |
+
|
140 |
+
2.5. Representation
|
141 |
+
|
142 |
+
Each Contributor represents that the Contributor believes its
|
143 |
+
Contributions are its original creation(s) or it has sufficient rights
|
144 |
+
to grant the rights to its Contributions conveyed by this License.
|
145 |
+
|
146 |
+
2.6. Fair Use
|
147 |
+
|
148 |
+
This License is not intended to limit any rights You have under
|
149 |
+
applicable copyright doctrines of fair use, fair dealing, or other
|
150 |
+
equivalents.
|
151 |
+
|
152 |
+
2.7. Conditions
|
153 |
+
|
154 |
+
Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted
|
155 |
+
in Section 2.1.
|
156 |
+
|
157 |
+
3. Responsibilities
|
158 |
+
-------------------
|
159 |
+
|
160 |
+
3.1. Distribution of Source Form
|
161 |
+
|
162 |
+
All distribution of Covered Software in Source Code Form, including any
|
163 |
+
Modifications that You create or to which You contribute, must be under
|
164 |
+
the terms of this License. You must inform recipients that the Source
|
165 |
+
Code Form of the Covered Software is governed by the terms of this
|
166 |
+
License, and how they can obtain a copy of this License. You may not
|
167 |
+
attempt to alter or restrict the recipients' rights in the Source Code
|
168 |
+
Form.
|
169 |
+
|
170 |
+
3.2. Distribution of Executable Form
|
171 |
+
|
172 |
+
If You distribute Covered Software in Executable Form then:
|
173 |
+
|
174 |
+
(a) such Covered Software must also be made available in Source Code
|
175 |
+
Form, as described in Section 3.1, and You must inform recipients of
|
176 |
+
the Executable Form how they can obtain a copy of such Source Code
|
177 |
+
Form by reasonable means in a timely manner, at a charge no more
|
178 |
+
than the cost of distribution to the recipient; and
|
179 |
+
|
180 |
+
(b) You may distribute such Executable Form under the terms of this
|
181 |
+
License, or sublicense it under different terms, provided that the
|
182 |
+
license for the Executable Form does not attempt to limit or alter
|
183 |
+
the recipients' rights in the Source Code Form under this License.
|
184 |
+
|
185 |
+
3.3. Distribution of a Larger Work
|
186 |
+
|
187 |
+
You may create and distribute a Larger Work under terms of Your choice,
|
188 |
+
provided that You also comply with the requirements of this License for
|
189 |
+
the Covered Software. If the Larger Work is a combination of Covered
|
190 |
+
Software with a work governed by one or more Secondary Licenses, and the
|
191 |
+
Covered Software is not Incompatible With Secondary Licenses, this
|
192 |
+
License permits You to additionally distribute such Covered Software
|
193 |
+
under the terms of such Secondary License(s), so that the recipient of
|
194 |
+
the Larger Work may, at their option, further distribute the Covered
|
195 |
+
Software under the terms of either this License or such Secondary
|
196 |
+
License(s).
|
197 |
+
|
198 |
+
3.4. Notices
|
199 |
+
|
200 |
+
You may not remove or alter the substance of any license notices
|
201 |
+
(including copyright notices, patent notices, disclaimers of warranty,
|
202 |
+
or limitations of liability) contained within the Source Code Form of
|
203 |
+
the Covered Software, except that You may alter any license notices to
|
204 |
+
the extent required to remedy known factual inaccuracies.
|
205 |
+
|
206 |
+
3.5. Application of Additional Terms
|
207 |
+
|
208 |
+
You may choose to offer, and to charge a fee for, warranty, support,
|
209 |
+
indemnity or liability obligations to one or more recipients of Covered
|
210 |
+
Software. However, You may do so only on Your own behalf, and not on
|
211 |
+
behalf of any Contributor. You must make it absolutely clear that any
|
212 |
+
such warranty, support, indemnity, or liability obligation is offered by
|
213 |
+
You alone, and You hereby agree to indemnify every Contributor for any
|
214 |
+
liability incurred by such Contributor as a result of warranty, support,
|
215 |
+
indemnity or liability terms You offer. You may include additional
|
216 |
+
disclaimers of warranty and limitations of liability specific to any
|
217 |
+
jurisdiction.
|
218 |
+
|
219 |
+
4. Inability to Comply Due to Statute or Regulation
|
220 |
+
---------------------------------------------------
|
221 |
+
|
222 |
+
If it is impossible for You to comply with any of the terms of this
|
223 |
+
License with respect to some or all of the Covered Software due to
|
224 |
+
statute, judicial order, or regulation then You must: (a) comply with
|
225 |
+
the terms of this License to the maximum extent possible; and (b)
|
226 |
+
describe the limitations and the code they affect. Such description must
|
227 |
+
be placed in a text file included with all distributions of the Covered
|
228 |
+
Software under this License. Except to the extent prohibited by statute
|
229 |
+
or regulation, such description must be sufficiently detailed for a
|
230 |
+
recipient of ordinary skill to be able to understand it.
|
231 |
+
|
232 |
+
5. Termination
|
233 |
+
--------------
|
234 |
+
|
235 |
+
5.1. The rights granted under this License will terminate automatically
|
236 |
+
if You fail to comply with any of its terms. However, if You become
|
237 |
+
compliant, then the rights granted under this License from a particular
|
238 |
+
Contributor are reinstated (a) provisionally, unless and until such
|
239 |
+
Contributor explicitly and finally terminates Your grants, and (b) on an
|
240 |
+
ongoing basis, if such Contributor fails to notify You of the
|
241 |
+
non-compliance by some reasonable means prior to 60 days after You have
|
242 |
+
come back into compliance. Moreover, Your grants from a particular
|
243 |
+
Contributor are reinstated on an ongoing basis if such Contributor
|
244 |
+
notifies You of the non-compliance by some reasonable means, this is the
|
245 |
+
first time You have received notice of non-compliance with this License
|
246 |
+
from such Contributor, and You become compliant prior to 30 days after
|
247 |
+
Your receipt of the notice.
|
248 |
+
|
249 |
+
5.2. If You initiate litigation against any entity by asserting a patent
|
250 |
+
infringement claim (excluding declaratory judgment actions,
|
251 |
+
counter-claims, and cross-claims) alleging that a Contributor Version
|
252 |
+
directly or indirectly infringes any patent, then the rights granted to
|
253 |
+
You by any and all Contributors for the Covered Software under Section
|
254 |
+
2.1 of this License shall terminate.
|
255 |
+
|
256 |
+
5.3. In the event of termination under Sections 5.1 or 5.2 above, all
|
257 |
+
end user license agreements (excluding distributors and resellers) which
|
258 |
+
have been validly granted by You or Your distributors under this License
|
259 |
+
prior to termination shall survive termination.
|
260 |
+
|
261 |
+
************************************************************************
|
262 |
+
* *
|
263 |
+
* 6. Disclaimer of Warranty *
|
264 |
+
* ------------------------- *
|
265 |
+
* *
|
266 |
+
* Covered Software is provided under this License on an "as is" *
|
267 |
+
* basis, without warranty of any kind, either expressed, implied, or *
|
268 |
+
* statutory, including, without limitation, warranties that the *
|
269 |
+
* Covered Software is free of defects, merchantable, fit for a *
|
270 |
+
* particular purpose or non-infringing. The entire risk as to the *
|
271 |
+
* quality and performance of the Covered Software is with You. *
|
272 |
+
* Should any Covered Software prove defective in any respect, You *
|
273 |
+
* (not any Contributor) assume the cost of any necessary servicing, *
|
274 |
+
* repair, or correction. This disclaimer of warranty constitutes an *
|
275 |
+
* essential part of this License. No use of any Covered Software is *
|
276 |
+
* authorized under this License except under this disclaimer. *
|
277 |
+
* *
|
278 |
+
************************************************************************
|
279 |
+
|
280 |
+
************************************************************************
|
281 |
+
* *
|
282 |
+
* 7. Limitation of Liability *
|
283 |
+
* -------------------------- *
|
284 |
+
* *
|
285 |
+
* Under no circumstances and under no legal theory, whether tort *
|
286 |
+
* (including negligence), contract, or otherwise, shall any *
|
287 |
+
* Contributor, or anyone who distributes Covered Software as *
|
288 |
+
* permitted above, be liable to You for any direct, indirect, *
|
289 |
+
* special, incidental, or consequential damages of any character *
|
290 |
+
* including, without limitation, damages for lost profits, loss of *
|
291 |
+
* goodwill, work stoppage, computer failure or malfunction, or any *
|
292 |
+
* and all other commercial damages or losses, even if such party *
|
293 |
+
* shall have been informed of the possibility of such damages. This *
|
294 |
+
* limitation of liability shall not apply to liability for death or *
|
295 |
+
* personal injury resulting from such party's negligence to the *
|
296 |
+
* extent applicable law prohibits such limitation. Some *
|
297 |
+
* jurisdictions do not allow the exclusion or limitation of *
|
298 |
+
* incidental or consequential damages, so this exclusion and *
|
299 |
+
* limitation may not apply to You. *
|
300 |
+
* *
|
301 |
+
************************************************************************
|
302 |
+
|
303 |
+
8. Litigation
|
304 |
+
-------------
|
305 |
+
|
306 |
+
Any litigation relating to this License may be brought only in the
|
307 |
+
courts of a jurisdiction where the defendant maintains its principal
|
308 |
+
place of business and such litigation shall be governed by laws of that
|
309 |
+
jurisdiction, without reference to its conflict-of-law provisions.
|
310 |
+
Nothing in this Section shall prevent a party's ability to bring
|
311 |
+
cross-claims or counter-claims.
|
312 |
+
|
313 |
+
9. Miscellaneous
|
314 |
+
----------------
|
315 |
+
|
316 |
+
This License represents the complete agreement concerning the subject
|
317 |
+
matter hereof. If any provision of this License is held to be
|
318 |
+
unenforceable, such provision shall be reformed only to the extent
|
319 |
+
necessary to make it enforceable. Any law or regulation which provides
|
320 |
+
that the language of a contract shall be construed against the drafter
|
321 |
+
shall not be used to construe this License against a Contributor.
|
322 |
+
|
323 |
+
10. Versions of the License
|
324 |
+
---------------------------
|
325 |
+
|
326 |
+
10.1. New Versions
|
327 |
+
|
328 |
+
Mozilla Foundation is the license steward. Except as provided in Section
|
329 |
+
10.3, no one other than the license steward has the right to modify or
|
330 |
+
publish new versions of this License. Each version will be given a
|
331 |
+
distinguishing version number.
|
332 |
+
|
333 |
+
10.2. Effect of New Versions
|
334 |
+
|
335 |
+
You may distribute the Covered Software under the terms of the version
|
336 |
+
of the License under which You originally received the Covered Software,
|
337 |
+
or under the terms of any subsequent version published by the license
|
338 |
+
steward.
|
339 |
+
|
340 |
+
10.3. Modified Versions
|
341 |
+
|
342 |
+
If you create software not governed by this License, and you want to
|
343 |
+
create a new license for such software, you may create and use a
|
344 |
+
modified version of this License if you rename the license and remove
|
345 |
+
any references to the name of the license steward (except to note that
|
346 |
+
such modified license differs from this License).
|
347 |
+
|
348 |
+
10.4. Distributing Source Code Form that is Incompatible With Secondary
|
349 |
+
Licenses
|
350 |
+
|
351 |
+
If You choose to distribute Source Code Form that is Incompatible With
|
352 |
+
Secondary Licenses under the terms of this version of the License, the
|
353 |
+
notice described in Exhibit B of this License must be attached.
|
354 |
+
|
355 |
+
Exhibit A - Source Code Form License Notice
|
356 |
+
-------------------------------------------
|
357 |
+
|
358 |
+
This Source Code Form is subject to the terms of the Mozilla Public
|
359 |
+
License, v. 2.0. If a copy of the MPL was not distributed with this
|
360 |
+
file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
361 |
+
|
362 |
+
If it is not possible or desirable to put the notice in a particular
|
363 |
+
file, then You may include the notice in a location (such as a LICENSE
|
364 |
+
file in a relevant directory) where a recipient would be likely to look
|
365 |
+
for such a notice.
|
366 |
+
|
367 |
+
You may add additional accurate notices of copyright ownership.
|
368 |
+
|
369 |
+
Exhibit B - "Incompatible With Secondary Licenses" Notice
|
370 |
+
---------------------------------------------------------
|
371 |
+
|
372 |
+
This Source Code Form is "Incompatible With Secondary Licenses", as
|
373 |
+
defined by the Mozilla Public License, v. 2.0.
|
MANIFEST.in
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
include README.md
|
2 |
+
include LICENSE.txt
|
3 |
+
include requirements.*.txt
|
4 |
+
include *.cff
|
5 |
+
include requirements.txt
|
6 |
+
include TTS/VERSION
|
7 |
+
recursive-include TTS *.json
|
8 |
+
recursive-include TTS *.html
|
9 |
+
recursive-include TTS *.png
|
10 |
+
recursive-include TTS *.md
|
11 |
+
recursive-include TTS *.py
|
12 |
+
recursive-include TTS *.pyx
|
13 |
+
recursive-include images *.png
|
14 |
+
recursive-exclude tests *
|
15 |
+
prune tests*
|
Makefile
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
.DEFAULT_GOAL := help
|
2 |
+
.PHONY: test system-deps dev-deps deps style lint install help docs
|
3 |
+
|
4 |
+
help:
|
5 |
+
@grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | sort | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[36m%-30s\033[0m %s\n", $$1, $$2}'
|
6 |
+
|
7 |
+
target_dirs := tests TTS notebooks recipes
|
8 |
+
|
9 |
+
test_all: ## run tests and don't stop on an error.
|
10 |
+
nose2 --with-coverage --coverage TTS tests
|
11 |
+
./run_bash_tests.sh
|
12 |
+
|
13 |
+
test: ## run tests.
|
14 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests
|
15 |
+
|
16 |
+
test_vocoder: ## run vocoder tests.
|
17 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.vocoder_tests
|
18 |
+
|
19 |
+
test_tts: ## run tts tests.
|
20 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.tts_tests
|
21 |
+
|
22 |
+
test_aux: ## run aux tests.
|
23 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.aux_tests
|
24 |
+
./run_bash_tests.sh
|
25 |
+
|
26 |
+
test_zoo: ## run zoo tests.
|
27 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.zoo_tests
|
28 |
+
|
29 |
+
inference_tests: ## run inference tests.
|
30 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.inference_tests
|
31 |
+
|
32 |
+
data_tests: ## run data tests.
|
33 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.data_tests
|
34 |
+
|
35 |
+
test_text: ## run text tests.
|
36 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests.text_tests
|
37 |
+
|
38 |
+
test_failed: ## only run tests failed the last time.
|
39 |
+
nose2 -F -v -B --with-coverage --coverage TTS tests
|
40 |
+
|
41 |
+
style: ## update code style.
|
42 |
+
black ${target_dirs}
|
43 |
+
isort ${target_dirs}
|
44 |
+
|
45 |
+
lint: ## run pylint linter.
|
46 |
+
pylint ${target_dirs}
|
47 |
+
black ${target_dirs} --check
|
48 |
+
isort ${target_dirs} --check-only
|
49 |
+
|
50 |
+
system-deps: ## install linux system deps
|
51 |
+
sudo apt-get install -y libsndfile1-dev
|
52 |
+
|
53 |
+
dev-deps: ## install development deps
|
54 |
+
pip install -r requirements.dev.txt
|
55 |
+
|
56 |
+
doc-deps: ## install docs dependencies
|
57 |
+
pip install -r docs/requirements.txt
|
58 |
+
|
59 |
+
build-docs: ## build the docs
|
60 |
+
cd docs && make clean && make build
|
61 |
+
|
62 |
+
hub-deps: ## install deps for torch hub use
|
63 |
+
pip install -r requirements.hub.txt
|
64 |
+
|
65 |
+
deps: ## install 🐸 requirements.
|
66 |
+
pip install -r requirements.txt
|
67 |
+
|
68 |
+
install: ## install 🐸 TTS for development.
|
69 |
+
pip install -e .[all]
|
70 |
+
|
71 |
+
docs: ## build the docs
|
72 |
+
$(MAKE) -C docs clean && $(MAKE) -C docs html
|
README.md
CHANGED
@@ -1,3 +1,373 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
|
3 |
+
## 🐸Coqui.ai News
|
4 |
+
- 📣 [🐶Bark](https://github.com/suno-ai/bark) is now available for inference with unconstrained voice cloning. [Docs](https://tts.readthedocs.io/en/dev/models/bark.html)
|
5 |
+
- 📣 You can use [~1100 Fairseq models](https://github.com/facebookresearch/fairseq/tree/main/examples/mms) with 🐸TTS.
|
6 |
+
- 📣 🐸TTS now supports 🐢Tortoise with faster inference. [Docs](https://tts.readthedocs.io/en/dev/models/tortoise.html)
|
7 |
+
- 📣 **Coqui Studio API** has landed on 🐸TTS. - [Example](https://github.com/coqui-ai/TTS/blob/dev/README.md#-python-api)
|
8 |
+
- 📣 [**Coqui Studio API**](https://docs.coqui.ai/docs) is live.
|
9 |
+
- 📣 Voice generation with prompts - **Prompt to Voice** - is live on [**Coqui Studio**](https://app.coqui.ai/auth/signin)!! - [Blog Post](https://coqui.ai/blog/tts/prompt-to-voice)
|
10 |
+
- 📣 Voice generation with fusion - **Voice fusion** - is live on [**Coqui Studio**](https://app.coqui.ai/auth/signin).
|
11 |
+
- 📣 Voice cloning is live on [**Coqui Studio**](https://app.coqui.ai/auth/signin).
|
12 |
+
|
13 |
+
## <img src="https://raw.githubusercontent.com/coqui-ai/TTS/main/images/coqui-log-green-TTS.png" height="56"/>
|
14 |
+
|
15 |
+
|
16 |
+
🐸TTS is a library for advanced Text-to-Speech generation. It is built on the latest research and was designed to achieve the best trade-off among ease-of-training, speed and quality.
|
17 |
+
🐸TTS comes with pretrained models and tools for measuring dataset quality, and is already used in **20+ languages** for products and research projects.
|
18 |
+
|
19 |
+
[![Discord](https://img.shields.io/discord/1037326658807533628?color=%239B59B6&label=chat%20on%20discord)](https://discord.gg/5eXr5seRrv)
|
20 |
+
[![License](<https://img.shields.io/badge/License-MPL%202.0-brightgreen.svg>)](https://opensource.org/licenses/MPL-2.0)
|
21 |
+
[![PyPI version](https://badge.fury.io/py/TTS.svg)](https://badge.fury.io/py/TTS)
|
22 |
+
[![Covenant](https://camo.githubusercontent.com/7d620efaa3eac1c5b060ece5d6aacfcc8b81a74a04d05cd0398689c01c4463bb/68747470733a2f2f696d672e736869656c64732e696f2f62616467652f436f6e7472696275746f72253230436f76656e616e742d76322e3025323061646f707465642d6666363962342e737667)](https://github.com/coqui-ai/TTS/blob/master/CODE_OF_CONDUCT.md)
|
23 |
+
[![Downloads](https://pepy.tech/badge/tts)](https://pepy.tech/project/tts)
|
24 |
+
[![DOI](https://zenodo.org/badge/265612440.svg)](https://zenodo.org/badge/latestdoi/265612440)
|
25 |
+
|
26 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/aux_tests.yml/badge.svg)
|
27 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/data_tests.yml/badge.svg)
|
28 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/docker.yaml/badge.svg)
|
29 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/inference_tests.yml/badge.svg)
|
30 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/style_check.yml/badge.svg)
|
31 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/text_tests.yml/badge.svg)
|
32 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/tts_tests.yml/badge.svg)
|
33 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/vocoder_tests.yml/badge.svg)
|
34 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/zoo_tests0.yml/badge.svg)
|
35 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/zoo_tests1.yml/badge.svg)
|
36 |
+
![GithubActions](https://github.com/coqui-ai/TTS/actions/workflows/zoo_tests2.yml/badge.svg)
|
37 |
+
[![Docs](<https://readthedocs.org/projects/tts/badge/?version=latest&style=plastic>)](https://tts.readthedocs.io/en/latest/)
|
38 |
+
|
39 |
+
📰 [**Subscribe to 🐸Coqui.ai Newsletter**](https://coqui.ai/?subscription=true)
|
40 |
+
|
41 |
+
📢 [English Voice Samples](https://erogol.github.io/ddc-samples/) and [SoundCloud playlist](https://soundcloud.com/user-565970875/pocket-article-wavernn-and-tacotron2)
|
42 |
+
|
43 |
+
📄 [Text-to-Speech paper collection](https://github.com/erogol/TTS-papers)
|
44 |
+
|
45 |
+
<img src="https://static.scarf.sh/a.png?x-pxid=cf317fe7-2188-4721-bc01-124bb5d5dbb2" />
|
46 |
+
|
47 |
+
## 💬 Where to ask questions
|
48 |
+
Please use our dedicated channels for questions and discussion. Help is much more valuable if it's shared publicly so that more people can benefit from it.
|
49 |
+
|
50 |
+
| Type | Platforms |
|
51 |
+
| ------------------------------- | --------------------------------------- |
|
52 |
+
| 🚨 **Bug Reports** | [GitHub Issue Tracker] |
|
53 |
+
| 🎁 **Feature Requests & Ideas** | [GitHub Issue Tracker] |
|
54 |
+
| 👩💻 **Usage Questions** | [GitHub Discussions] |
|
55 |
+
| 🗯 **General Discussion** | [GitHub Discussions] or [Discord] |
|
56 |
+
|
57 |
+
[github issue tracker]: https://github.com/coqui-ai/tts/issues
|
58 |
+
[github discussions]: https://github.com/coqui-ai/TTS/discussions
|
59 |
+
[discord]: https://discord.gg/5eXr5seRrv
|
60 |
+
[Tutorials and Examples]: https://github.com/coqui-ai/TTS/wiki/TTS-Notebooks-and-Tutorials
|
61 |
+
|
62 |
+
|
63 |
+
## 🔗 Links and Resources
|
64 |
+
| Type | Links |
|
65 |
+
| ------------------------------- | --------------------------------------- |
|
66 |
+
| 💼 **Documentation** | [ReadTheDocs](https://tts.readthedocs.io/en/latest/)
|
67 |
+
| 💾 **Installation** | [TTS/README.md](https://github.com/coqui-ai/TTS/tree/dev#install-tts)|
|
68 |
+
| 👩💻 **Contributing** | [CONTRIBUTING.md](https://github.com/coqui-ai/TTS/blob/main/CONTRIBUTING.md)|
|
69 |
+
| 📌 **Road Map** | [Main Development Plans](https://github.com/coqui-ai/TTS/issues/378)
|
70 |
+
| 🚀 **Released Models** | [TTS Releases](https://github.com/coqui-ai/TTS/releases) and [Experimental Models](https://github.com/coqui-ai/TTS/wiki/Experimental-Released-Models)|
|
71 |
+
|
72 |
+
## 🥇 TTS Performance
|
73 |
+
<p align="center"><img src="https://raw.githubusercontent.com/coqui-ai/TTS/main/images/TTS-performance.png" width="800" /></p>
|
74 |
+
|
75 |
+
Underlined "TTS*" and "Judy*" are **internal** 🐸TTS models that are not released open-source. They are here to show the potential.
|
76 |
+
|
77 |
+
## Features
|
78 |
+
- High-performance Deep Learning models for Text2Speech tasks.
|
79 |
+
- Text2Spec models (Tacotron, Tacotron2, Glow-TTS, SpeedySpeech).
|
80 |
+
- Speaker Encoder to compute speaker embeddings efficiently.
|
81 |
+
- Vocoder models (MelGAN, Multiband-MelGAN, GAN-TTS, ParallelWaveGAN, WaveGrad, WaveRNN)
|
82 |
+
- Fast and efficient model training.
|
83 |
+
- Detailed training logs on the terminal and Tensorboard.
|
84 |
+
- Support for Multi-speaker TTS.
|
85 |
+
- Efficient, flexible, lightweight but feature complete `Trainer API`.
|
86 |
+
- Released and ready-to-use models.
|
87 |
+
- Tools to curate Text2Speech datasets under ```dataset_analysis```.
|
88 |
+
- Utilities to use and test your models.
|
89 |
+
- Modular (but not too much) code base enabling easy implementation of new ideas.
|
90 |
+
|
91 |
+
## Implemented Models
|
92 |
+
### Spectrogram models
|
93 |
+
- Tacotron: [paper](https://arxiv.org/abs/1703.10135)
|
94 |
+
- Tacotron2: [paper](https://arxiv.org/abs/1712.05884)
|
95 |
+
- Glow-TTS: [paper](https://arxiv.org/abs/2005.11129)
|
96 |
+
- Speedy-Speech: [paper](https://arxiv.org/abs/2008.03802)
|
97 |
+
- Align-TTS: [paper](https://arxiv.org/abs/2003.01950)
|
98 |
+
- FastPitch: [paper](https://arxiv.org/pdf/2006.06873.pdf)
|
99 |
+
- FastSpeech: [paper](https://arxiv.org/abs/1905.09263)
|
100 |
+
- FastSpeech2: [paper](https://arxiv.org/abs/2006.04558)
|
101 |
+
- SC-GlowTTS: [paper](https://arxiv.org/abs/2104.05557)
|
102 |
+
- Capacitron: [paper](https://arxiv.org/abs/1906.03402)
|
103 |
+
- OverFlow: [paper](https://arxiv.org/abs/2211.06892)
|
104 |
+
- Neural HMM TTS: [paper](https://arxiv.org/abs/2108.13320)
|
105 |
+
|
106 |
+
### End-to-End Models
|
107 |
+
- VITS: [paper](https://arxiv.org/pdf/2106.06103)
|
108 |
+
- 🐸 YourTTS: [paper](https://arxiv.org/abs/2112.02418)
|
109 |
+
- 🐢 Tortoise: [orig. repo](https://github.com/neonbjb/tortoise-tts)
|
110 |
+
- 🐶 Bark: [orig. repo](https://github.com/suno-ai/bark)
|
111 |
+
|
112 |
+
### Attention Methods
|
113 |
+
- Guided Attention: [paper](https://arxiv.org/abs/1710.08969)
|
114 |
+
- Forward Backward Decoding: [paper](https://arxiv.org/abs/1907.09006)
|
115 |
+
- Graves Attention: [paper](https://arxiv.org/abs/1910.10288)
|
116 |
+
- Double Decoder Consistency: [blog](https://erogol.com/solving-attention-problems-of-tts-models-with-double-decoder-consistency/)
|
117 |
+
- Dynamic Convolutional Attention: [paper](https://arxiv.org/pdf/1910.10288.pdf)
|
118 |
+
- Alignment Network: [paper](https://arxiv.org/abs/2108.10447)
|
119 |
+
|
120 |
+
### Speaker Encoder
|
121 |
+
- GE2E: [paper](https://arxiv.org/abs/1710.10467)
|
122 |
+
- Angular Loss: [paper](https://arxiv.org/pdf/2003.11982.pdf)
|
123 |
+
|
124 |
+
### Vocoders
|
125 |
+
- MelGAN: [paper](https://arxiv.org/abs/1910.06711)
|
126 |
+
- MultiBandMelGAN: [paper](https://arxiv.org/abs/2005.05106)
|
127 |
+
- ParallelWaveGAN: [paper](https://arxiv.org/abs/1910.11480)
|
128 |
+
- GAN-TTS discriminators: [paper](https://arxiv.org/abs/1909.11646)
|
129 |
+
- WaveRNN: [origin](https://github.com/fatchord/WaveRNN/)
|
130 |
+
- WaveGrad: [paper](https://arxiv.org/abs/2009.00713)
|
131 |
+
- HiFiGAN: [paper](https://arxiv.org/abs/2010.05646)
|
132 |
+
- UnivNet: [paper](https://arxiv.org/abs/2106.07889)
|
133 |
+
|
134 |
+
### Voice Conversion
|
135 |
+
- FreeVC: [paper](https://arxiv.org/abs/2210.15418)
|
136 |
+
|
137 |
+
You can also help us implement more models.
|
138 |
+
|
139 |
+
## Install TTS
|
140 |
+
🐸TTS is tested on Ubuntu 18.04 with **python >= 3.7, < 3.11**.
|
141 |
+
|
142 |
+
If you are only interested in [synthesizing speech](https://tts.readthedocs.io/en/latest/inference.html) with the released 🐸TTS models, installing from PyPI is the easiest option.
|
143 |
+
|
144 |
+
```bash
|
145 |
+
pip install TTS
|
146 |
+
```
|
147 |
+
|
148 |
+
If you plan to code or train models, clone 🐸TTS and install it locally.
|
149 |
+
|
150 |
+
```bash
|
151 |
+
git clone https://github.com/coqui-ai/TTS
|
152 |
+
pip install -e .[all,dev,notebooks] # Select the relevant extras
|
153 |
+
```
|
154 |
+
|
155 |
+
If you are on Ubuntu (Debian), you can also run the following commands for installation.
|
156 |
+
|
157 |
+
```bash
|
158 |
+
$ make system-deps # intended to be used on Ubuntu (Debian). Let us know if you have a different OS.
|
159 |
+
$ make install
|
160 |
+
```
|
161 |
+
|
162 |
+
If you are on Windows, 👑@GuyPaddock wrote installation instructions [here](https://stackoverflow.com/questions/66726331/how-can-i-run-mozilla-tts-coqui-tts-training-with-cuda-on-a-windows-system).
|
163 |
+
|
164 |
+
|
165 |
+
## Docker Image
|
166 |
+
You can also try TTS without installing it by using the Docker image.
|
167 |
+
Simply run the following command and you will be able to run TTS without installing it.
|
168 |
+
|
169 |
+
```bash
|
170 |
+
docker run --rm -it -p 5002:5002 --entrypoint /bin/bash ghcr.io/coqui-ai/tts-cpu
|
171 |
+
python3 TTS/server/server.py --list_models #To get the list of available models
|
172 |
+
python3 TTS/server/server.py --model_name tts_models/en/vctk/vits # To start a server
|
173 |
+
```
|
174 |
+
|
175 |
+
You can then enjoy the TTS server [here](http://[::1]:5002/)
|
176 |
+
More details about the docker images (like GPU support) can be found [here](https://tts.readthedocs.io/en/latest/docker_images.html)
|
177 |
+
|
178 |
+
|
179 |
+
## Synthesizing speech by 🐸TTS
|
180 |
+
|
181 |
+
### 🐍 Python API
|
182 |
+
|
183 |
+
```python
|
184 |
+
from TTS.api import TTS
|
185 |
+
|
186 |
+
# Running a multi-speaker and multi-lingual model
|
187 |
+
|
188 |
+
# List available 🐸TTS models and choose the first one
|
189 |
+
model_name = TTS.list_models()[0]
|
190 |
+
# Init TTS
|
191 |
+
tts = TTS(model_name)
|
192 |
+
|
193 |
+
# Run TTS
|
194 |
+
|
195 |
+
# ❗ Since this model is multi-speaker and multi-lingual, we must set the target speaker and the language
|
196 |
+
# Text to speech with a numpy output
|
197 |
+
wav = tts.tts("This is a test! This is also a test!!", speaker=tts.speakers[0], language=tts.languages[0])
|
198 |
+
# Text to speech to a file
|
199 |
+
tts.tts_to_file(text="Hello world!", speaker=tts.speakers[0], language=tts.languages[0], file_path="output.wav")
|
200 |
+
|
201 |
+
# Running a single speaker model
|
202 |
+
|
203 |
+
# Init TTS with the target model name
|
204 |
+
tts = TTS(model_name="tts_models/de/thorsten/tacotron2-DDC", progress_bar=False, gpu=False)
|
205 |
+
# Run TTS
|
206 |
+
tts.tts_to_file(text="Ich bin eine Testnachricht.", file_path=OUTPUT_PATH)
|
207 |
+
|
208 |
+
# Example voice cloning with YourTTS in English, French and Portuguese
|
209 |
+
|
210 |
+
tts = TTS(model_name="tts_models/multilingual/multi-dataset/your_tts", progress_bar=False, gpu=True)
|
211 |
+
tts.tts_to_file("This is voice cloning.", speaker_wav="my/cloning/audio.wav", language="en", file_path="output.wav")
|
212 |
+
tts.tts_to_file("C'est le clonage de la voix.", speaker_wav="my/cloning/audio.wav", language="fr-fr", file_path="output.wav")
|
213 |
+
tts.tts_to_file("Isso é clonagem de voz.", speaker_wav="my/cloning/audio.wav", language="pt-br", file_path="output.wav")
|
214 |
+
|
215 |
+
|
216 |
+
# Example voice conversion converting speaker of the `source_wav` to the speaker of the `target_wav`
|
217 |
+
|
218 |
+
tts = TTS(model_name="voice_conversion_models/multilingual/vctk/freevc24", progress_bar=False, gpu=True)
|
219 |
+
tts.voice_conversion_to_file(source_wav="my/source.wav", target_wav="my/target.wav", file_path="output.wav")
|
220 |
+
|
221 |
+
# Example voice cloning by a single speaker TTS model combining with the voice conversion model. This way, you can
|
222 |
+
# clone voices by using any model in 🐸TTS.
|
223 |
+
|
224 |
+
tts = TTS("tts_models/de/thorsten/tacotron2-DDC")
|
225 |
+
tts.tts_with_vc_to_file(
|
226 |
+
"Wie sage ich auf Italienisch, dass ich dich liebe?",
|
227 |
+
speaker_wav="target/speaker.wav",
|
228 |
+
file_path="output.wav"
|
229 |
+
)
|
230 |
+
|
231 |
+
# Example text to speech using [🐸Coqui Studio](https://coqui.ai) models.
|
232 |
+
|
233 |
+
# You can use all of your available speakers in the studio.
|
234 |
+
# [🐸Coqui Studio](https://coqui.ai) API token is required. You can get it from the [account page](https://coqui.ai/account).
|
235 |
+
# You should set the `COQUI_STUDIO_TOKEN` environment variable to use the API token.
|
236 |
+
|
237 |
+
# If you have a valid API token set you will see the studio speakers as separate models in the list.
|
238 |
+
# The name format is coqui_studio/en/<studio_speaker_name>/coqui_studio
|
239 |
+
models = TTS().list_models()
|
240 |
+
# Init TTS with the target studio speaker
|
241 |
+
tts = TTS(model_name="coqui_studio/en/Torcull Diarmuid/coqui_studio", progress_bar=False, gpu=False)
|
242 |
+
# Run TTS
|
243 |
+
tts.tts_to_file(text="This is a test.", file_path=OUTPUT_PATH)
|
244 |
+
# Run TTS with emotion and speed control
|
245 |
+
tts.tts_to_file(text="This is a test.", file_path=OUTPUT_PATH, emotion="Happy", speed=1.5)
|
246 |
+
|
247 |
+
|
248 |
+
#Example text to speech using **Fairseq models in ~1100 languages** 🤯.
|
249 |
+
|
250 |
+
#For these models use the following name format: `tts_models/<lang-iso_code>/fairseq/vits`.
|
251 |
+
#You can find the list of language ISO codes [here](https://dl.fbaipublicfiles.com/mms/tts/all-tts-languages.html) and learn about the Fairseq models [here](https://github.com/facebookresearch/fairseq/tree/main/examples/mms).
|
252 |
+
|
253 |
+
# TTS with on the fly voice conversion
|
254 |
+
api = TTS("tts_models/deu/fairseq/vits")
|
255 |
+
api.tts_with_vc_to_file(
|
256 |
+
"Wie sage ich auf Italienisch, dass ich dich liebe?",
|
257 |
+
speaker_wav="target/speaker.wav",
|
258 |
+
file_path="output.wav"
|
259 |
+
)
|
260 |
+
```
|
261 |
+
|
262 |
+
### Command line `tts`
|
263 |
+
#### Single Speaker Models
|
264 |
+
|
265 |
+
- List provided models:
|
266 |
+
|
267 |
+
```
|
268 |
+
$ tts --list_models
|
269 |
+
```
|
270 |
+
- Get model info (for both tts_models and vocoder_models):
|
271 |
+
- Query by type/name:
|
272 |
+
The model_info_by_name uses the name as it appears in the --list_models output.
|
273 |
+
```
|
274 |
+
$ tts --model_info_by_name "<model_type>/<language>/<dataset>/<model_name>"
|
275 |
+
```
|
276 |
+
For example:
|
277 |
+
|
278 |
+
```
|
279 |
+
$ tts --model_info_by_name tts_models/tr/common-voice/glow-tts
|
280 |
+
```
|
281 |
+
```
|
282 |
+
$ tts --model_info_by_name vocoder_models/en/ljspeech/hifigan_v2
|
283 |
+
```
|
284 |
+
- Query by type/idx:
|
285 |
+
The model_query_idx uses the corresponding idx from --list_models.
|
286 |
+
```
|
287 |
+
$ tts --model_info_by_idx "<model_type>/<model_query_idx>"
|
288 |
+
```
|
289 |
+
For example:
|
290 |
+
|
291 |
+
```
|
292 |
+
$ tts --model_info_by_idx tts_models/3
|
293 |
+
```
|
294 |
+
|
295 |
+
- Run TTS with default models:
|
296 |
+
|
297 |
+
```
|
298 |
+
$ tts --text "Text for TTS" --out_path output/path/speech.wav
|
299 |
+
```
|
300 |
+
|
301 |
+
- Run a TTS model with its default vocoder model:
|
302 |
+
|
303 |
+
```
|
304 |
+
$ tts --text "Text for TTS" --model_name "<model_type>/<language>/<dataset>/<model_name>" --out_path output/path/speech.wav
|
305 |
+
```
|
306 |
+
For example:
|
307 |
+
|
308 |
+
```
|
309 |
+
$ tts --text "Text for TTS" --model_name "tts_models/en/ljspeech/glow-tts" --out_path output/path/speech.wav
|
310 |
+
```
|
311 |
+
|
312 |
+
- Run with specific TTS and vocoder models from the list:
|
313 |
+
|
314 |
+
```
|
315 |
+
$ tts --text "Text for TTS" --model_name "<model_type>/<language>/<dataset>/<model_name>" --vocoder_name "<model_type>/<language>/<dataset>/<model_name>" --out_path output/path/speech.wav
|
316 |
+
```
|
317 |
+
|
318 |
+
For example:
|
319 |
+
|
320 |
+
```
|
321 |
+
$ tts --text "Text for TTS" --model_name "tts_models/en/ljspeech/glow-tts" --vocoder_name "vocoder_models/en/ljspeech/univnet" --out_path output/path/speech.wav
|
322 |
+
```
|
323 |
+
|
324 |
+
|
325 |
+
- Run your own TTS model (Using Griffin-Lim Vocoder):
|
326 |
+
|
327 |
+
```
|
328 |
+
$ tts --text "Text for TTS" --model_path path/to/model.pth --config_path path/to/config.json --out_path output/path/speech.wav
|
329 |
+
```
|
330 |
+
|
331 |
+
- Run your own TTS and Vocoder models:
|
332 |
+
```
|
333 |
+
$ tts --text "Text for TTS" --model_path path/to/model.pth --config_path path/to/config.json --out_path output/path/speech.wav
|
334 |
+
--vocoder_path path/to/vocoder.pth --vocoder_config_path path/to/vocoder_config.json
|
335 |
+
```
|
336 |
+
|
337 |
+
#### Multi-speaker Models
|
338 |
+
|
339 |
+
- List the available speakers and choose a <speaker_id> among them:
|
340 |
+
|
341 |
+
```
|
342 |
+
$ tts --model_name "<language>/<dataset>/<model_name>" --list_speaker_idxs
|
343 |
+
```
|
344 |
+
|
345 |
+
- Run the multi-speaker TTS model with the target speaker ID:
|
346 |
+
|
347 |
+
```
|
348 |
+
$ tts --text "Text for TTS." --out_path output/path/speech.wav --model_name "<language>/<dataset>/<model_name>" --speaker_idx <speaker_id>
|
349 |
+
```
|
350 |
+
|
351 |
+
- Run your own multi-speaker TTS model:
|
352 |
+
|
353 |
+
```
|
354 |
+
$ tts --text "Text for TTS" --out_path output/path/speech.wav --model_path path/to/model.pth --config_path path/to/config.json --speakers_file_path path/to/speaker.json --speaker_idx <speaker_id>
|
355 |
+
```
|
356 |
+
|
357 |
+
## Directory Structure
|
358 |
+
```
|
359 |
+
|- notebooks/ (Jupyter Notebooks for model evaluation, parameter selection and data analysis.)
|
360 |
+
|- utils/ (common utilities.)
|
361 |
+
|- TTS
|
362 |
+
|- bin/ (folder for all the executables.)
|
363 |
+
|- train*.py (train your target model.)
|
364 |
+
|- ...
|
365 |
+
|- tts/ (text to speech models)
|
366 |
+
|- layers/ (model layer definitions)
|
367 |
+
|- models/ (model definitions)
|
368 |
+
|- utils/ (model specific utilities.)
|
369 |
+
|- speaker_encoder/ (Speaker Encoder models.)
|
370 |
+
|- (same)
|
371 |
+
|- vocoder/ (Vocoder models.)
|
372 |
+
|- (same)
|
373 |
+
```
|
hubconf.py
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Modules PyTorch Hub checks for before loading an entry point from this file.
# Entries must be importable module names, not PyPI distribution names:
# the `mecab-python3` distribution is imported as `MeCab` and `unidic-lite`
# as `unidic_lite`; the hyphenated names can never be found by an import check.
dependencies = [
    'torch',
    'gdown',
    'pysbd',
    'gruut',
    'anyascii',
    'pypinyin',
    'coqpit',
    'MeCab',
    'unidic_lite',
]
|
4 |
+
import torch
|
5 |
+
|
6 |
+
from TTS.utils.manage import ModelManager
|
7 |
+
from TTS.utils.synthesizer import Synthesizer
|
8 |
+
|
9 |
+
|
10 |
+
def tts(model_name='tts_models/en/ljspeech/tacotron2-DCA',
        vocoder_name=None,
        use_cuda=False):
    """TTS entry point for PyTorch Hub that provides a Synthesizer object to synthesize speech from a given text.

    Example:
        >>> synthesizer = torch.hub.load('coqui-ai/TTS', 'tts', source='github')
        >>> wavs = synthesizer.tts("This is a test! This is also a test!!")
        wavs - is a list of values of the synthesized speech.

    Args:
        model_name (str, optional): One of the model names from .model.json. Defaults to 'tts_models/en/ljspeech/tacotron2-DCA'.
        vocoder_name (str, optional): One of the model names from .model.json. Defaults to None, in which case the
            'default_vocoder' entry of the downloaded TTS model is used.
        use_cuda (bool, optional): Forwarded unchanged to the Synthesizer. Defaults to False.

    Returns:
        TTS.utils.synthesizer.Synthesizer: Synthesizer object wrapping both vocoder and tts models.
    """
    manager = ModelManager()

    model_path, config_path, model_item = manager.download_model(model_name)
    if vocoder_name is None:
        vocoder_name = model_item['default_vocoder']

    # A model entry may carry no default vocoder; in that case skip the vocoder
    # download instead of asking the manager for a model named None.
    # NOTE(review): assumes Synthesizer treats None vocoder arguments as "no vocoder" - confirm.
    vocoder_path = None
    vocoder_config_path = None
    if vocoder_name is not None:
        vocoder_path, vocoder_config_path, _ = manager.download_model(vocoder_name)

    # create synthesizer
    synt = Synthesizer(tts_checkpoint=model_path,
                       tts_config_path=config_path,
                       vocoder_checkpoint=vocoder_path,
                       vocoder_config=vocoder_config_path,
                       use_cuda=use_cuda)
    return synt
|
42 |
+
|
43 |
+
|
44 |
+
if __name__ == '__main__':
    # Manual smoke test: load the `tts` entry point through PyTorch Hub from the
    # `dev` branch of the GitHub repository and synthesize one short sentence.
    synthesizer = torch.hub.load('coqui-ai/TTS:dev', 'tts', source='github')
    synthesizer.tts("This is a test!")
|
pyproject.toml
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[build-system]
|
2 |
+
requires = ["setuptools", "wheel", "cython==0.29.30", "numpy==1.22.0", "packaging"]
|
3 |
+
|
4 |
+
[flake8]
|
5 |
+
max-line-length=120
|
6 |
+
|
7 |
+
[tool.black]
|
8 |
+
line-length = 120
|
9 |
+
target-version = ['py39']
|
10 |
+
exclude = '''
|
11 |
+
|
12 |
+
(
|
13 |
+
/(
|
14 |
+
\.eggs # exclude a few common directories in the
|
15 |
+
| \.git # root of the project
|
16 |
+
| \.hg
|
17 |
+
| \.mypy_cache
|
18 |
+
| \.tox
|
19 |
+
| \.venv
|
20 |
+
| _build
|
21 |
+
| buck-out
|
22 |
+
| build
|
23 |
+
| dist
|
24 |
+
)/
|
25 |
+
| foo.py # also separately exclude a file named foo.py in
|
26 |
+
# the root of the project
|
27 |
+
)
|
28 |
+
'''
|
29 |
+
|
30 |
+
[tool.isort]
|
31 |
+
line_length = 120
|
32 |
+
profile = "black"
|
33 |
+
multi_line_output = 3
|
requirements.dev.txt
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
black
|
2 |
+
coverage
|
3 |
+
isort
|
4 |
+
nose2
|
5 |
+
pylint==2.10.2
|
requirements.notebooks.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
bokeh==1.4.0
|
requirements.txt
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# core deps
|
2 |
+
numpy==1.22.0;python_version<="3.10"
|
3 |
+
numpy==1.24.3;python_version>"3.10"
|
4 |
+
cython==0.29.30
|
5 |
+
scipy>=1.4.0
|
6 |
+
torch>=1.7
|
7 |
+
torchaudio
|
8 |
+
soundfile
|
9 |
+
librosa==0.10.0.*
|
10 |
+
numba==0.55.1;python_version<"3.9"
|
11 |
+
numba==0.57.0;python_version>="3.9"
|
12 |
+
inflect==5.6.0
|
13 |
+
tqdm
|
14 |
+
anyascii
|
15 |
+
pyyaml
|
16 |
+
fsspec>=2021.04.0
|
17 |
+
aiohttp
|
18 |
+
packaging
|
19 |
+
# deps for examples
|
20 |
+
flask
|
21 |
+
# deps for inference
|
22 |
+
pysbd
|
23 |
+
# deps for notebooks
|
24 |
+
umap-learn==0.5.1
|
25 |
+
pandas
|
26 |
+
# deps for training
|
27 |
+
matplotlib
|
28 |
+
# coqui stack
|
29 |
+
trainer
|
30 |
+
# config management
|
31 |
+
coqpit>=0.0.16
|
32 |
+
# chinese g2p deps
|
33 |
+
jieba
|
34 |
+
pypinyin
|
35 |
+
# japanese g2p deps
|
36 |
+
mecab-python3==1.0.6
|
37 |
+
unidic-lite==1.0.8
|
38 |
+
# gruut+supported langs
|
39 |
+
gruut[de,es,fr]==2.2.3
|
40 |
+
# deps for korean
|
41 |
+
jamo
|
42 |
+
nltk
|
43 |
+
g2pkk>=0.1.1
|
44 |
+
# deps for bangla
|
45 |
+
bangla==0.0.2
|
46 |
+
bnnumerizer
|
47 |
+
bnunicodenormalizer==0.1.1
|
48 |
+
# deps for tortoise
|
49 |
+
k_diffusion
|
50 |
+
einops
|
51 |
+
transformers
|
52 |
+
# deps for bark
|
53 |
+
encodec
|
run_bash_tests.sh
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
set -e
# Export the variable so the test scripts launched below (child processes)
# actually inherit it; a plain assignment stays local to this shell.
export TF_CPP_MIN_LOG_LEVEL=3

# runtime bash based tests
# TODO: move these to python
./tests/bash_tests/test_demo_server.sh && \
./tests/bash_tests/test_compute_statistics.sh
|
setup.cfg
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[build_py]
|
2 |
+
build_lib=temp_build
|
3 |
+
|
4 |
+
[bdist_wheel]
|
5 |
+
bdist_dir=temp_build
|
6 |
+
|
7 |
+
[install_lib]
|
8 |
+
build_dir=temp_build
|
setup.py
ADDED
@@ -0,0 +1,138 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#!/usr/bin/env python
|
2 |
+
# ,*++++++*, ,*++++++*,
|
3 |
+
# *++. .+++ *++. .++*
|
4 |
+
# *+* ,++++* *+* *+* ,++++, *+*
|
5 |
+
# ,+, .++++++++++* ,++,,,,*+, ,++++++++++. *+,
|
6 |
+
# *+. .++++++++++++..++ *+.,++++++++++++. .+*
|
7 |
+
# .+* ++++++++++++.*+, .+*.++++++++++++ *+,
|
8 |
+
# .++ *++++++++* ++, .++.*++++++++* ++,
|
9 |
+
# ,+++*. . .*++, ,++*. .*+++*
|
10 |
+
# *+, .,*++**. .**++**. ,+*
|
11 |
+
# .+* *+,
|
12 |
+
# *+. Coqui .+*
|
13 |
+
# *+* +++ TTS +++ *+*
|
14 |
+
# .+++*. . . *+++.
|
15 |
+
# ,+* *+++*... ...*+++* *+,
|
16 |
+
# .++. .""""+++++++****+++++++"""". ++.
|
17 |
+
# ,++. .++,
|
18 |
+
# .++* *++.
|
19 |
+
# *+++, ,+++*
|
20 |
+
# .,*++++::::::++++*,.
|
21 |
+
# ``````
|
22 |
+
|
23 |
+
import os
|
24 |
+
import subprocess
|
25 |
+
import sys
|
26 |
+
from packaging.version import Version
|
27 |
+
|
28 |
+
import numpy
|
29 |
+
import setuptools.command.build_py
|
30 |
+
import setuptools.command.develop
|
31 |
+
from Cython.Build import cythonize
|
32 |
+
from setuptools import Extension, find_packages, setup
|
33 |
+
|
34 |
+
# Textual interpreter version (first token of sys.version), kept for reference.
python_version = sys.version.split()[0]
# Gate on the numeric (major, minor) tuple rather than parsing the textual version:
# some builds report strings such as "3.10.4+" which packaging's Version() rejects,
# turning the intended friendly error into an unrelated parsing failure.
if not (3, 9) <= sys.version_info[:2] < (3, 12):
    raise RuntimeError("TTS requires python >= 3.9 and < 3.12 " "but your Python version is {}".format(sys.version))
|
37 |
+
|
38 |
+
|
39 |
+
# Absolute directory containing this setup.py; used to locate files shipped next to it.
cwd = os.path.dirname(os.path.abspath(__file__))
# The package version is the stripped content of TTS/VERSION.
with open(os.path.join(cwd, "TTS", "VERSION")) as fin:
    version = fin.read().strip()
|
42 |
+
|
43 |
+
|
44 |
+
class build_py(setuptools.command.build_py.build_py):  # pylint: disable=too-many-ancestors
    """`build_py` command registered in `cmdclass`; it only delegates to setuptools' implementation."""

    def run(self):
        # No custom steps: run the stock setuptools build_py.
        setuptools.command.build_py.build_py.run(self)
|
47 |
+
|
48 |
+
|
49 |
+
class develop(setuptools.command.develop.develop):
    """`develop` command registered in `cmdclass`; it only delegates to setuptools' implementation."""

    def run(self):
        # No custom steps: run the stock setuptools develop.
        setuptools.command.develop.develop.run(self)
|
52 |
+
|
53 |
+
|
54 |
+
# The documentation for this feature is in server/README.md
# NOTE(review): the setup() call in this file passes its own literal `package_data`
# dict and does not reference this list - confirm whether it is still needed.
package_data = ["TTS/server/templates/*"]
|
56 |
+
|
57 |
+
|
58 |
+
def pip_install(package_name):
    """Install `package_name` with pip, using the interpreter that runs this script.

    The exit status returned by `subprocess.call` is discarded, so a failed
    installation is not reported to the caller.
    """
    subprocess.call([sys.executable, "-m", "pip", "install", package_name])
|
60 |
+
|
61 |
+
|
62 |
+
# Read the requirement lists that sit next to this setup.py. Each file is opened
# in a `with` block so the handle is closed deterministically.
with open(os.path.join(cwd, "requirements.txt"), "r") as f:
    requirements = f.readlines()
with open(os.path.join(cwd, "requirements.notebooks.txt"), "r") as f:
    requirements_notebooks = f.readlines()
with open(os.path.join(cwd, "requirements.dev.txt"), "r") as f:
    requirements_dev = f.readlines()
# The "all" extra is the union of the optional groups (dev + notebooks).
requirements_all = requirements_dev + requirements_notebooks
|
68 |
+
|
69 |
+
# Resolve README.md relative to this file (like the other files read here) so the
# build does not depend on the directory the command is invoked from.
with open(os.path.join(cwd, "README.md"), "r", encoding="utf-8") as readme_file:
    README = readme_file.read()
|
71 |
+
|
72 |
+
# Cython extension modules to compile; passed to cythonize() in the setup() call.
exts = [
    Extension(
        name="TTS.tts.utils.monotonic_align.core",
        sources=["TTS/tts/utils/monotonic_align/core.pyx"],
    )
]
|
78 |
+
setup(
    name="TTS",
    version=version,
    url="https://github.com/coqui-ai/TTS",
    author="Eren Gölge",
    author_email="egolge@coqui.ai",
    description="Deep learning for Text to Speech by Coqui.",
    long_description=README,
    long_description_content_type="text/markdown",
    license="MPL-2.0",
    # cython
    # include_dirs is documented as a list of directories, so wrap the single numpy path.
    include_dirs=[numpy.get_include()],
    ext_modules=cythonize(exts, language_level=3),
    # ext_modules=find_cython_extensions(),
    # package
    include_package_data=True,
    packages=find_packages(include=["TTS"], exclude=["*.tests", "*tests.*", "tests.*", "*tests", "tests"]),
    package_data={
        "TTS": [
            "VERSION",
        ]
    },
    project_urls={
        "Documentation": "https://github.com/coqui-ai/TTS/wiki",
        "Tracker": "https://github.com/coqui-ai/TTS/issues",
        "Repository": "https://github.com/coqui-ai/TTS",
        "Discussions": "https://github.com/coqui-ai/TTS/discussions",
    },
    cmdclass={
        "build_py": build_py,
        "develop": develop,
        # 'build_ext': build_ext
    },
    install_requires=requirements,
    extras_require={
        "all": requirements_all,
        "dev": requirements_dev,
        "notebooks": requirements_notebooks,
    },
    python_requires=">=3.9.0, <3.12",
    entry_points={"console_scripts": ["tts=TTS.bin.synthesize:main", "tts-server = TTS.server.server:main"]},
    classifiers=[
        "Programming Language :: Python",
        "Programming Language :: Python :: 3",
        "Programming Language :: Python :: 3.9",
        "Programming Language :: Python :: 3.10",
        "Programming Language :: Python :: 3.11",
        "Development Status :: 3 - Alpha",
        "Intended Audience :: Science/Research",
        "Intended Audience :: Developers",
        "Operating System :: POSIX :: Linux",
        "License :: OSI Approved :: Mozilla Public License 2.0 (MPL 2.0)",
        "Topic :: Software Development",
        "Topic :: Software Development :: Libraries :: Python Modules",
        "Topic :: Multimedia :: Sound/Audio :: Speech",
        "Topic :: Multimedia :: Sound/Audio",
        "Topic :: Multimedia",
        "Topic :: Scientific/Engineering :: Artificial Intelligence",
    ],
    zip_safe=False,
)
|