konstantin-paulus committed on
Commit
50f6de3
1 Parent(s): ecf83ea

rhasspy/piper-voices duplicate as of 2024-07-05

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .DS_Store +0 -0
  2. README.md +7 -3
  3. _script/voice_names.sh +7 -0
  4. _script/voicefest.py +325 -0
  5. ar/ar_JO/kareem/low/MODEL_CARD +15 -0
  6. ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx +3 -0
  7. ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx.json +508 -0
  8. ar/ar_JO/kareem/low/samples/speaker_0.mp3 +0 -0
  9. ar/ar_JO/kareem/medium/MODEL_CARD +15 -0
  10. ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx +3 -0
  11. ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx.json +508 -0
  12. ar/ar_JO/kareem/medium/samples/speaker_0.mp3 +0 -0
  13. ca/ca_ES/upc_ona/medium/MODEL_CARD +15 -0
  14. ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx +3 -0
  15. ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx.json +493 -0
  16. ca/ca_ES/upc_ona/medium/samples/speaker_0.mp3 +0 -0
  17. ca/ca_ES/upc_ona/x_low/ALIASES +1 -0
  18. ca/ca_ES/upc_ona/x_low/MODEL_CARD +15 -0
  19. ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx +3 -0
  20. ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx.json +420 -0
  21. ca/ca_ES/upc_ona/x_low/samples/speaker_0.mp3 +0 -0
  22. ca/ca_ES/upc_pau/x_low/ALIASES +1 -0
  23. ca/ca_ES/upc_pau/x_low/MODEL_CARD +15 -0
  24. ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx +3 -0
  25. ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx.json +420 -0
  26. ca/ca_ES/upc_pau/x_low/samples/speaker_0.mp3 +0 -0
  27. cs/cs_CZ/jirka/low/MODEL_CARD +15 -0
  28. cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx +3 -0
  29. cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx.json +508 -0
  30. cs/cs_CZ/jirka/low/samples/speaker_0.mp3 +0 -0
  31. cs/cs_CZ/jirka/medium/MODEL_CARD +15 -0
  32. cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx +3 -0
  33. cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx.json +508 -0
  34. cs/cs_CZ/jirka/medium/samples/speaker_0.mp3 +0 -0
  35. cy/cy_GB/gwryw_gogleddol/medium/MODEL_CARD +15 -0
  36. cy/cy_GB/gwryw_gogleddol/medium/cy_GB-gwryw_gogleddol-medium.onnx +3 -0
  37. cy/cy_GB/gwryw_gogleddol/medium/cy_GB-gwryw_gogleddol-medium.onnx.json +502 -0
  38. cy/cy_GB/gwryw_gogleddol/medium/samples/speaker_0.mp3 +0 -0
  39. da/da_DK/talesyntese/medium/ALIASES +1 -0
  40. da/da_DK/talesyntese/medium/MODEL_CARD +15 -0
  41. da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx +3 -0
  42. da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx.json +493 -0
  43. da/da_DK/talesyntese/medium/samples/speaker_0.mp3 +0 -0
  44. de/de_DE/eva_k/x_low/ALIASES +1 -0
  45. de/de_DE/eva_k/x_low/MODEL_CARD +15 -0
  46. de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx +3 -0
  47. de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx.json +420 -0
  48. de/de_DE/eva_k/x_low/samples/speaker_0.mp3 +0 -0
  49. de/de_DE/karlsson/low/ALIASES +1 -0
  50. de/de_DE/karlsson/low/MODEL_CARD +15 -0
.DS_Store ADDED
Binary file (6.15 kB). View file
 
README.md CHANGED
@@ -1,3 +1,7 @@
1
- ---
2
- license: mit
3
- ---
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
4
+
5
+ **Forked from:** [rhasspy/piper-voices](https://huggingface.co/rhasspy/piper-voices).
6
+
7
+ For checkpoints that you can use to [train your own voices](https://github.com/rhasspy/piper/blob/master/TRAINING.md), see [piper-checkpoints](https://huggingface.co/datasets/rhasspy/piper-checkpoints/tree/main).
_script/voice_names.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
#!/usr/bin/env bash
# Print the unique base names (without the .onnx extension) of every .onnx
# file found under the repository root, one per line, sorted.
set -eo pipefail

# Resolve the directory holding this script, then its parent (the repo root).
script_dir="$(cd "$(dirname "$0")" && pwd)"
repo_root="$(realpath "${script_dir}/..")"

find "${repo_root}" -type f -name '*.onnx' -exec basename '{}' '.onnx' \; | sort -u
_script/voicefest.py ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ import hashlib
3
+ import json
4
+ import unittest
5
+ from dataclasses import dataclass
6
+ from pathlib import Path
7
+ from typing import Set
8
+
9
+ _DIR = Path(__file__).parent
10
+ _REPO_DIR = _DIR.parent
11
+
12
+
13
@dataclass(frozen=True)
class Language:
    """Display names for one language/region code.

    Instances are used as the values of the module-level ``_LANGUAGES``
    table. They are frozen so that an entry of that shared table cannot be
    modified by accident after the module has been loaded.
    """

    # Name of the language written in the language itself.
    native: str
    # Name of the language in English.
    english: str
    # English name of the country/region the code refers to.
    country: str
18
+
19
+
20
# Language code ("family_REGION") -> display names for that language/region.
# Each row is (code, native name, English name, English country name).
_LANGUAGES = {
    code: Language(native, english, country)
    for code, native, english, country in (
        ("ar_JO", "العربية", "Arabic", "Jordan"),
        ("ca_ES", "Català", "Catalan", "Spain"),
        ("cs_CZ", "Čeština", "Czech", "Czech Republic"),
        ("cy_GB", "Cymraeg", "Welsh", "Great Britain"),
        ("da_DK", "Dansk", "Danish", "Denmark"),
        ("de_DE", "Deutsch", "German", "Germany"),
        ("el_GR", "Ελληνικά", "Greek", "Greece"),
        ("en_GB", "English", "English", "Great Britain"),
        ("en_US", "English", "English", "United States"),
        ("es_ES", "Español", "Spanish", "Spain"),
        ("es_MX", "Español", "Spanish", "Mexico"),
        ("fa_IR", "فارسی", "Farsi", "Iran"),
        ("fi_FI", "Suomi", "Finnish", "Finland"),
        ("fr_FR", "Français", "French", "France"),
        ("is_IS", "íslenska", "Icelandic", "Iceland"),
        ("it_IT", "Italiano", "Italian", "Italy"),
        ("hu_HU", "Magyar", "Hungarian", "Hungary"),
        ("ka_GE", "ქართული ენა", "Georgian", "Georgia"),
        ("kk_KZ", "қазақша", "Kazakh", "Kazakhstan"),
        ("lb_LU", "Lëtzebuergesch", "Luxembourgish", "Luxembourg"),
        ("ne_NP", "नेपाली", "Nepali", "Nepal"),
        ("nl_BE", "Nederlands", "Dutch", "Belgium"),
        ("nl_NL", "Nederlands", "Dutch", "Netherlands"),
        ("no_NO", "Norsk", "Norwegian", "Norway"),
        ("pl_PL", "Polski", "Polish", "Poland"),
        ("pt_BR", "Português", "Portuguese", "Brazil"),
        ("pt_PT", "Português", "Portuguese", "Portugal"),
        ("ro_RO", "Română", "Romanian", "Romania"),
        ("ru_RU", "Русский", "Russian", "Russia"),
        ("sk_SK", "Slovenčina", "Slovak", "Slovakia"),
        ("sl_SI", "Slovenščina", "Slovenian", "Slovenia"),
        ("sr_RS", "srpski", "Serbian", "Serbia"),
        ("sv_SE", "Svenska", "Swedish", "Sweden"),
        ("sw_CD", "Kiswahili", "Swahili", "Democratic Republic of the Congo"),
        ("tr_TR", "Türkçe", "Turkish", "Turkey"),
        ("uk_UA", "украї́нська мо́ва", "Ukrainian", "Ukraine"),
        ("vi_VN", "Tiếng Việt", "Vietnamese", "Vietnam"),
        ("zh_CN", "简体中文", "Chinese", "China"),
    )
}
60
+
61
+ # -----------------------------------------------------------------------------
62
+
63
+
64
def add_languages():
    """Fill in missing language, dataset and quality fields in voice configs.

    For every ``*.onnx`` file under ``_REPO_DIR`` the sibling config file
    (the same path with ``.json`` appended) is loaded. The file stem is
    split on ``-`` into language code, dataset and quality, and those values
    (plus the names from ``_LANGUAGES``) are written into the config wherever
    the corresponding key is absent:

    * ``language`` (the whole dict, or any individual key missing from it)
    * ``dataset``
    * ``audio.quality``

    Values already present are never overwritten, and a config file is only
    rewritten when at least one key was added.

    Raises:
        AssertionError: if the language code has no entry in ``_LANGUAGES``.
        ValueError: if a file stem does not split into exactly three parts.
    """
    for onnx_path in _REPO_DIR.rglob("*.onnx"):
        config_path = f"{onnx_path}.json"
        with open(config_path, "r", encoding="utf-8") as config_file:
            config = json.load(config_file)

        lang_code, dataset, quality = onnx_path.stem.split("-")

        lang_info = _LANGUAGES.get(lang_code)
        if lang_info is None:
            # Raised explicitly (rather than via ``assert``) so the check is
            # still performed when Python runs with -O; the exception type is
            # kept as AssertionError for backward compatibility.
            raise AssertionError(f"Missing name for language: {lang_code}")

        lang_family, lang_region = lang_code.split("_", maxsplit=1)
        lang_dict = {
            "code": lang_code,
            "family": lang_family,
            "region": lang_region,
            "name_native": lang_info.native,
            "name_english": lang_info.english,
            "country_english": lang_info.country,
        }

        is_changed = False

        if "language" not in config:
            config["language"] = lang_dict
            is_changed = True
        else:
            # Only add the keys that are missing; keep existing values as-is.
            current_lang_dict = config["language"]
            for key, value in lang_dict.items():
                if key not in current_lang_dict:
                    current_lang_dict[key] = value
                    is_changed = True

        if "dataset" not in config:
            config["dataset"] = dataset
            is_changed = True

        if "quality" not in config["audio"]:
            config["audio"]["quality"] = quality
            is_changed = True

        if is_changed:
            with open(config_path, "w", encoding="utf-8") as config_file:
                json.dump(config, config_file, ensure_ascii=False, indent=2)
126
+
127
+
128
+ # -----------------------------------------------------------------------------
129
+
130
+
131
class VoiceTest(unittest.TestCase):
    """Consistency checks for every voice (``*.onnx`` file) under ``_REPO_DIR``."""

    def test_voices(self):
        """Check each voice's config, directory layout, file name and aliases.

        Every ``*.onnx`` file is checked in its own sub-test, so a problem
        with one voice does not stop the remaining voices from being checked.
        """
        # Shared across all voices so that an alias listed in two different
        # ALIASES files is detected.
        used_aliases: Set[str] = set()

        for onnx_path in _REPO_DIR.rglob("*.onnx"):
            with self.subTest(onnx_path=onnx_path):
                self.assertGreater(onnx_path.stat().st_size, 0, "Empty onnx file")

                # Load JSON config for voice
                config_path = onnx_path.parent / f"{onnx_path.name}.json"
                with open(config_path, "r", encoding="utf-8") as config_file:
                    config = json.load(config_file)

                # Verify config
                self.assertIn(
                    "piper_version", config, "Missing piper_version in config"
                )
                self.assertIn("language", config, "Missing language in config")
                self.assertIn("dataset", config, "Missing dataset in config")
                self.assertIn(
                    "quality", config["audio"], "Missing audio quality in config"
                )

                # Verify directory structure
                # {lang_family}/{lang_code}/{dataset}/{quality}/
                quality_dir = onnx_path.parent
                dataset_dir = quality_dir.parent
                lang_code_dir = dataset_dir.parent
                lang_family_dir = lang_code_dir.parent

                self.assertEqual(
                    lang_family_dir.name,
                    config["language"]["family"],
                    "Wrong lang family dir",
                )
                self.assertEqual(
                    lang_code_dir.name,
                    config["language"]["code"],
                    "Wrong lang code dir",
                )
                self.assertEqual(
                    dataset_dir.name, config["dataset"], "Wrong dataset dir"
                )
                self.assertEqual(
                    quality_dir.name, config["audio"]["quality"], "Wrong quality dir"
                )
                self.assertIn(lang_code_dir.name, _LANGUAGES, "Unknown language code")

                # Verify file names: {lang_code}-{dataset}-{quality}.onnx
                file_lang_code, file_dataset, file_quality = onnx_path.stem.split("-")
                file_lang_family = file_lang_code.split("_", maxsplit=1)[0]

                self.assertEqual(
                    file_lang_family,
                    config["language"]["family"],
                    "Wrong lang family file",
                )
                self.assertEqual(
                    file_lang_code, config["language"]["code"], "Wrong lang code file"
                )
                self.assertEqual(file_dataset, config["dataset"], "Wrong dataset file")
                self.assertEqual(
                    file_quality, config["audio"]["quality"], "Wrong quality"
                )

                # Verify aliases are unique
                aliases_path = onnx_path.parent / "ALIASES"
                if aliases_path.exists():
                    with open(aliases_path, "r", encoding="utf-8") as aliases_file:
                        for alias in aliases_file:
                            alias = alias.strip()
                            if not alias:
                                # A blank line is not an alias. Without this
                                # guard the empty string would be recorded and
                                # a second file containing a blank line would
                                # be reported as a duplicate.
                                continue

                            self.assertNotIn(
                                alias,
                                used_aliases,
                                "Alias is already in use by another voice",
                            )
                            used_aliases.add(alias)
208
+
209
+
210
def run_tests() -> None:
    """Run the ``VoiceTest`` suite and abort if it did not pass.

    Raises:
        AssertionError: if the run was not successful, i.e. any test failed
            or raised an unexpected error.
    """
    # loadTestsFromTestCase replaces unittest.makeSuite, which is deprecated
    # and no longer available in recent Python versions.
    suite = unittest.defaultTestLoader.loadTestsFromTestCase(VoiceTest)
    result = unittest.TextTestRunner().run(suite)

    # wasSuccessful() also covers tests that errored (e.g. a missing or
    # malformed config file), which checking ``result.failures`` alone misses.
    # Raised explicitly so the check is not stripped under ``python -O``.
    if not result.wasSuccessful():
        raise AssertionError("Test failures")
214
+
215
+
216
+ # -----------------------------------------------------------------------------
217
+
218
+
219
def write_voices_json() -> None:
    """Write ``voices.json``, an index of every voice, to the repository root.

    One entry is produced per ``*.onnx`` file under ``_REPO_DIR`` (processed
    in sorted path order), built from the voice's JSON config, the
    ``_LANGUAGES`` table, and the optional ``ALIASES`` file next to the model.

    Raises:
        AssertionError: if a voice directory has no ``MODEL_CARD`` file.
        KeyError: if a config lacks a required key or its language code is
            not in ``_LANGUAGES``.
    """
    # Layout of the generated file:
    #
    # {
    #   "FAMILY_REGION-DATASET-QUALITY": {
    #     "key": "VOICE_KEY",
    #     "name": "DATASET",
    #     "language": {
    #       "code": "FAMILY_REGION",
    #       "family": "FAMILY",
    #       "region": "REGION",
    #       "name_native": "NATIVE",
    #       "name_english": "ENGLISH",
    #       "country_english": "COUNTRY",
    #     },
    #     "quality": "QUALITY",  // x_low, low, medium, high
    #     "num_speakers": int,
    #     "speaker_id_map": {
    #       "name": int,
    #       ...
    #     },
    #     "files": {
    #       "relative/path/to/file": {
    #         "size_bytes": int,
    #         "md5_digest": str,  // hex
    #       },
    #       ...
    #     },
    #     "aliases": ["alias", ...],
    #   },
    #   ...
    # }
    voices = {}

    for onnx_path in sorted(_REPO_DIR.rglob("*.onnx")):
        voice_dir = onnx_path.parent
        config_path = voice_dir / f"{onnx_path.name}.json"
        with open(config_path, "r", encoding="utf-8") as config_file:
            config = json.load(config_file)

        quality = config["audio"]["quality"]
        dataset = config["dataset"]
        lang_code = config["language"]["code"]
        lang_family, lang_region = lang_code.split("_", maxsplit=1)
        lang_names = _LANGUAGES[lang_code]
        voice_key = f"{lang_code}-{dataset}-{quality}"

        model_card_path = voice_dir / "MODEL_CARD"
        if not model_card_path.exists():
            # Raised explicitly so the check survives ``python -O``; the
            # exception type is kept as AssertionError for compatibility.
            raise AssertionError(f"Missing {model_card_path}")

        aliases: Set[str] = set()
        aliases_path = voice_dir / "ALIASES"
        if aliases_path.exists():
            with open(aliases_path, "r", encoding="utf-8") as aliases_file:
                for line in aliases_file:
                    alias = line.strip()
                    if alias:  # skip blank lines instead of recording ""
                        aliases.add(alias)

        voices[voice_key] = {
            "key": voice_key,
            "name": dataset,
            "language": {
                "code": lang_code,
                "family": lang_family,
                "region": lang_region,
                "name_native": lang_names.native,
                "name_english": lang_names.english,
                "country_english": lang_names.country,
            },
            "quality": quality,
            "num_speakers": config["num_speakers"],
            "speaker_id_map": config.get("speaker_id_map", {}),
            "files": {
                # as_posix() keeps the keys "/"-separated on every platform,
                # so the generated index does not depend on the OS used to
                # build it.
                file_path.relative_to(_REPO_DIR).as_posix(): {
                    "size_bytes": file_path.stat().st_size,
                    "md5_digest": get_file_hash(file_path),
                }
                for file_path in (
                    onnx_path,
                    config_path,
                    model_card_path,
                )
            },
            "aliases": sorted(aliases),
        }

    with open(_REPO_DIR / "voices.json", "w", encoding="utf-8") as voices_file:
        json.dump(voices, voices_file, indent=4, ensure_ascii=False)
304
+
305
+
306
def get_file_hash(path, bytes_per_chunk: int = 8192) -> str:
    """Return the hexadecimal MD5 digest of a file, reading it in chunks.

    Args:
        path: File to hash; anything accepted by ``open``.
        bytes_per_chunk: Maximum number of bytes to read per iteration.

    Returns:
        The MD5 digest of the file contents as a hex string.

    Raises:
        ValueError: if ``bytes_per_chunk`` is 0. A zero-sized read returns no
            data, so the file would be skipped and the digest of empty input
            returned instead of the file's digest.
    """
    if bytes_per_chunk == 0:
        raise ValueError("bytes_per_chunk must be non-zero")

    path_hash = hashlib.md5()
    with open(path, "rb") as path_file:
        # iter(callable, sentinel) keeps calling read() until it returns b"",
        # which is what read() yields at end of file.
        for chunk in iter(lambda: path_file.read(bytes_per_chunk), b""):
            path_hash.update(chunk)

    return path_hash.hexdigest()
316
+
317
+
318
+ # -----------------------------------------------------------------------------
319
+
320
if __name__ == "__main__":
    # Order matters: configs are completed first, then validated, and the
    # index is only regenerated if validation did not raise.
    add_languages()
    run_tests()

    print("Writing voices.json")
    write_voices_json()
ar/ar_JO/kareem/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for kareem (low)
2
+
3
+ * Language: ar_JO (Arabic, Jordan)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/AliMokhammad/arabicttstrain/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Fine-tuned from the U.S. English lessac voice (low quality).
ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2887e9d68b125965c747e1371fa21e1cef19555ea98d0795a0d5d71188b13890
3
+ size 63201294
ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "kareem",
3
+ "audio": {
4
+ "sample_rate": 16000,
5
+ "quality": "low"
6
+ },
7
+ "espeak": {
8
+ "voice": "ar"
9
+ },
10
+ "language": {
11
+ "code": "ar_JO",
12
+ "family": "ar",
13
+ "region": "JO",
14
+ "name_native": "العربية",
15
+ "name_english": "Arabic",
16
+ "country_english": "Jordan"
17
+ },
18
+ "inference": {
19
+ "noise_scale": 0.667,
20
+ "length_scale": 1,
21
+ "noise_w": 0.8
22
+ },
23
+ "phoneme_type": "espeak",
24
+ "phoneme_map": {},
25
+ "phoneme_id_map": {
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "\"": [
33
+ 150
34
+ ],
35
+ "#": [
36
+ 149
37
+ ],
38
+ "$": [
39
+ 2
40
+ ],
41
+ "'": [
42
+ 5
43
+ ],
44
+ "(": [
45
+ 6
46
+ ],
47
+ ")": [
48
+ 7
49
+ ],
50
+ ",": [
51
+ 8
52
+ ],
53
+ "-": [
54
+ 9
55
+ ],
56
+ ".": [
57
+ 10
58
+ ],
59
+ "0": [
60
+ 130
61
+ ],
62
+ "1": [
63
+ 131
64
+ ],
65
+ "2": [
66
+ 132
67
+ ],
68
+ "3": [
69
+ 133
70
+ ],
71
+ "4": [
72
+ 134
73
+ ],
74
+ "5": [
75
+ 135
76
+ ],
77
+ "6": [
78
+ 136
79
+ ],
80
+ "7": [
81
+ 137
82
+ ],
83
+ "8": [
84
+ 138
85
+ ],
86
+ "9": [
87
+ 139
88
+ ],
89
+ ":": [
90
+ 11
91
+ ],
92
+ ";": [
93
+ 12
94
+ ],
95
+ "?": [
96
+ 13
97
+ ],
98
+ "X": [
99
+ 156
100
+ ],
101
+ "^": [
102
+ 1
103
+ ],
104
+ "_": [
105
+ 0
106
+ ],
107
+ "a": [
108
+ 14
109
+ ],
110
+ "b": [
111
+ 15
112
+ ],
113
+ "c": [
114
+ 16
115
+ ],
116
+ "d": [
117
+ 17
118
+ ],
119
+ "e": [
120
+ 18
121
+ ],
122
+ "f": [
123
+ 19
124
+ ],
125
+ "g": [
126
+ 154
127
+ ],
128
+ "h": [
129
+ 20
130
+ ],
131
+ "i": [
132
+ 21
133
+ ],
134
+ "j": [
135
+ 22
136
+ ],
137
+ "k": [
138
+ 23
139
+ ],
140
+ "l": [
141
+ 24
142
+ ],
143
+ "m": [
144
+ 25
145
+ ],
146
+ "n": [
147
+ 26
148
+ ],
149
+ "o": [
150
+ 27
151
+ ],
152
+ "p": [
153
+ 28
154
+ ],
155
+ "q": [
156
+ 29
157
+ ],
158
+ "r": [
159
+ 30
160
+ ],
161
+ "s": [
162
+ 31
163
+ ],
164
+ "t": [
165
+ 32
166
+ ],
167
+ "u": [
168
+ 33
169
+ ],
170
+ "v": [
171
+ 34
172
+ ],
173
+ "w": [
174
+ 35
175
+ ],
176
+ "x": [
177
+ 36
178
+ ],
179
+ "y": [
180
+ 37
181
+ ],
182
+ "z": [
183
+ 38
184
+ ],
185
+ "æ": [
186
+ 39
187
+ ],
188
+ "ç": [
189
+ 40
190
+ ],
191
+ "ð": [
192
+ 41
193
+ ],
194
+ "ø": [
195
+ 42
196
+ ],
197
+ "ħ": [
198
+ 43
199
+ ],
200
+ "ŋ": [
201
+ 44
202
+ ],
203
+ "œ": [
204
+ 45
205
+ ],
206
+ "ǀ": [
207
+ 46
208
+ ],
209
+ "ǁ": [
210
+ 47
211
+ ],
212
+ "ǂ": [
213
+ 48
214
+ ],
215
+ "ǃ": [
216
+ 49
217
+ ],
218
+ "ɐ": [
219
+ 50
220
+ ],
221
+ "ɑ": [
222
+ 51
223
+ ],
224
+ "ɒ": [
225
+ 52
226
+ ],
227
+ "ɓ": [
228
+ 53
229
+ ],
230
+ "ɔ": [
231
+ 54
232
+ ],
233
+ "ɕ": [
234
+ 55
235
+ ],
236
+ "ɖ": [
237
+ 56
238
+ ],
239
+ "ɗ": [
240
+ 57
241
+ ],
242
+ "ɘ": [
243
+ 58
244
+ ],
245
+ "ə": [
246
+ 59
247
+ ],
248
+ "ɚ": [
249
+ 60
250
+ ],
251
+ "ɛ": [
252
+ 61
253
+ ],
254
+ "ɜ": [
255
+ 62
256
+ ],
257
+ "ɞ": [
258
+ 63
259
+ ],
260
+ "ɟ": [
261
+ 64
262
+ ],
263
+ "ɠ": [
264
+ 65
265
+ ],
266
+ "ɡ": [
267
+ 66
268
+ ],
269
+ "ɢ": [
270
+ 67
271
+ ],
272
+ "ɣ": [
273
+ 68
274
+ ],
275
+ "ɤ": [
276
+ 69
277
+ ],
278
+ "ɥ": [
279
+ 70
280
+ ],
281
+ "ɦ": [
282
+ 71
283
+ ],
284
+ "ɧ": [
285
+ 72
286
+ ],
287
+ "ɨ": [
288
+ 73
289
+ ],
290
+ "ɪ": [
291
+ 74
292
+ ],
293
+ "ɫ": [
294
+ 75
295
+ ],
296
+ "ɬ": [
297
+ 76
298
+ ],
299
+ "ɭ": [
300
+ 77
301
+ ],
302
+ "ɮ": [
303
+ 78
304
+ ],
305
+ "ɯ": [
306
+ 79
307
+ ],
308
+ "ɰ": [
309
+ 80
310
+ ],
311
+ "ɱ": [
312
+ 81
313
+ ],
314
+ "ɲ": [
315
+ 82
316
+ ],
317
+ "ɳ": [
318
+ 83
319
+ ],
320
+ "ɴ": [
321
+ 84
322
+ ],
323
+ "ɵ": [
324
+ 85
325
+ ],
326
+ "ɶ": [
327
+ 86
328
+ ],
329
+ "ɸ": [
330
+ 87
331
+ ],
332
+ "ɹ": [
333
+ 88
334
+ ],
335
+ "ɺ": [
336
+ 89
337
+ ],
338
+ "ɻ": [
339
+ 90
340
+ ],
341
+ "ɽ": [
342
+ 91
343
+ ],
344
+ "ɾ": [
345
+ 92
346
+ ],
347
+ "ʀ": [
348
+ 93
349
+ ],
350
+ "ʁ": [
351
+ 94
352
+ ],
353
+ "ʂ": [
354
+ 95
355
+ ],
356
+ "ʃ": [
357
+ 96
358
+ ],
359
+ "ʄ": [
360
+ 97
361
+ ],
362
+ "ʈ": [
363
+ 98
364
+ ],
365
+ "ʉ": [
366
+ 99
367
+ ],
368
+ "ʊ": [
369
+ 100
370
+ ],
371
+ "ʋ": [
372
+ 101
373
+ ],
374
+ "ʌ": [
375
+ 102
376
+ ],
377
+ "ʍ": [
378
+ 103
379
+ ],
380
+ "ʎ": [
381
+ 104
382
+ ],
383
+ "ʏ": [
384
+ 105
385
+ ],
386
+ "ʐ": [
387
+ 106
388
+ ],
389
+ "ʑ": [
390
+ 107
391
+ ],
392
+ "ʒ": [
393
+ 108
394
+ ],
395
+ "ʔ": [
396
+ 109
397
+ ],
398
+ "ʕ": [
399
+ 110
400
+ ],
401
+ "ʘ": [
402
+ 111
403
+ ],
404
+ "ʙ": [
405
+ 112
406
+ ],
407
+ "ʛ": [
408
+ 113
409
+ ],
410
+ "ʜ": [
411
+ 114
412
+ ],
413
+ "ʝ": [
414
+ 115
415
+ ],
416
+ "ʟ": [
417
+ 116
418
+ ],
419
+ "ʡ": [
420
+ 117
421
+ ],
422
+ "ʢ": [
423
+ 118
424
+ ],
425
+ "ʦ": [
426
+ 155
427
+ ],
428
+ "ʰ": [
429
+ 145
430
+ ],
431
+ "ʲ": [
432
+ 119
433
+ ],
434
+ "ˈ": [
435
+ 120
436
+ ],
437
+ "ˌ": [
438
+ 121
439
+ ],
440
+ "ː": [
441
+ 122
442
+ ],
443
+ "ˑ": [
444
+ 123
445
+ ],
446
+ "˞": [
447
+ 124
448
+ ],
449
+ "ˤ": [
450
+ 146
451
+ ],
452
+ "̃": [
453
+ 141
454
+ ],
455
+ "̊": [
456
+ 158
457
+ ],
458
+ "̝": [
459
+ 157
460
+ ],
461
+ "̧": [
462
+ 140
463
+ ],
464
+ "̩": [
465
+ 144
466
+ ],
467
+ "̪": [
468
+ 142
469
+ ],
470
+ "̯": [
471
+ 143
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ],
479
+ "β": [
480
+ 125
481
+ ],
482
+ "ε": [
483
+ 147
484
+ ],
485
+ "θ": [
486
+ 126
487
+ ],
488
+ "χ": [
489
+ 127
490
+ ],
491
+ "ᵻ": [
492
+ 128
493
+ ],
494
+ "↑": [
495
+ 151
496
+ ],
497
+ "↓": [
498
+ 148
499
+ ],
500
+ "ⱱ": [
501
+ 129
502
+ ]
503
+ },
504
+ "num_symbols": 256,
505
+ "num_speakers": 1,
506
+ "speaker_id_map": {},
507
+ "piper_version": "1.0.0"
508
+ }
ar/ar_JO/kareem/low/samples/speaker_0.mp3 ADDED
Binary file (107 kB). View file
 
ar/ar_JO/kareem/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for kareem (medium)
2
+
3
+ * Language: ar_JO (Arabic, Jordan)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/AliMokhammad/arabicttstrain/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Fine-tuned from the U.S. English lessac voice (medium quality).
ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e95cab07b679da603bba17c4dec7ab3111320571964ee95c0379603c086491e
3
+ size 63201294
ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "kareem",
3
+ "audio": {
4
+ "sample_rate": 22050,
5
+ "quality": "medium"
6
+ },
7
+ "espeak": {
8
+ "voice": "ar"
9
+ },
10
+ "language": {
11
+ "code": "ar_JO",
12
+ "family": "ar",
13
+ "region": "JO",
14
+ "name_native": "العربية",
15
+ "name_english": "Arabic",
16
+ "country_english": "Jordan"
17
+ },
18
+ "inference": {
19
+ "noise_scale": 0.667,
20
+ "length_scale": 1,
21
+ "noise_w": 0.8
22
+ },
23
+ "phoneme_type": "espeak",
24
+ "phoneme_map": {},
25
+ "phoneme_id_map": {
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "\"": [
33
+ 150
34
+ ],
35
+ "#": [
36
+ 149
37
+ ],
38
+ "$": [
39
+ 2
40
+ ],
41
+ "'": [
42
+ 5
43
+ ],
44
+ "(": [
45
+ 6
46
+ ],
47
+ ")": [
48
+ 7
49
+ ],
50
+ ",": [
51
+ 8
52
+ ],
53
+ "-": [
54
+ 9
55
+ ],
56
+ ".": [
57
+ 10
58
+ ],
59
+ "0": [
60
+ 130
61
+ ],
62
+ "1": [
63
+ 131
64
+ ],
65
+ "2": [
66
+ 132
67
+ ],
68
+ "3": [
69
+ 133
70
+ ],
71
+ "4": [
72
+ 134
73
+ ],
74
+ "5": [
75
+ 135
76
+ ],
77
+ "6": [
78
+ 136
79
+ ],
80
+ "7": [
81
+ 137
82
+ ],
83
+ "8": [
84
+ 138
85
+ ],
86
+ "9": [
87
+ 139
88
+ ],
89
+ ":": [
90
+ 11
91
+ ],
92
+ ";": [
93
+ 12
94
+ ],
95
+ "?": [
96
+ 13
97
+ ],
98
+ "X": [
99
+ 156
100
+ ],
101
+ "^": [
102
+ 1
103
+ ],
104
+ "_": [
105
+ 0
106
+ ],
107
+ "a": [
108
+ 14
109
+ ],
110
+ "b": [
111
+ 15
112
+ ],
113
+ "c": [
114
+ 16
115
+ ],
116
+ "d": [
117
+ 17
118
+ ],
119
+ "e": [
120
+ 18
121
+ ],
122
+ "f": [
123
+ 19
124
+ ],
125
+ "g": [
126
+ 154
127
+ ],
128
+ "h": [
129
+ 20
130
+ ],
131
+ "i": [
132
+ 21
133
+ ],
134
+ "j": [
135
+ 22
136
+ ],
137
+ "k": [
138
+ 23
139
+ ],
140
+ "l": [
141
+ 24
142
+ ],
143
+ "m": [
144
+ 25
145
+ ],
146
+ "n": [
147
+ 26
148
+ ],
149
+ "o": [
150
+ 27
151
+ ],
152
+ "p": [
153
+ 28
154
+ ],
155
+ "q": [
156
+ 29
157
+ ],
158
+ "r": [
159
+ 30
160
+ ],
161
+ "s": [
162
+ 31
163
+ ],
164
+ "t": [
165
+ 32
166
+ ],
167
+ "u": [
168
+ 33
169
+ ],
170
+ "v": [
171
+ 34
172
+ ],
173
+ "w": [
174
+ 35
175
+ ],
176
+ "x": [
177
+ 36
178
+ ],
179
+ "y": [
180
+ 37
181
+ ],
182
+ "z": [
183
+ 38
184
+ ],
185
+ "æ": [
186
+ 39
187
+ ],
188
+ "ç": [
189
+ 40
190
+ ],
191
+ "ð": [
192
+ 41
193
+ ],
194
+ "ø": [
195
+ 42
196
+ ],
197
+ "ħ": [
198
+ 43
199
+ ],
200
+ "ŋ": [
201
+ 44
202
+ ],
203
+ "œ": [
204
+ 45
205
+ ],
206
+ "ǀ": [
207
+ 46
208
+ ],
209
+ "ǁ": [
210
+ 47
211
+ ],
212
+ "ǂ": [
213
+ 48
214
+ ],
215
+ "ǃ": [
216
+ 49
217
+ ],
218
+ "ɐ": [
219
+ 50
220
+ ],
221
+ "ɑ": [
222
+ 51
223
+ ],
224
+ "ɒ": [
225
+ 52
226
+ ],
227
+ "ɓ": [
228
+ 53
229
+ ],
230
+ "ɔ": [
231
+ 54
232
+ ],
233
+ "ɕ": [
234
+ 55
235
+ ],
236
+ "ɖ": [
237
+ 56
238
+ ],
239
+ "ɗ": [
240
+ 57
241
+ ],
242
+ "ɘ": [
243
+ 58
244
+ ],
245
+ "ə": [
246
+ 59
247
+ ],
248
+ "ɚ": [
249
+ 60
250
+ ],
251
+ "ɛ": [
252
+ 61
253
+ ],
254
+ "ɜ": [
255
+ 62
256
+ ],
257
+ "ɞ": [
258
+ 63
259
+ ],
260
+ "ɟ": [
261
+ 64
262
+ ],
263
+ "ɠ": [
264
+ 65
265
+ ],
266
+ "ɡ": [
267
+ 66
268
+ ],
269
+ "ɢ": [
270
+ 67
271
+ ],
272
+ "ɣ": [
273
+ 68
274
+ ],
275
+ "ɤ": [
276
+ 69
277
+ ],
278
+ "ɥ": [
279
+ 70
280
+ ],
281
+ "ɦ": [
282
+ 71
283
+ ],
284
+ "ɧ": [
285
+ 72
286
+ ],
287
+ "ɨ": [
288
+ 73
289
+ ],
290
+ "ɪ": [
291
+ 74
292
+ ],
293
+ "ɫ": [
294
+ 75
295
+ ],
296
+ "ɬ": [
297
+ 76
298
+ ],
299
+ "ɭ": [
300
+ 77
301
+ ],
302
+ "ɮ": [
303
+ 78
304
+ ],
305
+ "ɯ": [
306
+ 79
307
+ ],
308
+ "ɰ": [
309
+ 80
310
+ ],
311
+ "ɱ": [
312
+ 81
313
+ ],
314
+ "ɲ": [
315
+ 82
316
+ ],
317
+ "ɳ": [
318
+ 83
319
+ ],
320
+ "ɴ": [
321
+ 84
322
+ ],
323
+ "ɵ": [
324
+ 85
325
+ ],
326
+ "ɶ": [
327
+ 86
328
+ ],
329
+ "ɸ": [
330
+ 87
331
+ ],
332
+ "ɹ": [
333
+ 88
334
+ ],
335
+ "ɺ": [
336
+ 89
337
+ ],
338
+ "ɻ": [
339
+ 90
340
+ ],
341
+ "ɽ": [
342
+ 91
343
+ ],
344
+ "ɾ": [
345
+ 92
346
+ ],
347
+ "ʀ": [
348
+ 93
349
+ ],
350
+ "ʁ": [
351
+ 94
352
+ ],
353
+ "ʂ": [
354
+ 95
355
+ ],
356
+ "ʃ": [
357
+ 96
358
+ ],
359
+ "ʄ": [
360
+ 97
361
+ ],
362
+ "ʈ": [
363
+ 98
364
+ ],
365
+ "ʉ": [
366
+ 99
367
+ ],
368
+ "ʊ": [
369
+ 100
370
+ ],
371
+ "ʋ": [
372
+ 101
373
+ ],
374
+ "ʌ": [
375
+ 102
376
+ ],
377
+ "ʍ": [
378
+ 103
379
+ ],
380
+ "ʎ": [
381
+ 104
382
+ ],
383
+ "ʏ": [
384
+ 105
385
+ ],
386
+ "ʐ": [
387
+ 106
388
+ ],
389
+ "ʑ": [
390
+ 107
391
+ ],
392
+ "ʒ": [
393
+ 108
394
+ ],
395
+ "ʔ": [
396
+ 109
397
+ ],
398
+ "ʕ": [
399
+ 110
400
+ ],
401
+ "ʘ": [
402
+ 111
403
+ ],
404
+ "ʙ": [
405
+ 112
406
+ ],
407
+ "ʛ": [
408
+ 113
409
+ ],
410
+ "ʜ": [
411
+ 114
412
+ ],
413
+ "ʝ": [
414
+ 115
415
+ ],
416
+ "ʟ": [
417
+ 116
418
+ ],
419
+ "ʡ": [
420
+ 117
421
+ ],
422
+ "ʢ": [
423
+ 118
424
+ ],
425
+ "ʦ": [
426
+ 155
427
+ ],
428
+ "ʰ": [
429
+ 145
430
+ ],
431
+ "ʲ": [
432
+ 119
433
+ ],
434
+ "ˈ": [
435
+ 120
436
+ ],
437
+ "ˌ": [
438
+ 121
439
+ ],
440
+ "ː": [
441
+ 122
442
+ ],
443
+ "ˑ": [
444
+ 123
445
+ ],
446
+ "˞": [
447
+ 124
448
+ ],
449
+ "ˤ": [
450
+ 146
451
+ ],
452
+ "̃": [
453
+ 141
454
+ ],
455
+ "̊": [
456
+ 158
457
+ ],
458
+ "̝": [
459
+ 157
460
+ ],
461
+ "̧": [
462
+ 140
463
+ ],
464
+ "̩": [
465
+ 144
466
+ ],
467
+ "̪": [
468
+ 142
469
+ ],
470
+ "̯": [
471
+ 143
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ],
479
+ "β": [
480
+ 125
481
+ ],
482
+ "ε": [
483
+ 147
484
+ ],
485
+ "θ": [
486
+ 126
487
+ ],
488
+ "χ": [
489
+ 127
490
+ ],
491
+ "ᵻ": [
492
+ 128
493
+ ],
494
+ "↑": [
495
+ 151
496
+ ],
497
+ "↓": [
498
+ 148
499
+ ],
500
+ "ⱱ": [
501
+ 129
502
+ ]
503
+ },
504
+ "num_symbols": 256,
505
+ "num_speakers": 1,
506
+ "speaker_id_map": {},
507
+ "piper_version": "1.0.0"
508
+ }
ar/ar_JO/kareem/medium/samples/speaker_0.mp3 ADDED
Binary file (147 kB). View file
 
ca/ca_ES/upc_ona/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_ona (medium)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Fine-tuned from the U.S. English lessac voice (medium quality).
ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdb652db8c11a4475527346cf3241cb064d1ba393cf370f3f2ec09a872d118fd
3
+ size 63201294
ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "1.0.0",
484
+ "language": {
485
+ "code": "ca_ES",
486
+ "family": "ca",
487
+ "region": "ES",
488
+ "name_native": "Català",
489
+ "name_english": "Catalan",
490
+ "country_english": "Spain"
491
+ },
492
+ "dataset": "upc_ona"
493
+ }
ca/ca_ES/upc_ona/medium/samples/speaker_0.mp3 ADDED
Binary file (173 kB). View file
 
ca/ca_ES/upc_ona/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ ca-upc_ona-x-low
ca/ca_ES/upc_ona/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_ona (x_low)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13661d26423e0c791823823a5971f4e1aaf644a62e65e0e94d299c0e70560e14
3
+ size 20628813
ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "ca_ES",
413
+ "family": "ca",
414
+ "region": "ES",
415
+ "name_native": "Català",
416
+ "name_english": "Catalan",
417
+ "country_english": "Spain"
418
+ },
419
+ "dataset": "upc_ona"
420
+ }
ca/ca_ES/upc_ona/x_low/samples/speaker_0.mp3 ADDED
Binary file (139 kB). View file
 
ca/ca_ES/upc_pau/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ ca-upc_pau-x-low
ca/ca_ES/upc_pau/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_pau (x_low)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c936a1a78b0a795af3c2422a0f2edb26303c389ff961616902ba12e26b489071
3
+ size 28130791
ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "ca_ES",
413
+ "family": "ca",
414
+ "region": "ES",
415
+ "name_native": "Català",
416
+ "name_english": "Catalan",
417
+ "country_english": "Spain"
418
+ },
419
+ "dataset": "upc_pau"
420
+ }
ca/ca_ES/upc_pau/x_low/samples/speaker_0.mp3 ADDED
Binary file (151 kB). View file
 
cs/cs_CZ/jirka/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for jirka (low)
2
+
3
+ * Language: cs_CZ (Czech, Czech Republic)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (low quality).
cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e73fb306a165b41927d2c9d882f71e9f1c86ac5edf37c5441370a6e4e6ef7d
3
+ size 63201294
cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "low"
5
+ },
6
+ "espeak": {
7
+ "voice": "cs"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̊": [
447
+ 158
448
+ ],
449
+ "̝": [
450
+ 157
451
+ ],
452
+ "̧": [
453
+ 140
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "̪": [
459
+ 142
460
+ ],
461
+ "̯": [
462
+ 143
463
+ ],
464
+ "̺": [
465
+ 152
466
+ ],
467
+ "̻": [
468
+ 153
469
+ ],
470
+ "β": [
471
+ 125
472
+ ],
473
+ "ε": [
474
+ 147
475
+ ],
476
+ "θ": [
477
+ 126
478
+ ],
479
+ "χ": [
480
+ 127
481
+ ],
482
+ "ᵻ": [
483
+ 128
484
+ ],
485
+ "↑": [
486
+ 151
487
+ ],
488
+ "↓": [
489
+ 148
490
+ ],
491
+ "ⱱ": [
492
+ 129
493
+ ]
494
+ },
495
+ "num_symbols": 256,
496
+ "num_speakers": 1,
497
+ "speaker_id_map": {},
498
+ "piper_version": "1.0.0",
499
+ "language": {
500
+ "code": "cs_CZ",
501
+ "family": "cs",
502
+ "region": "CZ",
503
+ "name_native": "Čeština",
504
+ "name_english": "Czech",
505
+ "country_english": "Czech Republic"
506
+ },
507
+ "dataset": "jirka"
508
+ }
cs/cs_CZ/jirka/low/samples/speaker_0.mp3 ADDED
Binary file (96.1 kB). View file
 
cs/cs_CZ/jirka/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for jirka (medium)
2
+
3
+ * Language: cs_CZ (Czech, Czech Republic)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbd5c900acacc8e8cbecd64347abb8de39c00a9d3104bed06fee92e4f319efc8
3
+ size 63201294
cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "cs"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̊": [
447
+ 158
448
+ ],
449
+ "̝": [
450
+ 157
451
+ ],
452
+ "̧": [
453
+ 140
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "̪": [
459
+ 142
460
+ ],
461
+ "̯": [
462
+ 143
463
+ ],
464
+ "̺": [
465
+ 152
466
+ ],
467
+ "̻": [
468
+ 153
469
+ ],
470
+ "β": [
471
+ 125
472
+ ],
473
+ "ε": [
474
+ 147
475
+ ],
476
+ "θ": [
477
+ 126
478
+ ],
479
+ "χ": [
480
+ 127
481
+ ],
482
+ "ᵻ": [
483
+ 128
484
+ ],
485
+ "↑": [
486
+ 151
487
+ ],
488
+ "↓": [
489
+ 148
490
+ ],
491
+ "ⱱ": [
492
+ 129
493
+ ]
494
+ },
495
+ "num_symbols": 256,
496
+ "num_speakers": 1,
497
+ "speaker_id_map": {},
498
+ "piper_version": "1.0.0",
499
+ "language": {
500
+ "code": "cs_CZ",
501
+ "family": "cs",
502
+ "region": "CZ",
503
+ "name_native": "Čeština",
504
+ "name_english": "Czech",
505
+ "country_english": "Czech Republic"
506
+ },
507
+ "dataset": "jirka"
508
+ }
cs/cs_CZ/jirka/medium/samples/speaker_0.mp3 ADDED
Binary file (132 kB). View file
 
cy/cy_GB/gwryw_gogleddol/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for gwryw_gogleddol (medium)
2
+
3
+ * Language: cy_GB (Welsh, Great Britain)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://git.techiaith.bangor.ac.uk/data-porth-technolegau-iaith/corpws-talentau-llais
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
cy/cy_GB/gwryw_gogleddol/medium/cy_GB-gwryw_gogleddol-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d87df65e2c67ddee49829906ec51982fe123d418472731dab696f4dcefe8c6
3
+ size 63511038
cy/cy_GB/gwryw_gogleddol/medium/cy_GB-gwryw_gogleddol-medium.onnx.json ADDED
@@ -0,0 +1,502 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "gwryw_gogleddol",
3
+ "audio": {
4
+ "sample_rate": 22050,
5
+ "quality": "medium"
6
+ },
7
+ "espeak": {
8
+ "voice": "cy"
9
+ },
10
+ "language": {
11
+ "code": "cy_GB",
12
+ "family": "cy",
13
+ "region": "GB",
14
+ "name_native": "Cymraeg",
15
+ "name_english": "Welsh",
16
+ "country_english": "Great Britain"
17
+ },
18
+ "inference": {
19
+ "noise_scale": 0.667,
20
+ "length_scale": 1,
21
+ "noise_w": 0.8
22
+ },
23
+ "phoneme_type": "espeak",
24
+ "phoneme_map": {},
25
+ "phoneme_id_map": {
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "\"": [
33
+ 150
34
+ ],
35
+ "#": [
36
+ 149
37
+ ],
38
+ "$": [
39
+ 2
40
+ ],
41
+ "'": [
42
+ 5
43
+ ],
44
+ "(": [
45
+ 6
46
+ ],
47
+ ")": [
48
+ 7
49
+ ],
50
+ ",": [
51
+ 8
52
+ ],
53
+ "-": [
54
+ 9
55
+ ],
56
+ ".": [
57
+ 10
58
+ ],
59
+ "0": [
60
+ 130
61
+ ],
62
+ "1": [
63
+ 131
64
+ ],
65
+ "2": [
66
+ 132
67
+ ],
68
+ "3": [
69
+ 133
70
+ ],
71
+ "4": [
72
+ 134
73
+ ],
74
+ "5": [
75
+ 135
76
+ ],
77
+ "6": [
78
+ 136
79
+ ],
80
+ "7": [
81
+ 137
82
+ ],
83
+ "8": [
84
+ 138
85
+ ],
86
+ "9": [
87
+ 139
88
+ ],
89
+ ":": [
90
+ 11
91
+ ],
92
+ ";": [
93
+ 12
94
+ ],
95
+ "?": [
96
+ 13
97
+ ],
98
+ "X": [
99
+ 156
100
+ ],
101
+ "^": [
102
+ 1
103
+ ],
104
+ "_": [
105
+ 0
106
+ ],
107
+ "a": [
108
+ 14
109
+ ],
110
+ "b": [
111
+ 15
112
+ ],
113
+ "c": [
114
+ 16
115
+ ],
116
+ "d": [
117
+ 17
118
+ ],
119
+ "e": [
120
+ 18
121
+ ],
122
+ "f": [
123
+ 19
124
+ ],
125
+ "g": [
126
+ 154
127
+ ],
128
+ "h": [
129
+ 20
130
+ ],
131
+ "i": [
132
+ 21
133
+ ],
134
+ "j": [
135
+ 22
136
+ ],
137
+ "k": [
138
+ 23
139
+ ],
140
+ "l": [
141
+ 24
142
+ ],
143
+ "m": [
144
+ 25
145
+ ],
146
+ "n": [
147
+ 26
148
+ ],
149
+ "o": [
150
+ 27
151
+ ],
152
+ "p": [
153
+ 28
154
+ ],
155
+ "q": [
156
+ 29
157
+ ],
158
+ "r": [
159
+ 30
160
+ ],
161
+ "s": [
162
+ 31
163
+ ],
164
+ "t": [
165
+ 32
166
+ ],
167
+ "u": [
168
+ 33
169
+ ],
170
+ "v": [
171
+ 34
172
+ ],
173
+ "w": [
174
+ 35
175
+ ],
176
+ "x": [
177
+ 36
178
+ ],
179
+ "y": [
180
+ 37
181
+ ],
182
+ "z": [
183
+ 38
184
+ ],
185
+ "æ": [
186
+ 39
187
+ ],
188
+ "ç": [
189
+ 40
190
+ ],
191
+ "ð": [
192
+ 41
193
+ ],
194
+ "ø": [
195
+ 42
196
+ ],
197
+ "ħ": [
198
+ 43
199
+ ],
200
+ "ŋ": [
201
+ 44
202
+ ],
203
+ "œ": [
204
+ 45
205
+ ],
206
+ "ǀ": [
207
+ 46
208
+ ],
209
+ "ǁ": [
210
+ 47
211
+ ],
212
+ "ǂ": [
213
+ 48
214
+ ],
215
+ "ǃ": [
216
+ 49
217
+ ],
218
+ "ɐ": [
219
+ 50
220
+ ],
221
+ "ɑ": [
222
+ 51
223
+ ],
224
+ "ɒ": [
225
+ 52
226
+ ],
227
+ "ɓ": [
228
+ 53
229
+ ],
230
+ "ɔ": [
231
+ 54
232
+ ],
233
+ "ɕ": [
234
+ 55
235
+ ],
236
+ "ɖ": [
237
+ 56
238
+ ],
239
+ "ɗ": [
240
+ 57
241
+ ],
242
+ "ɘ": [
243
+ 58
244
+ ],
245
+ "ə": [
246
+ 59
247
+ ],
248
+ "ɚ": [
249
+ 60
250
+ ],
251
+ "ɛ": [
252
+ 61
253
+ ],
254
+ "ɜ": [
255
+ 62
256
+ ],
257
+ "ɞ": [
258
+ 63
259
+ ],
260
+ "ɟ": [
261
+ 64
262
+ ],
263
+ "ɠ": [
264
+ 65
265
+ ],
266
+ "ɡ": [
267
+ 66
268
+ ],
269
+ "ɢ": [
270
+ 67
271
+ ],
272
+ "ɣ": [
273
+ 68
274
+ ],
275
+ "ɤ": [
276
+ 69
277
+ ],
278
+ "ɥ": [
279
+ 70
280
+ ],
281
+ "ɦ": [
282
+ 71
283
+ ],
284
+ "ɧ": [
285
+ 72
286
+ ],
287
+ "ɨ": [
288
+ 73
289
+ ],
290
+ "ɪ": [
291
+ 74
292
+ ],
293
+ "ɫ": [
294
+ 75
295
+ ],
296
+ "ɬ": [
297
+ 76
298
+ ],
299
+ "ɭ": [
300
+ 77
301
+ ],
302
+ "ɮ": [
303
+ 78
304
+ ],
305
+ "ɯ": [
306
+ 79
307
+ ],
308
+ "ɰ": [
309
+ 80
310
+ ],
311
+ "ɱ": [
312
+ 81
313
+ ],
314
+ "ɲ": [
315
+ 82
316
+ ],
317
+ "ɳ": [
318
+ 83
319
+ ],
320
+ "ɴ": [
321
+ 84
322
+ ],
323
+ "ɵ": [
324
+ 85
325
+ ],
326
+ "ɶ": [
327
+ 86
328
+ ],
329
+ "ɸ": [
330
+ 87
331
+ ],
332
+ "ɹ": [
333
+ 88
334
+ ],
335
+ "ɺ": [
336
+ 89
337
+ ],
338
+ "ɻ": [
339
+ 90
340
+ ],
341
+ "ɽ": [
342
+ 91
343
+ ],
344
+ "ɾ": [
345
+ 92
346
+ ],
347
+ "ʀ": [
348
+ 93
349
+ ],
350
+ "ʁ": [
351
+ 94
352
+ ],
353
+ "ʂ": [
354
+ 95
355
+ ],
356
+ "ʃ": [
357
+ 96
358
+ ],
359
+ "ʄ": [
360
+ 97
361
+ ],
362
+ "ʈ": [
363
+ 98
364
+ ],
365
+ "ʉ": [
366
+ 99
367
+ ],
368
+ "ʊ": [
369
+ 100
370
+ ],
371
+ "ʋ": [
372
+ 101
373
+ ],
374
+ "ʌ": [
375
+ 102
376
+ ],
377
+ "ʍ": [
378
+ 103
379
+ ],
380
+ "ʎ": [
381
+ 104
382
+ ],
383
+ "ʏ": [
384
+ 105
385
+ ],
386
+ "ʐ": [
387
+ 106
388
+ ],
389
+ "ʑ": [
390
+ 107
391
+ ],
392
+ "ʒ": [
393
+ 108
394
+ ],
395
+ "ʔ": [
396
+ 109
397
+ ],
398
+ "ʕ": [
399
+ 110
400
+ ],
401
+ "ʘ": [
402
+ 111
403
+ ],
404
+ "ʙ": [
405
+ 112
406
+ ],
407
+ "ʛ": [
408
+ 113
409
+ ],
410
+ "ʜ": [
411
+ 114
412
+ ],
413
+ "ʝ": [
414
+ 115
415
+ ],
416
+ "ʟ": [
417
+ 116
418
+ ],
419
+ "ʡ": [
420
+ 117
421
+ ],
422
+ "ʢ": [
423
+ 118
424
+ ],
425
+ "ʦ": [
426
+ 155
427
+ ],
428
+ "ʰ": [
429
+ 145
430
+ ],
431
+ "ʲ": [
432
+ 119
433
+ ],
434
+ "ˈ": [
435
+ 120
436
+ ],
437
+ "ˌ": [
438
+ 121
439
+ ],
440
+ "ː": [
441
+ 122
442
+ ],
443
+ "ˑ": [
444
+ 123
445
+ ],
446
+ "˞": [
447
+ 124
448
+ ],
449
+ "ˤ": [
450
+ 146
451
+ ],
452
+ "̃": [
453
+ 141
454
+ ],
455
+ "̧": [
456
+ 140
457
+ ],
458
+ "̩": [
459
+ 144
460
+ ],
461
+ "̪": [
462
+ 142
463
+ ],
464
+ "̯": [
465
+ 143
466
+ ],
467
+ "̺": [
468
+ 152
469
+ ],
470
+ "̻": [
471
+ 153
472
+ ],
473
+ "β": [
474
+ 125
475
+ ],
476
+ "ε": [
477
+ 147
478
+ ],
479
+ "θ": [
480
+ 126
481
+ ],
482
+ "χ": [
483
+ 127
484
+ ],
485
+ "ᵻ": [
486
+ 128
487
+ ],
488
+ "↑": [
489
+ 151
490
+ ],
491
+ "↓": [
492
+ 148
493
+ ],
494
+ "ⱱ": [
495
+ 129
496
+ ]
497
+ },
498
+ "num_symbols": 256,
499
+ "num_speakers": 1,
500
+ "speaker_id_map": {},
501
+ "piper_version": "1.0.0"
502
+ }
cy/cy_GB/gwryw_gogleddol/medium/samples/speaker_0.mp3 ADDED
Binary file (114 kB). View file
 
da/da_DK/talesyntese/medium/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ da-nst_talesyntese-medium
da/da_DK/talesyntese/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for talesyntese (medium)
2
+
3
+ * Language: da_DK (Danish, Denmark)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.nb.no/sprakbanken/en/resource-catalogue/oai-nb-no-sbr-21/
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9271efd25f7b8494bbd28d48dd675c8c119daa284f3ee488008935f515f1241
3
+ size 63201294
da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "da"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "0.2.0",
484
+ "language": {
485
+ "code": "da_DK",
486
+ "family": "da",
487
+ "region": "DK",
488
+ "name_native": "Dansk",
489
+ "name_english": "Danish",
490
+ "country_english": "Denmark"
491
+ },
492
+ "dataset": "talesyntese"
493
+ }
da/da_DK/talesyntese/medium/samples/speaker_0.mp3 ADDED
Binary file (72.7 kB). View file
 
de/de_DE/eva_k/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ de-eva_k-x-low
de/de_DE/eva_k/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for eva_k (x_low)
2
+
3
+ * Language: de (German)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.caito.de/2019/01/03/the-m-ailabs-speech-dataset/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88cf290fbfb768bf111330d2e8a46e376b0d85e3423a28bfebbc863a260dad8
3
+ size 20628813
de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "de"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "de_DE",
413
+ "family": "de",
414
+ "region": "DE",
415
+ "name_native": "Deutsch",
416
+ "name_english": "German",
417
+ "country_english": "Germany"
418
+ },
419
+ "dataset": "eva_k"
420
+ }
de/de_DE/eva_k/x_low/samples/speaker_0.mp3 ADDED
Binary file (73.6 kB). View file
 
de/de_DE/karlsson/low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ de-karlsson-low
de/de_DE/karlsson/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for karlsson (low)
2
+
3
+ * Language: de_DE (German, Germany)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.caito.de/2019/01/03/the-m-ailabs-speech-dataset/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English Ryan voice (low quality).