SpireLab committed on
Commit
f15e280
·
verified ·
1 Parent(s): a6aef0c

Initial_commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +22 -0
  2. API_Main.py +108 -0
  3. Dockerfile +27 -0
  4. README.md +169 -3
  5. model_related/Bengali_Female/speakers.pth +3 -0
  6. model_related/Bengali_Male/speakers.pth +3 -0
  7. model_related/Bhojpuri_Female/speakers.pth +3 -0
  8. model_related/Bhojpuri_Male/speakers.pth +3 -0
  9. model_related/Chhattisgarhi_Female/speakers.pth +3 -0
  10. model_related/Chhattisgarhi_Male/speakers.pth +3 -0
  11. model_related/English_Female/speakers.pth +3 -0
  12. model_related/English_Male/speakers.pth +3 -0
  13. model_related/Gujarati_Female/speakers.pth +3 -0
  14. model_related/Gujarati_Male/speakers.pth +3 -0
  15. model_related/Hindi_Female/speakers.pth +3 -0
  16. model_related/Hindi_Male/speakers.pth +3 -0
  17. model_related/Kannada_Female/speakers.pth +3 -0
  18. model_related/Kannada_Male/speakers.pth +3 -0
  19. model_related/Magahi_Female/speakers.pth +3 -0
  20. model_related/Magahi_Male/speakers.pth +3 -0
  21. model_related/Maithili_Female/speakers.pth +3 -0
  22. model_related/Maithili_Male/speakers.pth +3 -0
  23. model_related/Marathi_Female/speakers.pth +3 -0
  24. model_related/Marathi_Male/speakers.pth +3 -0
  25. model_related/Telugu_Female/speakers.pth +3 -0
  26. model_related/Telugu_Male/speakers.pth +3 -0
  27. models/best_model.pth +3 -0
  28. models/config.json +662 -0
  29. models/language_ids.json +13 -0
  30. models/speakers.pth +3 -0
  31. reference_audio/bengali_female.wav +3 -0
  32. reference_audio/bengali_male.wav +3 -0
  33. reference_audio/bhojpuri_female.wav +3 -0
  34. reference_audio/bhojpuri_male.wav +3 -0
  35. reference_audio/chhattisgarhi_female.wav +3 -0
  36. reference_audio/chhattisgarhi_male.wav +3 -0
  37. reference_audio/english_female.wav +3 -0
  38. reference_audio/english_male.wav +3 -0
  39. reference_audio/gujarati_female.wav +3 -0
  40. reference_audio/gujarati_male.wav +3 -0
  41. reference_audio/hindi_female.wav +3 -0
  42. reference_audio/hindi_male.wav +3 -0
  43. reference_audio/kannada_female.wav +3 -0
  44. reference_audio/kannada_male.wav +3 -0
  45. reference_audio/magahi_female.wav +3 -0
  46. reference_audio/magahi_male.wav +3 -0
  47. reference_audio/maithili_female.wav +3 -0
  48. reference_audio/maithili_male.wav +3 -0
  49. reference_audio/marathi_female.wav +3 -0
  50. reference_audio/marathi_male.wav +3 -0
.gitattributes CHANGED
@@ -33,3 +33,25 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ reference_audio/bengali_female.wav filter=lfs diff=lfs merge=lfs -text
37
+ reference_audio/bengali_male.wav filter=lfs diff=lfs merge=lfs -text
38
+ reference_audio/bhojpuri_female.wav filter=lfs diff=lfs merge=lfs -text
39
+ reference_audio/bhojpuri_male.wav filter=lfs diff=lfs merge=lfs -text
40
+ reference_audio/chhattisgarhi_female.wav filter=lfs diff=lfs merge=lfs -text
41
+ reference_audio/chhattisgarhi_male.wav filter=lfs diff=lfs merge=lfs -text
42
+ reference_audio/english_female.wav filter=lfs diff=lfs merge=lfs -text
43
+ reference_audio/english_male.wav filter=lfs diff=lfs merge=lfs -text
44
+ reference_audio/gujarati_female.wav filter=lfs diff=lfs merge=lfs -text
45
+ reference_audio/gujarati_male.wav filter=lfs diff=lfs merge=lfs -text
46
+ reference_audio/hindi_female.wav filter=lfs diff=lfs merge=lfs -text
47
+ reference_audio/hindi_male.wav filter=lfs diff=lfs merge=lfs -text
48
+ reference_audio/kannada_female.wav filter=lfs diff=lfs merge=lfs -text
49
+ reference_audio/kannada_male.wav filter=lfs diff=lfs merge=lfs -text
50
+ reference_audio/magahi_female.wav filter=lfs diff=lfs merge=lfs -text
51
+ reference_audio/magahi_male.wav filter=lfs diff=lfs merge=lfs -text
52
+ reference_audio/maithili_female.wav filter=lfs diff=lfs merge=lfs -text
53
+ reference_audio/maithili_male.wav filter=lfs diff=lfs merge=lfs -text
54
+ reference_audio/marathi_female.wav filter=lfs diff=lfs merge=lfs -text
55
+ reference_audio/marathi_male.wav filter=lfs diff=lfs merge=lfs -text
56
+ reference_audio/telugu_female.wav filter=lfs diff=lfs merge=lfs -text
57
+ reference_audio/telugu_male.wav filter=lfs diff=lfs merge=lfs -text
API_Main.py ADDED
@@ -0,0 +1,108 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import string
3
+ import random
4
+ import uvicorn
5
+ import numpy as np
6
+ from io import BytesIO
7
+ from TTS.api import TTS
8
+ from fastapi import FastAPI
9
+ from scipy.io.wavfile import write
10
+ from fastapi.responses import Response, JSONResponse
11
+
12
+
13
# Run on the GPU when CUDA is usable, otherwise fall back to the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using device: {device}")

# Checkpoint and configuration files, resolved relative to the working directory.
MODEL_PATH = "models/best_model.pth"
CONFIG_PATH = "models/config.json"

print("Loading model")
tts = TTS(model_path=MODEL_PATH, config_path=CONFIG_PATH, progress_bar=False).to(device)

# Sample rate (Hz) used when the synthesized waveform is written out as WAV.
sample_rate = 22050

# Supported language names mapped to the language code handed to the model.
languageCODE = {
    "bhojpuri": "bho",
    "bengali": "bn",
    "english": "en",
    "gujarati": "gu",
    "hindi": "hi",
    "chhattisgarhi": "hne",
    "kannada": "kn",
    "magahi": "mag",
    "maithili": "mai",
    "marathi": "mr",
    "telugu": "te",
}

# "<language>_<gender>" speaker ids mapped to their reference recordings.
# Every supported language has exactly one male and one female reference file.
ref_path = {
    f"{language}_{gender}": f"reference_audio/{language}_{gender}.wav"
    for language in languageCODE
    for gender in ("male", "female")
}

app = FastAPI()
68
@app.get("/Get_Inference")
async def Inference(text : str, lang : str, speaker : str):
    """Synthesize ``text`` and return it as 16-bit PCM WAV audio.

    Args:
        text: Text to synthesize.
        lang: Language name (a key of ``languageCODE``, e.g. ``"hindi"``) or
            language code (a value of ``languageCODE``, e.g. ``"hi"``).
            Matching is case-insensitive.
        speaker: Speaker id (a key of ``ref_path``, e.g. ``"hindi_male"``).
            Matching is case-insensitive.

    Returns:
        A ``Response`` with ``audio/wav`` content on success, or a
        ``JSONResponse`` with status 422 and a ``"comment"`` field when a
        field is empty or the speaker/language is not known.
    """
    if not text or not lang or not speaker:
        return JSONResponse({"comment" : "Missing Field."}, status_code = 422)

    spk = speaker.lower()
    lan = lang.lower()

    if spk not in ref_path:
        return JSONResponse({"comment" : "Speaker not present in the system."}, status_code = 422)

    # Accept either a language name or a language code. The request is
    # rejected only when the value is neither (the previous `or` check
    # rejected every request, because no string is both a name and a code).
    if lan in languageCODE:
        lang_code = languageCODE[lan]
    elif lan in languageCODE.values():
        lang_code = lan
    else:
        return JSONResponse({"comment" : "Language not present in the system."}, status_code = 422)

    # Look up the reference audio with the normalized speaker id that was
    # validated above, so mixed-case input such as "Hindi_Male" works.
    # NOTE(review): tts.tts() is a synchronous call inside an async handler and
    # presumably blocks the event loop while synthesizing - confirm this is OK.
    wav = np.array(tts.tts(text=text, speaker_wav=ref_path[spk], language=lang_code))

    # Peak-normalize into the int16 range; the 0.01 floor avoids dividing by
    # (near) zero for silent output.
    peak = np.max(np.abs(wav)) if wav.size else 0.0
    wav_norm = (wav * (32767 / max(0.01, peak))).astype(np.int16)

    wav_buffer = BytesIO()
    write(wav_buffer, sample_rate, wav_norm)

    # Only validated, lower-cased values go into the header, so user input
    # cannot inject arbitrary header content.
    suffix = "".join(random.choices(string.ascii_letters + string.digits, k=7))
    filename = f"{lan}_{spk}_{suffix}.wav"
    return Response(
        content=wav_buffer.getvalue(),
        media_type="audio/wav",
        headers={"Content-Disposition": f'inline; filename="{filename}"'},
    )
93
+
94
+
95
def start_server():
    """Serve the FastAPI ``app`` with uvicorn on 0.0.0.0:8080 (blocks until shutdown)."""
    print('Starting Server...')

    # Pass the app object instead of the "API_Main:app" import string. When
    # this file is started as a script it runs as ``__main__``; the import
    # string makes uvicorn import ``API_Main`` a second time, which would load
    # the TTS model twice. An app object is supported because neither reload
    # nor multiple workers are requested.
    uvicorn.run(
        app,
        host = "0.0.0.0",
        port = 8080,
        workers = 1,
        log_level="debug",
        reload=False,
    )


if __name__ == "__main__":
    start_server()
Dockerfile ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Image for the TTS inference API (FastAPI + uvicorn, listening on port 8080).
FROM pytorch/pytorch:2.0.1-cuda11.7-cudnn8-runtime

WORKDIR /app

RUN python --version

# System packages: git for cloning the TTS fork, libsndfile1 for audio I/O,
# build-essential for compiling native extensions during pip install.
RUN apt-get update && apt-get install -y \
    git \
    libsndfile1 \
    build-essential \
    && rm -rf /var/lib/apt/lists/*

RUN pip install --no-cache-dir Cython packaging

RUN pip install --no-cache-dir fastapi python-multipart uvicorn

# Install the TTS library used by API_Main.py from source.
RUN git clone https://github.com/PranavDBhat/LIMMITS-24-Coquiai.git /app/LIMMITS-24-Coquiai

RUN cd /app/LIMMITS-24-Coquiai && \
    pip install --no-cache-dir -r requirements.txt

RUN cd /app/LIMMITS-24-Coquiai && \
    pip install --no-cache-dir -e .

COPY ./ ./

# Port the server binds to in API_Main.py.
EXPOSE 8080

# Start the server when a container runs. This must be CMD, not RUN: RUN would
# launch the server during `docker build` and the build would never finish.
CMD [ "python", "API_Main.py" ]
README.md CHANGED
@@ -1,3 +1,169 @@
1
- ---
2
- license: mit
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # SYSPIN Hackathon TTS API Documentation
2
+
3
+ ## Overview
4
+
5
+ This API provides a Text-to-Speech (TTS) service that converts input text into speech audio. It supports multiple Indian languages and offers voice customization through predefined male and female speaker references.
6
+
7
+ ---
8
+
9
+ ## Endpoint: `/Get_Inference`
10
+
11
+ * **Method**: `GET`
12
+ * **Description**: Generates speech audio from the provided text using the specified language and speaker.
13
+
14
+ ### Query Parameters
15
+
16
+ | Parameter | Type | Required | Description |
17
+ | --------- | ------ | -------- | ----------- |
18
+ | `text` | string | Yes | The input text to be converted into speech. |
19
+ | `lang` | string | Yes | The language of the input text, given either as a language name (`bhojpuri`, `bengali`, `english`, `gujarati`, `hindi`, `chhattisgarhi`, `kannada`, `magahi`, `maithili`, `marathi`, `telugu`) or as the corresponding language code listed in the table below. |
20
+ | `speaker` | string | Yes | The desired speaker's voice. Format: `<language>_<gender>`. For example: `hindi_male`, `english_female`. Refer to the available speakers below. |
21
+
22
+ ### Available Speakers
23
+
24
+ | Language | Language code | Male Speaker | Female Speaker |
25
+ | ------------- | ------------- | ------------------- | --------------------- |
26
+ | chhattisgarhi | hne | chhattisgarhi\_male | chhattisgarhi\_female |
27
+ | kannada | kn | kannada\_male | kannada\_female |
28
+ | maithili | mai | maithili\_male | maithili\_female |
29
+ | telugu | te | telugu\_male | telugu\_female |
30
+ | bengali | bn | bengali\_male | bengali\_female |
31
+ | bhojpuri | bho | bhojpuri\_male | bhojpuri\_female |
32
+ | marathi | mr | marathi\_male | marathi\_female |
33
+ | gujarati | gu | gujarati\_male | gujarati\_female |
34
+ | hindi | hi | hindi\_male | hindi\_female |
35
+ | magahi | mag | magahi\_male | magahi\_female |
36
+ | english | en | english\_male | english\_female |
37
+
38
+ ### Responses
39
+
40
+ * **200 OK**: Returns the synthesized speech as WAV audio bytes in the response body.
41
+ * **422 Unprocessable Entity**: Returned when:
42
+
43
+ * Any of the required query parameters (`text`, `lang`, `speaker`) are missing.
44
+ * The specified `lang` is not supported.
45
+ * The specified `speaker` is not available.
46
+
47
+
48
+
49
+ ## Running the Server
50
+
51
+ To start the FastAPI server:
52
+
53
+ ```bash
54
+ docker build -t your_image_name ./
55
+ docker run -d -p 8080:8080 your_image_name
56
+ ```
57
+
58
+ ## Hosting on a GPU
59
+
60
+ To run your FastAPI-based Text-to-Speech (TTS) server inside a Docker container with GPU support, follow these steps:
61
+
62
+ ---
63
+
64
+ ## Prerequisites
65
+
66
+ 1. **NVIDIA GPU**: Ensure your system has an NVIDIA GPU installed.
67
+
68
+ 2. **NVIDIA Drivers**: Install the appropriate NVIDIA drivers for your GPU.
69
+
70
+ 3. **Docker**: Install Docker on your system.
71
+
72
+ 4. **NVIDIA Container Toolkit**: Install the NVIDIA Container Toolkit to enable GPU support in Docker containers.
73
+
74
+ ---
75
+
76
+ ## Installation Steps
77
+
78
+ ### 1. Install NVIDIA Drivers
79
+
80
+ Ensure that the NVIDIA drivers compatible with your GPU are installed on your system.
81
+
82
+ ### 2. Install Docker
83
+
84
+ If Docker is not already installed, you can install it by following the official Docker installation guide for your operating system.
85
+
86
+ ### 3. Install NVIDIA Container Toolkit
87
+
88
+ The NVIDIA Container Toolkit allows Docker containers to utilize the GPU.
89
+
90
+ **For Ubuntu:**
91
+
92
+ ```bash
93
+ # Add the package repositories
94
+ distribution=$(. /etc/os-release;echo $ID$VERSION_ID)
95
+ curl -s -L https://nvidia.github.io/nvidia-docker/gpgkey | sudo apt-key add -
96
+ curl -s -L https://nvidia.github.io/nvidia-docker/$distribution/nvidia-docker.list | \
97
+ sudo tee /etc/apt/sources.list.d/nvidia-docker.list
98
+
99
+ # Update the package lists
100
+ sudo apt-get update
101
+
102
+ # Install the NVIDIA Container Toolkit
103
+ sudo apt-get install -y nvidia-container-toolkit
104
+
105
+ # Restart the Docker daemon to apply changes
106
+ sudo systemctl restart docker
107
+ ```
108
+
109
+ **For other operating systems:** Refer to the [NVIDIA Container Toolkit installation guide](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html) for detailed instructions.
110
+
111
+ ### 4. Verify GPU Access in Docker
112
+
113
+ To confirm that Docker can access your GPU, run the following command:
114
+
115
+ ```bash
116
+ docker run --rm --gpus all nvidia/cuda:12.4.0-base-ubuntu22.04 nvidia-smi
117
+ ```
118
+
119
+
120
+ ## Running Your FastAPI TTS Server with GPU Support
121
+
122
+ Assuming your FastAPI TTS application is containerized and ready to run:
123
+
124
+ 1. **Build Your Docker Image**
125
+
126
+ Navigate to the directory containing your `Dockerfile` and build the Docker image:
127
+
128
+ ```bash
129
+ docker build -t your_image_name .
130
+ ```
131
+
132
+
133
+ 2. **Run the Docker Container with GPU Support**
134
+
135
+ Start the container with GPU access enabled:
136
+
137
+ ```bash
138
+ docker run --gpus all -p 8080:8080 your_image_name
139
+ ```
140
+
141
+ ## Example API Call
142
+
143
+ ```python
144
+ import requests
145
+
146
+ # Define the base URL of your API
147
+ base_url = 'http://localhost:8080/Get_Inference'
148
+
149
+ # Set up the query parameters
150
+ params = {
151
+ 'text': 'Hello world',
152
+ 'lang': 'english',
153
+ 'speaker': 'english_female'
154
+ }
155
+
156
+ # Send the GET request
157
+ response = requests.get(base_url, params=params)
158
+
159
+ # Check if the request was successful
160
+ if response.status_code == 200:
161
+ # Save the audio content to a file
162
+ with open('output.wav', 'wb') as f:
163
+ f.write(response.content)
164
+ print("Audio saved as 'output.wav'")
165
+ else:
166
+ # Print the error message
167
+ print(f"Request failed with status code {response.status_code}")
168
+ print("Response:", response.text)
169
+ ```
model_related/Bengali_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e148bf409293b45ae4fd27d516232fc7f66068f57ffdab78eeb46fcc56fb843
3
+ size 134
model_related/Bengali_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eab41b51845880320ed1fc60145d91f489cd34e2c62623a113ef3c4f56c3bc70
3
+ size 134
model_related/Bhojpuri_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0758d5c58c0c3b2375b876bd3fa319bc9678af9b295d676065b67f93ffd870b8
3
+ size 134
model_related/Bhojpuri_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0b455b4f26bb30aa785aa82cb767268df7ecd7687eebedeb5143ff0c45736e
3
+ size 134
model_related/Chhattisgarhi_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abf3fe4309d65f0f0fbbc2f2b3aff3928482818e32ff69575f50049f27ee6b3d
3
+ size 134
model_related/Chhattisgarhi_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9593a0c877baea24a42f7ab59b49c7a1911e21ad5ba1a5bd1f9f1d736b8ede79
3
+ size 134
model_related/English_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d54951c45b4bc40ec0d4aef4adfdd74c3569b1b8ddb7f278f36cf7bb1f0ebfaa
3
+ size 134
model_related/English_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3977b874607e6e96b95870e9abdf92b1729ca913c29142f9a12bf048cf156bda
3
+ size 134
model_related/Gujarati_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fcfb056e543d6cacebc2fbeee09c7b7dce47073f90b364d2bca4bb74b9c5af9
3
+ size 133
model_related/Gujarati_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7175678de9331b704704942edb94b0047d7389594ca8b474e61cc7d9b9340081
3
+ size 133
model_related/Hindi_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0830857099353182c42e709b2fe7df2ee590cec4a1fc57549fdc1550ce6a7108
3
+ size 134
model_related/Hindi_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:221cd9b955f2fc8adb79675929fe0cc6a49479e774f2e4f160587934fcf3c2e3
3
+ size 134
model_related/Kannada_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14b146984304ef7a2d653ccaa75cfac547075dee2ee8678074a4a1609f050090
3
+ size 133
model_related/Kannada_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e30be0891dea3f5ddd51b2a76c76d5b1e83a6957c21ae1cfd0ada5f9895e12c8
3
+ size 133
model_related/Magahi_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc6765fa7972cd5afaee8f60e38c9413797dbb25b240453a04d29fcf87170ef
3
+ size 134
model_related/Magahi_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd4c2775d591ee6d50519c9456cf62026082ed2574fb2321fa47db3a0844b6c4
3
+ size 134
model_related/Maithili_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa059452f7ff378eb48c086458f6a89bc09d3575ecb4d9b08dd013feff8aa961
3
+ size 134
model_related/Maithili_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57519e60ae79d12606e4856facadbdf83d89fc2473127298ba7f7d22b4a0aad7
3
+ size 134
model_related/Marathi_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f5af64238bfd96d9d451eead5b119fdfdfee524ef636724e94835b295f9a54c
3
+ size 134
model_related/Marathi_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb72a8ee86e5fb9ecda480028e586e11d856c9cd33b168b479c542df581b4c00
3
+ size 133
model_related/Telugu_Female/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c2542da9e6ff71aa439e85d795fefbc02543fda1f6ac92e4f2a1a1e61bbe21
3
+ size 134
model_related/Telugu_Male/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:510e82da22f608832af21a289709f3b801d6659d7cbd12962bb1743319b145f7
3
+ size 134
models/best_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f100ad6435878949e41d458c6c49b401326a8bf4d020fd9cb5aa41b09e4f5d
3
+ size 135
models/config.json ADDED
@@ -0,0 +1,662 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "output_path": "/home1/jesuraj/speechlm/espnet/egs2/LIMMITS_25/speechlm1/downloads",
3
+ "logger_uri": null,
4
+ "run_name": "yourtts_syspin_baseline",
5
+ "project_name": "YourTTS",
6
+ "run_description": "\n - Original YourTTS trained using VCTK dataset\n ",
7
+ "print_step": 50,
8
+ "plot_step": 100,
9
+ "model_param_stats": false,
10
+ "wandb_entity": null,
11
+ "dashboard_logger": "tensorboard",
12
+ "save_on_interrupt": true,
13
+ "log_model_step": 1000,
14
+ "save_step": 10000,
15
+ "save_n_checkpoints": 10,
16
+ "save_checkpoints": true,
17
+ "save_all_best": false,
18
+ "save_best_after": 0,
19
+ "target_loss": "loss_1",
20
+ "print_eval": false,
21
+ "test_delay_epochs": 0,
22
+ "run_eval": true,
23
+ "run_eval_steps": null,
24
+ "distributed_backend": "nccl",
25
+ "distributed_url": "tcp://localhost:54321",
26
+ "mixed_precision": false,
27
+ "precision": "fp16",
28
+ "epochs": 1000,
29
+ "batch_size": 16,
30
+ "eval_batch_size": 16,
31
+ "grad_clip": [
32
+ 1000.0,
33
+ 1000.0
34
+ ],
35
+ "scheduler_after_epoch": true,
36
+ "lr": 0.001,
37
+ "optimizer": "AdamW",
38
+ "optimizer_params": {
39
+ "betas": [
40
+ 0.8,
41
+ 0.99
42
+ ],
43
+ "eps": 1e-09,
44
+ "weight_decay": 0.01
45
+ },
46
+ "lr_scheduler": null,
47
+ "lr_scheduler_params": {},
48
+ "use_grad_scaler": false,
49
+ "allow_tf32": false,
50
+ "cudnn_enable": true,
51
+ "cudnn_deterministic": false,
52
+ "cudnn_benchmark": false,
53
+ "training_seed": 54321,
54
+ "model": "vits",
55
+ "num_loader_workers": 8,
56
+ "num_eval_loader_workers": 0,
57
+ "use_noise_augment": false,
58
+ "audio": {
59
+ "fft_size": 1024,
60
+ "sample_rate": 22050,
61
+ "win_length": 1024,
62
+ "hop_length": 256,
63
+ "num_mels": 80,
64
+ "mel_fmin": 0,
65
+ "mel_fmax": null
66
+ },
67
+ "use_phonemes": false,
68
+ "phonemizer": "espeak",
69
+ "phoneme_language": "en",
70
+ "compute_input_seq_cache": true,
71
+ "text_cleaner": "multilingual_cleaners",
72
+ "enable_eos_bos_chars": false,
73
+ "test_sentences_file": "",
74
+ "phoneme_cache_path": null,
75
+ "characters": {
76
+ "characters_class": "TTS.tts.models.vits.VitsCharacters",
77
+ "vocab_dict": null,
78
+ "pad": "_",
79
+ "eos": "&",
80
+ "bos": "*",
81
+ "blank": null,
82
+ "characters": "\u0cc8\u092f\u2013\u0951\u0905\u0c1f\u0c2c\u0a8f\ufe0f\u0a82\u099dH\u0c9bM\u2026\u0997\u0926\u0cb5\u099f\u00e8\u0c89\u0917\u0c32\u0914\u09b9\u0c4cY\u0aa2\u0a8d\u0c02\u0c4b\u0c13\u09b0\u09a8\u0aac\u09a5\u0a88\u0c93\u0c47\u0936\u0a9b\u0c09\u0919\u0c2a\u0c17\u099e\u0c0b\u098aD\u0986\u0aa1 \u0ccd\u0a95\u0c12\u0aa0RI\u090a\u0cd5\u091f\u0c97\u0c36\u0cb9\u0ab3\u09b7\u0a9e\u0aaa\u09aa\u0c37\u0cb8j\u0a86Wk\u0a81\u0958\u0937\u0cab\u09be\u095eqn\\\u0ca8\u0ce0\u091b\u09aesz\u09a3\u0995\u0c2b\u0aa3\u0aa6\u00bb1\u09bfA5\u0ca5\u092c\u091d\u09c8\u09a2\u0c9e'\u0ac9\u0c16\u0acc\u0c9c\u0ccc\u0924\u0cc0E\u00e0J,\u0c8bu\u0ca2c]\u0cca\u0caa\u099aT\u0a89\u09ce\u0a98\u0ca6\u0987\u0aa5\u0a97\u0cbf\u0c98\u09c7v\u0ca7\u0901\u0c28\u09dc\u0ac2o\u0ab2\u0c40\u0c25\u0c21\u0c82\u095a\u0c95\u09cd\u0ca0\u0c1e#\u095b\u00e9\u0cb2\u0927\u0948\u0cad\u0959\u0ab6\u093e\u0cac\u0abe\u0acdl\u09df\u0ca3\u0abf\u0ab9\u0988\u09ac\u0a96\u095d\u0909\u090b\u0c31\u0993\u0945\u0983\u0c14\u0ab7\u09f0\u0a8a\u0907\u0c19\u0989\u0c48\u09c0\u0955\u094b\u09cb\u0c1d\u0cc1\u0999\u0c99\u0c2f\u0a93\u0931\u099b\u00e2\"9\u0c92\u0c30\u0998\u0c9aZ\u09a0\u0a90\u00ef\u0c07\u092b\u0c1a\u0cbd\u0cc3(\u0cdeOB2\u09b2\u0ac1\u0c3f\u0ac5\u0922\u0c8a\u0ac8\u09af\u091e\u0ac7\u0c06we\u09f7\u0c35\u0c26\u0932hQ\u0c18a\u0c8fi\u0911\u0943\u092a\u0939\u0c4d\u0c41\u09adP3C4\u098f\u0ca4\u09ab\u0c69\u09c1\u0a9f\u0972\u0970\u0a9a\u0c2e\u0941\u0a83\u0c1bx\u09b8\u0c10r\u0cb6\u092e\u0923\u0925\u0c24\u0c33\u0c38\u0cc2\u0930[\u0942\u0949\u0964\u0a85\u0ccb\u0908\u0cbe\u0cbc*\u0caf\u0aab\u0c42\u0a8b\u0a87\u0c27\u0c3e\u09a1X`\u0c0e\u0954\u0aa8\u0ab8\u093f\u0ac3\u09c3N\u0cb3\u0cb0\u0c96\u0981\u095c\u0a9cL\u0c90\u0cb1\u0aad\u0990\u0910\u0920\u0960\u0947\u09c2\u0c66U\u091aV\u09dd\u0c15\u098b\u0c46\u0ac0G\u0921\u0c9d\u0c88\u09bc\u0c22\u093c\u0c9f\u099c\u092df\u0916\u0c05\u0cc7K\u0a9d\u090f\u09a6?\u0c4a\u0902\u0c94\u0ae0\u0c87\u094a\u0a94\u0c0f\u0985\u0c08\u0abc\u0cc67\u0933\u0918\u00f4\u0928@\u0c8e\u091c\u0915\u0c238\u0996\u0cb7t\u0982\u0c43m\u0c03\
u0994\u09cc\u0c39\u0940\u0ab5\u093d\u0a91\u090d\u0c2d\u09b6\u0cae\u0938bF\u0c83\u09a7\u0aa4y\u0935p\u09030{&\u0c0a\u0ca1\u0906\u0ab0\u0acb\u0c86\u094dg\u09a4\u0aae\u0950\u0c1c\u094c\u0aa7\u0934\u0aaf\u0c20\u0c85\u095fSd\u0913",
83
+ "punctuations": "!'(),-.:;? ",
84
+ "phonemes": "",
85
+ "is_unique": true,
86
+ "is_sorted": true
87
+ },
88
+ "add_blank": true,
89
+ "batch_group_size": 32,
90
+ "loss_masking": null,
91
+ "min_audio_len": 1,
92
+ "max_audio_len": Infinity,
93
+ "min_text_len": 1,
94
+ "max_text_len": Infinity,
95
+ "compute_f0": false,
96
+ "compute_energy": false,
97
+ "compute_linear_spec": true,
98
+ "precompute_num_workers": 12,
99
+ "start_by_longest": true,
100
+ "shuffle": false,
101
+ "drop_last": false,
102
+ "datasets": [
103
+ {
104
+ "formatter": "syspin_ml",
105
+ "dataset_name": "",
106
+ "path": "model_related/Bengali_Female",
107
+ "meta_file_train": "SyspinSpeakers/Bengali_Female.tsv",
108
+ "ignored_speakers": null,
109
+ "language": "bn",
110
+ "phonemizer": "",
111
+ "meta_file_val": "",
112
+ "meta_file_attn_mask": ""
113
+ },
114
+ {
115
+ "formatter": "syspin_ml",
116
+ "dataset_name": "",
117
+ "path": "model_related/Chhattisgarhi_Male",
118
+ "meta_file_train": "SyspinSpeakers/Chhattisgarhi_Male.tsv",
119
+ "ignored_speakers": null,
120
+ "language": "hne",
121
+ "phonemizer": "",
122
+ "meta_file_val": "",
123
+ "meta_file_attn_mask": ""
124
+ },
125
+ {
126
+ "formatter": "syspin_ml",
127
+ "dataset_name": "",
128
+ "path": "model_related/Magahi_Male",
129
+ "meta_file_train": "SyspinSpeakers/Magahi_Male.tsv",
130
+ "ignored_speakers": null,
131
+ "language": "mag",
132
+ "phonemizer": "",
133
+ "meta_file_val": "",
134
+ "meta_file_attn_mask": ""
135
+ },
136
+ {
137
+ "formatter": "syspin_ml",
138
+ "dataset_name": "",
139
+ "path": "model_related/Marathi_Male",
140
+ "meta_file_train": "SyspinSpeakers/Marathi_Male.tsv",
141
+ "ignored_speakers": null,
142
+ "language": "mr",
143
+ "phonemizer": "",
144
+ "meta_file_val": "",
145
+ "meta_file_attn_mask": ""
146
+ },
147
+ {
148
+ "formatter": "syspin_ml",
149
+ "dataset_name": "",
150
+ "path": "model_related/Maithili_Female",
151
+ "meta_file_train": "SyspinSpeakers/Maithili_Female.tsv",
152
+ "ignored_speakers": null,
153
+ "language": "mai",
154
+ "phonemizer": "",
155
+ "meta_file_val": "",
156
+ "meta_file_attn_mask": ""
157
+ },
158
+ {
159
+ "formatter": "syspin_ml",
160
+ "dataset_name": "",
161
+ "path": "model_related/English_Male",
162
+ "meta_file_train": "SyspinSpeakers/English_Male.tsv",
163
+ "ignored_speakers": null,
164
+ "language": "en",
165
+ "phonemizer": "",
166
+ "meta_file_val": "",
167
+ "meta_file_attn_mask": ""
168
+ },
169
+ {
170
+ "formatter": "syspin_ml",
171
+ "dataset_name": "",
172
+ "path": "model_related/Chhattisgarhi_Female",
173
+ "meta_file_train": "SyspinSpeakers/Chhattisgarhi_Female.tsv",
174
+ "ignored_speakers": null,
175
+ "language": "hne",
176
+ "phonemizer": "",
177
+ "meta_file_val": "",
178
+ "meta_file_attn_mask": ""
179
+ },
180
+ {
181
+ "formatter": "syspin_ml",
182
+ "dataset_name": "",
183
+ "path": "model_related/Kannada_Male",
184
+ "meta_file_train": "SyspinSpeakers/Kannada_Male.tsv",
185
+ "ignored_speakers": null,
186
+ "language": "kn",
187
+ "phonemizer": "",
188
+ "meta_file_val": "",
189
+ "meta_file_attn_mask": ""
190
+ },
191
+ {
192
+ "formatter": "syspin_ml",
193
+ "dataset_name": "",
194
+ "path": "model_related/Bhojpuri_Female",
195
+ "meta_file_train": "SyspinSpeakers/Bhojpuri_Female.tsv",
196
+ "ignored_speakers": null,
197
+ "language": "bho",
198
+ "phonemizer": "",
199
+ "meta_file_val": "",
200
+ "meta_file_attn_mask": ""
201
+ },
202
+ {
203
+ "formatter": "syspin_ml",
204
+ "dataset_name": "",
205
+ "path": "model_related/Kannada_Female",
206
+ "meta_file_train": "SyspinSpeakers/Kannada_Female.tsv",
207
+ "ignored_speakers": null,
208
+ "language": "kn",
209
+ "phonemizer": "",
210
+ "meta_file_val": "",
211
+ "meta_file_attn_mask": ""
212
+ },
213
+ {
214
+ "formatter": "syspin_ml",
215
+ "dataset_name": "",
216
+ "path": "model_related/Maithili_Male",
217
+ "meta_file_train": "SyspinSpeakers/Maithili_Male.tsv",
218
+ "ignored_speakers": null,
219
+ "language": "mai",
220
+ "phonemizer": "",
221
+ "meta_file_val": "",
222
+ "meta_file_attn_mask": ""
223
+ },
224
+ {
225
+ "formatter": "syspin_ml",
226
+ "dataset_name": "",
227
+ "path": "model_related/Telugu_Male",
228
+ "meta_file_train": "SyspinSpeakers/Telugu_Male.tsv",
229
+ "ignored_speakers": null,
230
+ "language": "te",
231
+ "phonemizer": "",
232
+ "meta_file_val": "",
233
+ "meta_file_attn_mask": ""
234
+ },
235
+ {
236
+ "formatter": "syspin_ml",
237
+ "dataset_name": "",
238
+ "path": "model_related/Telugu_Female",
239
+ "meta_file_train": "SyspinSpeakers/Telugu_Female.tsv",
240
+ "ignored_speakers": null,
241
+ "language": "te",
242
+ "phonemizer": "",
243
+ "meta_file_val": "",
244
+ "meta_file_attn_mask": ""
245
+ },
246
+ {
247
+ "formatter": "syspin_ml",
248
+ "dataset_name": "",
249
+ "path": "model_related/Bengali_Male",
250
+ "meta_file_train": "SyspinSpeakers/Bengali_Male.tsv",
251
+ "ignored_speakers": null,
252
+ "language": "bn",
253
+ "phonemizer": "",
254
+ "meta_file_val": "",
255
+ "meta_file_attn_mask": ""
256
+ },
257
+ {
258
+ "formatter": "syspin_ml",
259
+ "dataset_name": "",
260
+ "path": "model_related/Bhojpuri_Male",
261
+ "meta_file_train": "SyspinSpeakers/Bhojpuri_Male.tsv",
262
+ "ignored_speakers": null,
263
+ "language": "bho",
264
+ "phonemizer": "",
265
+ "meta_file_val": "",
266
+ "meta_file_attn_mask": ""
267
+ },
268
+ {
269
+ "formatter": "syspin_ml",
270
+ "dataset_name": "",
271
+ "path": "model_related/Gujarati_Female",
272
+ "meta_file_train": "SyspinSpeakers/Gujarati_Female.tsv",
273
+ "ignored_speakers": null,
274
+ "language": "gu",
275
+ "phonemizer": "",
276
+ "meta_file_val": "",
277
+ "meta_file_attn_mask": ""
278
+ },
279
+ {
280
+ "formatter": "syspin_ml",
281
+ "dataset_name": "",
282
+ "path": "model_related/Marathi_Female",
283
+ "meta_file_train": "SyspinSpeakers/Marathi_Female.tsv",
284
+ "ignored_speakers": null,
285
+ "language": "mr",
286
+ "phonemizer": "",
287
+ "meta_file_val": "",
288
+ "meta_file_attn_mask": ""
289
+ },
290
+ {
291
+ "formatter": "syspin_ml",
292
+ "dataset_name": "",
293
+ "path": "model_related/Hindi_Female",
294
+ "meta_file_train": "SyspinSpeakers/Hindi_Female.tsv",
295
+ "ignored_speakers": null,
296
+ "language": "hi",
297
+ "phonemizer": "",
298
+ "meta_file_val": "",
299
+ "meta_file_attn_mask": ""
300
+ },
301
+ {
302
+ "formatter": "syspin_ml",
303
+ "dataset_name": "",
304
+ "path": "model_related/Gujarati_Male",
305
+ "meta_file_train": "SyspinSpeakers/Gujarati_Male.tsv",
306
+ "ignored_speakers": null,
307
+ "language": "gu",
308
+ "phonemizer": "",
309
+ "meta_file_val": "",
310
+ "meta_file_attn_mask": ""
311
+ },
312
+ {
313
+ "formatter": "syspin_ml",
314
+ "dataset_name": "",
315
+ "path": "model_related/Hindi_Male",
316
+ "meta_file_train": "SyspinSpeakers/Hindi_Male.tsv",
317
+ "ignored_speakers": null,
318
+ "language": "hi",
319
+ "phonemizer": "",
320
+ "meta_file_val": "",
321
+ "meta_file_attn_mask": ""
322
+ },
323
+ {
324
+ "formatter": "syspin_ml",
325
+ "dataset_name": "",
326
+ "path": "model_related/Magahi_Female",
327
+ "meta_file_train": "SyspinSpeakers/Magahi_Female.tsv",
328
+ "ignored_speakers": null,
329
+ "language": "mag",
330
+ "phonemizer": "",
331
+ "meta_file_val": "",
332
+ "meta_file_attn_mask": ""
333
+ },
334
+ {
335
+ "formatter": "syspin_ml",
336
+ "dataset_name": "",
337
+ "path": "model_related/English_Female",
338
+ "meta_file_train": "SyspinSpeakers/English_Female.tsv",
339
+ "ignored_speakers": null,
340
+ "language": "en",
341
+ "phonemizer": "",
342
+ "meta_file_val": "",
343
+ "meta_file_attn_mask": ""
344
+ }
345
+ ],
346
+ "test_sentences": [
347
+ [
348
+ "\u091c\u093e\u092f\u0915\u0935\u093e\u0921\u0940 \u0927\u0930\u0923\u093e\u0924\u0942\u0928 \u0924\u092c\u094d\u092c\u0932 \u0905\u0921\u0940\u091a \u0924\u0947 \u0924\u0940\u0928 \u0932\u093e\u0916 \u0939\u0947\u0915\u094d\u091f\u0930 \u0936\u0947\u0924\u0940\u091a\u094d\u092f\u093e \u0938\u093f\u0902\u091a\u0928\u093e\u0938\u093e\u0920\u0940 \u092a\u093e\u0923\u0940 \u0938\u094b\u0921\u0932\u0902 \u091c\u093e\u0924\u0902",
349
+ "Marathi_Male",
350
+ null,
351
+ "mr"
352
+ ],
353
+ [
354
+ "\u091c\u093e\u092f\u0915\u0935\u093e\u0921\u0940 \u0927\u0930\u0923\u093e\u0924\u0942\u0928 \u0924\u092c\u094d\u092c\u0932 \u0905\u0921\u0940\u091a \u0924\u0947 \u0924\u0940\u0928 \u0932\u093e\u0916 \u0939\u0947\u0915\u094d\u091f\u0930 \u0936\u0947\u0924\u0940\u091a\u094d\u092f\u093e \u0938\u093f\u0902\u091a\u0928\u093e\u0938\u093e\u0920\u0940 \u092a\u093e\u0923\u0940 \u0938\u094b\u0921\u0932\u0902 \u091c\u093e\u0924\u0902",
355
+ "Marathi_Female",
356
+ null,
357
+ "mr"
358
+ ],
359
+ [
360
+ "\u0915\u0941\u091b \u0938\u092e\u092f \u092c\u093e\u0926 \u0935\u0947 \u0905\u0938\u0939\u093e\u092c\u0947 \u0938\u0941\u095e\u094d\u095e\u093e\u0939 \u0915\u0947 \u0928\u093e\u092e \u0938\u0947 \u092a\u094d\u0930\u0938\u093f\u0926\u094d\u0927 \u0939\u094b \u0917\u090f\u0964",
361
+ "Hindi_Male",
362
+ null,
363
+ "hi"
364
+ ],
365
+ [
366
+ "\u0915\u0941\u091b \u0938\u092e\u092f \u092c\u093e\u0926 \u0935\u0947 \u0905\u0938\u0939\u093e\u092c\u0947 \u0938\u0941\u095e\u094d\u095e\u093e\u0939 \u0915\u0947 \u0928\u093e\u092e \u0938\u0947 \u092a\u094d\u0930\u0938\u093f\u0926\u094d\u0927 \u0939\u094b \u0917\u090f\u0964",
367
+ "Hindi_Female",
368
+ null,
369
+ "hi"
370
+ ],
371
+ [
372
+ "\u0c35\u0c21\u0c4d\u0c30\u0c02\u0c17\u0c3f, \u0c15\u0c4d\u0c37\u0c41\u0c30\u0c15 \u0c35\u0c43\u0c24\u0c4d\u0c24\u0c41\u0c32\u0c32\u0c4b \u0c2a\u0c46\u0c1f\u0c4d\u0c1f\u0c41\u0c2c\u0c21\u0c3f \u0c2a\u0c4d\u0c30\u0c27\u0c3e\u0c28\u0c2e\u0c48 \u0c07\u0c24\u0c30\u0c41\u0c32\u0c41 \u0c15\u0c42\u0c21\u0c3e \u0c08 \u0c35\u0c43\u0c24\u0c4d\u0c24\u0c3f\u0c32\u0c4b \u0c2a\u0c4d\u0c30\u0c35\u0c47\u0c36\u0c3f\u0c02\u0c1a\u0c3f \u0c35\u0c4d\u0c2f\u0c3e\u0c2a\u0c3e\u0c30\u0c02\u0c17\u0c3e \u0c2e\u0c3e\u0c30\u0c4d\u0c1a\u0c47\u0c38\u0c3e\u0c30",
373
+ "Telugu_Female",
374
+ null,
375
+ "te"
376
+ ],
377
+ [
378
+ "\u0c35\u0c21\u0c4d\u0c30\u0c02\u0c17\u0c3f, \u0c15\u0c4d\u0c37\u0c41\u0c30\u0c15 \u0c35\u0c43\u0c24\u0c4d\u0c24\u0c41\u0c32\u0c32\u0c4b \u0c2a\u0c46\u0c1f\u0c4d\u0c1f\u0c41\u0c2c\u0c21\u0c3f \u0c2a\u0c4d\u0c30\u0c27\u0c3e\u0c28\u0c2e\u0c48 \u0c07\u0c24\u0c30\u0c41\u0c32\u0c41 \u0c15\u0c42\u0c21\u0c3e \u0c08 \u0c35\u0c43\u0c24\u0c4d\u0c24\u0c3f\u0c32\u0c4b \u0c2a\u0c4d\u0c30\u0c35\u0c47\u0c36\u0c3f\u0c02\u0c1a\u0c3f \u0c35\u0c4d\u0c2f\u0c3e\u0c2a\u0c3e\u0c30\u0c02\u0c17\u0c3e \u0c2e\u0c3e\u0c30\u0c4d\u0c1a\u0c47\u0c38\u0c3e\u0c30",
379
+ "Telugu_Male",
380
+ null,
381
+ "te"
382
+ ],
383
+ [
384
+ "\u0915\u0932\u0915\u0924\u094d\u0924\u093e \u091c\u093e\u092f \u0916\u093e\u0924\u093f\u0930 \u092a\u0941\u0937\u094d\u092a\u093e \u0939 \u0911\u0928\u0932\u093e\u0907\u0928 \u091f\u093f\u0915\u093f\u091f \u0915\u0930\u0935\u093e\u092f \u0930\u093f\u0939\u093f\u0938 \u0939\u0935\u092f",
385
+ "Chhattisgarhi_Female",
386
+ null,
387
+ "hne"
388
+ ],
389
+ [
390
+ "\u0915\u0932\u0915\u0924\u094d\u0924\u093e \u091c\u093e\u092f \u0916\u093e\u0924\u093f\u0930 \u092a\u0941\u0937\u094d\u092a\u093e \u0939 \u0911\u0928\u0932\u093e\u0907\u0928 \u091f\u093f\u0915\u093f\u091f \u0915\u0930\u0935\u093e\u092f \u0930\u093f\u0939\u093f\u0938 \u0939\u0935\u092f",
391
+ "Chhattisgarhi_Male",
392
+ null,
393
+ "hne"
394
+ ],
395
+ [
396
+ "\u09a8\u09bf\u09ae\u09cd\u09a8\u09cb\u0995\u09cd\u09a4 \u09b8\u09be\u09b0\u09a3\u09bf \u0985\u09ac\u09b2\u09ae\u09cd\u09ac\u09a8\u09c7 \u09ad\u09be\u09b0\u09a4\u09c0\u09df \u09ac\u09cd\u09af\u09ac\u09b8\u09cd\u09a5\u09be\u09df \u099c\u09c0\u09ac\u09bf\u0995\u09be\u09b0 \u0995\u09be\u09a0\u09be\u09ae\u09cb\u09b0 \u098f\u0995\u099f\u09bf \u09aa\u09be\u0987 \u099a\u09bf\u09a4\u09cd\u09b0 \u09a4\u09c8\u09b0\u09bf \u0995\u09b0\u09cb \u0995\u09c3\u09b7\u09bf \u09ad\u09b0\u09cd\u09a4\u09c1\u0995\u09bf\u09b0 \u09aa\u0995\u09cd\u09b7\u09c7 \u098f\u09ac\u0982 \u09ac\u09bf\u09aa\u0995\u09cd\u09b7\u09c7\u09b0 \u09af\u09c1\u0995\u09cd\u09a4\u09bf\u0997\u09c1\u09b2\u09cb \u09aa\u09b0\u09cd\u09af\u09be\u09b2\u09cb\u099a\u09a8\u09be \u0995\u09b0\u09cb\u0964",
397
+ "Bengali_Male",
398
+ null,
399
+ "bn"
400
+ ],
401
+ [
402
+ "\u09a8\u09bf\u09ae\u09cd\u09a8\u09cb\u0995\u09cd\u09a4 \u09b8\u09be\u09b0\u09a3\u09bf \u0985\u09ac\u09b2\u09ae\u09cd\u09ac\u09a8\u09c7 \u09ad\u09be\u09b0\u09a4\u09c0\u09df \u09ac\u09cd\u09af\u09ac\u09b8\u09cd\u09a5\u09be\u09df \u099c\u09c0\u09ac\u09bf\u0995\u09be\u09b0 \u0995\u09be\u09a0\u09be\u09ae\u09cb\u09b0 \u098f\u0995\u099f\u09bf \u09aa\u09be\u0987 \u099a\u09bf\u09a4\u09cd\u09b0 \u09a4\u09c8\u09b0\u09bf \u0995\u09b0\u09cb \u0995\u09c3\u09b7\u09bf \u09ad\u09b0\u09cd\u09a4\u09c1\u0995\u09bf\u09b0 \u09aa\u0995\u09cd\u09b7\u09c7 \u098f\u09ac\u0982 \u09ac\u09bf\u09aa\u0995\u09cd\u09b7\u09c7\u09b0 \u09af\u09c1\u0995\u09cd\u09a4\u09bf\u0997\u09c1\u09b2\u09cb \u09aa\u09b0\u09cd\u09af\u09be\u09b2\u09cb\u099a\u09a8\u09be \u0995\u09b0\u09cb\u0964",
403
+ "Bengali_Female",
404
+ null,
405
+ "bn"
406
+ ],
407
+ [
408
+ "\u0cb9\u0cb8\u0ccd\u0ca6\u0cc7\u0cb5\u0ccd \u0ca8\u0ca6\u0cbf, \u0cb0\u0cbf\u0cb9\u0c82\u0ca1\u0ccd \u0ca8\u0ca6\u0cbf \u0cae\u0ca4\u0ccd\u0ca4\u0cc1 \u0c95\u0ca8\u0ccd\u0cb9\u0cb0\u0ccd \u0ca8\u0ca6\u0cbf\u0c97\u0cb3\u0cc1 \u0cb8\u0cc1\u0cb0\u0ccd\u0c97\u0cc1\u0c9c\u0cbe\u0ca6 \u0cae\u0cc1\u0c96\u0c9c \u0cad\u0cc2\u0cae\u0cbf\u0caf\u0cb2\u0ccd\u0cb2\u0cbf \u0cb9\u0cb0\u0cbf\u0caf\u0cc1\u0ca4\u0ccd\u0ca4\u0cb5\u0cc6.",
409
+ "Kannada_Female",
410
+ null,
411
+ "kn"
412
+ ],
413
+ [
414
+ "\u0cb9\u0cb8\u0ccd\u0ca6\u0cc7\u0cb5\u0ccd \u0ca8\u0ca6\u0cbf, \u0cb0\u0cbf\u0cb9\u0c82\u0ca1\u0ccd \u0ca8\u0ca6\u0cbf \u0cae\u0ca4\u0ccd\u0ca4\u0cc1 \u0c95\u0ca8\u0ccd\u0cb9\u0cb0\u0ccd \u0ca8\u0ca6\u0cbf\u0c97\u0cb3\u0cc1 \u0cb8\u0cc1\u0cb0\u0ccd\u0c97\u0cc1\u0c9c\u0cbe\u0ca6 \u0cae\u0cc1\u0c96\u0c9c \u0cad\u0cc2\u0cae\u0cbf\u0caf\u0cb2\u0ccd\u0cb2\u0cbf \u0cb9\u0cb0\u0cbf\u0caf\u0cc1\u0ca4\u0ccd\u0ca4\u0cb5\u0cc6.",
415
+ "Kannada_Male",
416
+ null,
417
+ "kn"
418
+ ],
419
+ [
420
+ "the russian leader added that the united states and russia have a common interest in preventing nuclear proliferation, in north korea and elsewhere",
421
+ "English_Male",
422
+ null,
423
+ "en"
424
+ ],
425
+ [
426
+ "the russian leader added that the united states and russia have a common interest in preventing nuclear proliferation, in north korea and elsewhere",
427
+ "English_Female",
428
+ null,
429
+ "en"
430
+ ],
431
+ [
432
+ "\u0915\u093e\u0928\u0942\u0928 \u0915\u0947 \u0936\u093e\u0938\u0928 \u0915\u0947 \u0938\u0916\u094d\u0924 \u0905\u0928\u0941\u092a\u093e\u0932\u0928 \u0932\u094b\u0915\u0924\u0902\u0924\u094d\u0930 \u0915\u0947 \u092a\u094d\u0930\u092e\u0941\u0916 \u0906\u0932\u094b\u091a\u0928\u093e \u092e\u0947\u0902 \u0938\u0947 \u090f\u0917\u094b \u0939\u0908",
433
+ "Magahi_Male",
434
+ null,
435
+ "mag"
436
+ ],
437
+ [
438
+ "\u0915\u093e\u0928\u0942\u0928 \u0915\u0947 \u0936\u093e\u0938\u0928 \u0915\u0947 \u0938\u0916\u094d\u0924 \u0905\u0928\u0941\u092a\u093e\u0932\u0928 \u0932\u094b\u0915\u0924\u0902\u0924\u094d\u0930 \u0915\u0947 \u092a\u094d\u0930\u092e\u0941\u0916 \u0906\u0932\u094b\u091a\u0928\u093e \u092e\u0947\u0902 \u0938\u0947 \u090f\u0917\u094b \u0939\u0908",
439
+ "Magahi_Female",
440
+ null,
441
+ "mag"
442
+ ],
443
+ [
444
+ "\u092a\u093e\u0915\u0936\u093e\u0932\u093e \u0938\u0902\u092c\u0902\u0927\u0940 \u0915\u0932\u093e \u092e\u0947\u0902 \u092d\u094b\u091c\u0928 \u092a\u0915\u093e\u092c\u0948 \u0938\u093d \u0932\u092f \u0915\u093d \u0913\u0915\u0930 \u0915\u0941\u0936\u0932 \u092a\u094d\u0930\u092c\u0902\u0927\u0928 \u0914\u0930 \u092d\u093e\u0928\u0938 \u0918\u0930\u093d\u0915 \u0909\u091a\u093f\u0924 \u0930\u0916 \u0930\u0916\u093e\u0935 \u0938\u0947\u0939\u094b \u0936\u093e\u092e\u093f\u0932 \u091b\u0948\u0915",
445
+ "Maithili_Female",
446
+ null,
447
+ "mai"
448
+ ],
449
+ [
450
+ "\u092a\u093e\u0915\u0936\u093e\u0932\u093e \u0938\u0902\u092c\u0902\u0927\u0940 \u0915\u0932\u093e \u092e\u0947\u0902 \u092d\u094b\u091c\u0928 \u092a\u0915\u093e\u092c\u0948 \u0938\u093d \u0932\u092f \u0915\u093d \u0913\u0915\u0930 \u0915\u0941\u0936\u0932 \u092a\u094d\u0930\u092c\u0902\u0927\u0928 \u0914\u0930 \u092d\u093e\u0928\u0938 \u0918\u0930\u093d\u0915 \u0909\u091a\u093f\u0924 \u0930\u0916 \u0930\u0916\u093e\u0935 \u0938\u0947\u0939\u094b \u0936\u093e\u092e\u093f\u0932 \u091b\u0948\u0915",
451
+ "Maithili_Male",
452
+ null,
453
+ "mai"
454
+ ],
455
+ [
456
+ "\u0aa4\u0acd\u0aaf\u0abe\u0ab0\u0aac\u0abe\u0aa6 \u0aaa\u0abe\u0a9f\u0ac0\u0aa6\u0abe\u0ab0\u0acb \u0aa6\u0acd\u0ab5\u0abe\u0ab0\u0abe \u0a85\u0aa8\u0ac7\u0a95 \u0aa8\u0abe\u0aa8\u0abe\u0aae\u0acb\u0a9f\u0abe \u0a95\u0abe\u0ab0\u0acd\u0aaf\u0a95\u0acd\u0ab0\u0aae\u0acb \u0aaf\u0acb\u0a9c\u0ab5\u0abe\u0aae\u0abe\u0a82 \u0a86\u0ab5\u0aa4\u0abe \u0ab9\u0aa4\u0abe \u0a9c\u0acb\u0a95\u0ac7 \u0a8f\u0a95 \u0aaa\u0aa3 \u0a95\u0abe\u0ab0\u0acd\u0aaf\u0a95\u0acd\u0ab0\u0aae\u0aa8\u0ac7 \u0aa4\u0a82\u0aa4\u0acd\u0ab0 \u0aa6\u0acd\u0ab5\u0abe\u0ab0\u0abe \u0aae\u0a82\u0a9c\u0ac2\u0ab0\u0ac0 \u0a86\u0aaa\u0ab5\u0abe\u0aae\u0abe\u0a82 \u0a86\u0ab5\u0aa4\u0ac0 \u0aa8\u0ab9\u0acb\u0aa4",
457
+ "Gujarati_Female",
458
+ null,
459
+ "gu"
460
+ ],
461
+ [
462
+ "\u0aa4\u0acd\u0aaf\u0abe\u0ab0\u0aac\u0abe\u0aa6 \u0aaa\u0abe\u0a9f\u0ac0\u0aa6\u0abe\u0ab0\u0acb \u0aa6\u0acd\u0ab5\u0abe\u0ab0\u0abe \u0a85\u0aa8\u0ac7\u0a95 \u0aa8\u0abe\u0aa8\u0abe\u0aae\u0acb\u0a9f\u0abe \u0a95\u0abe\u0ab0\u0acd\u0aaf\u0a95\u0acd\u0ab0\u0aae\u0acb \u0aaf\u0acb\u0a9c\u0ab5\u0abe\u0aae\u0abe\u0a82 \u0a86\u0ab5\u0aa4\u0abe \u0ab9\u0aa4\u0abe \u0a9c\u0acb\u0a95\u0ac7 \u0a8f\u0a95 \u0aaa\u0aa3 \u0a95\u0abe\u0ab0\u0acd\u0aaf\u0a95\u0acd\u0ab0\u0aae\u0aa8\u0ac7 \u0aa4\u0a82\u0aa4\u0acd\u0ab0 \u0aa6\u0acd\u0ab5\u0abe\u0ab0\u0abe \u0aae\u0a82\u0a9c\u0ac2\u0ab0\u0ac0 \u0a86\u0aaa\u0ab5\u0abe\u0aae\u0abe\u0a82 \u0a86\u0ab5\u0aa4\u0ac0 \u0aa8\u0ab9\u0acb\u0aa4",
463
+ "Gujarati_Male",
464
+ null,
465
+ "gu"
466
+ ],
467
+ [
468
+ "\u090f\u0928\u094d\u091f\u094d\u0930\u093e\u092a\u0940 \u0915\u0902\u092a\u094d\u092f\u0942\u091f\u093f\u0902\u0917 \u092e\u0947\u0902 \u090f\u0928\u094d\u091f\u094d\u0930\u094b\u092a\u0940 \u090a \u0911\u092a\u0930\u0947\u091f\u093f\u0902\u0917 \u0938\u093f\u0938\u094d\u091f\u092e \u0939 \u091c\u0947 \u092a\u0947 \u0938\u0930\u093e \u0915\u094d\u0930\u093f\u092a\u094d\u091f\u094b\u0917\u094d\u0930\u093e\u092b\u093f\u0915 \u092b\u0902\u0915\u094d\u0936\u0928 \u0938\u092c \u0915\u093e\u092e \u0915\u0930\u0947 \u0932\u0947\u0902",
469
+ "Bhojpuri_Male",
470
+ null,
471
+ "bho"
472
+ ],
473
+ [
474
+ "\u090f\u0928\u094d\u091f\u094d\u0930\u093e\u092a\u0940 \u0915\u0902\u092a\u094d\u092f\u0942\u091f\u093f\u0902\u0917 \u092e\u0947\u0902 \u090f\u0928\u094d\u091f\u094d\u0930\u094b\u092a\u0940 \u090a \u0911\u092a\u0930\u0947\u091f\u093f\u0902\u0917 \u0938\u093f\u0938\u094d\u091f\u092e \u0939 \u091c\u0947 \u092a\u0947 \u0938\u0930\u093e \u0915\u094d\u0930\u093f\u092a\u094d\u091f\u094b\u0917\u094d\u0930\u093e\u092b\u093f\u0915 \u092b\u0902\u0915\u094d\u0936\u0928 \u0938\u092c \u0915\u093e\u092e \u0915\u0930\u0947 \u0932\u0947\u0902",
475
+ "Bhojpuri_Female",
476
+ null,
477
+ "bho"
478
+ ]
479
+ ],
480
+ "eval_split_max_size": 256,
481
+ "eval_split_size": 0.01,
482
+ "use_speaker_weighted_sampler": false,
483
+ "speaker_weighted_sampler_alpha": 1.0,
484
+ "use_language_weighted_sampler": false,
485
+ "language_weighted_sampler_alpha": 1.0,
486
+ "use_length_weighted_sampler": false,
487
+ "length_weighted_sampler_alpha": 1.0,
488
+ "model_args": {
489
+ "num_chars": 444,
490
+ "out_channels": 513,
491
+ "spec_segment_size": 32,
492
+ "hidden_channels": 192,
493
+ "hidden_channels_ffn_text_encoder": 768,
494
+ "num_heads_text_encoder": 2,
495
+ "num_layers_text_encoder": 10,
496
+ "kernel_size_text_encoder": 3,
497
+ "dropout_p_text_encoder": 0.1,
498
+ "dropout_p_duration_predictor": 0.5,
499
+ "kernel_size_posterior_encoder": 5,
500
+ "dilation_rate_posterior_encoder": 1,
501
+ "num_layers_posterior_encoder": 16,
502
+ "kernel_size_flow": 5,
503
+ "dilation_rate_flow": 1,
504
+ "num_layers_flow": 4,
505
+ "resblock_type_decoder": "2",
506
+ "resblock_kernel_sizes_decoder": [
507
+ 3,
508
+ 7,
509
+ 11
510
+ ],
511
+ "resblock_dilation_sizes_decoder": [
512
+ [
513
+ 1,
514
+ 3,
515
+ 5
516
+ ],
517
+ [
518
+ 1,
519
+ 3,
520
+ 5
521
+ ],
522
+ [
523
+ 1,
524
+ 3,
525
+ 5
526
+ ]
527
+ ],
528
+ "upsample_rates_decoder": [
529
+ 8,
530
+ 8,
531
+ 2,
532
+ 2
533
+ ],
534
+ "upsample_initial_channel_decoder": 512,
535
+ "upsample_kernel_sizes_decoder": [
536
+ 16,
537
+ 16,
538
+ 4,
539
+ 4
540
+ ],
541
+ "periods_multi_period_discriminator": [
542
+ 2,
543
+ 3,
544
+ 5,
545
+ 7,
546
+ 11
547
+ ],
548
+ "use_sdp": true,
549
+ "noise_scale": 1.0,
550
+ "inference_noise_scale": 0.667,
551
+ "length_scale": 1.0,
552
+ "noise_scale_dp": 1.0,
553
+ "inference_noise_scale_dp": 1.0,
554
+ "max_inference_len": null,
555
+ "init_discriminator": true,
556
+ "use_spectral_norm_disriminator": false,
557
+ "use_speaker_embedding": false,
558
+ "num_speakers": 0,
559
+ "speakers_file": "/app/models/speakers.pth",
560
+ "d_vector_file": [
561
+ "model_related/Bengali_Female/speakers.pth",
562
+ "model_related/Chhattisgarhi_Male/speakers.pth",
563
+ "model_related/Magahi_Male/speakers.pth",
564
+ "model_related/Marathi_Male/speakers.pth",
565
+ "model_related/Maithili_Female/speakers.pth",
566
+ "model_related/English_Male/speakers.pth",
567
+ "model_related/Chhattisgarhi_Female/speakers.pth",
568
+ "model_related/Kannada_Male/speakers.pth",
569
+ "model_related/Bhojpuri_Female/speakers.pth",
570
+ "model_related/Kannada_Female/speakers.pth",
571
+ "model_related/Maithili_Male/speakers.pth",
572
+ "model_related/Telugu_Male/speakers.pth",
573
+ "model_related/Telugu_Female/speakers.pth",
574
+ "model_related/Bengali_Male/speakers.pth",
575
+ "model_related/Bhojpuri_Male/speakers.pth",
576
+ "model_related/Gujarati_Female/speakers.pth",
577
+ "model_related/Marathi_Female/speakers.pth",
578
+ "model_related/Hindi_Female/speakers.pth",
579
+ "model_related/Gujarati_Male/speakers.pth",
580
+ "model_related/Hindi_Male/speakers.pth",
581
+ "model_related/Magahi_Female/speakers.pth",
582
+ "model_related/English_Female/speakers.pth"
583
+ ],
584
+ "speaker_embedding_channels": 256,
585
+ "use_d_vector_file": true,
586
+ "d_vector_dim": 512,
587
+ "detach_dp_input": true,
588
+ "use_language_embedding": true,
589
+ "embedded_language_dim": 4,
590
+ "num_languages": 11,
591
+ "language_ids_file": "/app/models/language_ids.json",
592
+ "use_speaker_encoder_as_loss": false,
593
+ "speaker_encoder_config_path": "https://github.com/coqui-ai/TTS/releases/download/speaker_encoder_model/config_se.json",
594
+ "speaker_encoder_model_path": "https://github.com/coqui-ai/TTS/releases/download/speaker_encoder_model/model_se.pth.tar",
595
+ "condition_dp_on_speaker": true,
596
+ "freeze_encoder": false,
597
+ "freeze_DP": false,
598
+ "freeze_PE": false,
599
+ "freeze_flow_decoder": false,
600
+ "freeze_waveform_decoder": false,
601
+ "encoder_sample_rate": null,
602
+ "interpolate_z": true,
603
+ "reinit_DP": false,
604
+ "reinit_text_encoder": false
605
+ },
606
+ "lr_gen": 0.0002,
607
+ "lr_disc": 0.0002,
608
+ "lr_scheduler_gen": "ExponentialLR",
609
+ "lr_scheduler_gen_params": {
610
+ "gamma": 0.999875,
611
+ "last_epoch": -1
612
+ },
613
+ "lr_scheduler_disc": "ExponentialLR",
614
+ "lr_scheduler_disc_params": {
615
+ "gamma": 0.999875,
616
+ "last_epoch": -1
617
+ },
618
+ "kl_loss_alpha": 1.0,
619
+ "disc_loss_alpha": 1.0,
620
+ "gen_loss_alpha": 1.0,
621
+ "feat_loss_alpha": 1.0,
622
+ "mel_loss_alpha": 45.0,
623
+ "dur_loss_alpha": 1.0,
624
+ "speaker_encoder_loss_alpha": 9.0,
625
+ "return_wav": true,
626
+ "use_weighted_sampler": true,
627
+ "weighted_sampler_attrs": {},
628
+ "weighted_sampler_multipliers": {},
629
+ "r": 1,
630
+ "num_speakers": 0,
631
+ "use_speaker_embedding": false,
632
+ "speakers_file": "/app/models/speakers.pth",
633
+ "speaker_embedding_channels": 256,
634
+ "language_ids_file": "/app/models/language_ids.json",
635
+ "use_language_embedding": true,
636
+ "use_d_vector_file": true,
637
+ "d_vector_file": [
638
+ "model_related/Bengali_Female/speakers.pth",
639
+ "model_related/Chhattisgarhi_Male/speakers.pth",
640
+ "model_related/Magahi_Male/speakers.pth",
641
+ "model_related/Marathi_Male/speakers.pth",
642
+ "model_related/Maithili_Female/speakers.pth",
643
+ "model_related/English_Male/speakers.pth",
644
+ "model_related/Chhattisgarhi_Female/speakers.pth",
645
+ "model_related/Kannada_Male/speakers.pth",
646
+ "model_related/Bhojpuri_Female/speakers.pth",
647
+ "model_related/Kannada_Female/speakers.pth",
648
+ "model_related/Maithili_Male/speakers.pth",
649
+ "model_related/Telugu_Male/speakers.pth",
650
+ "model_related/Telugu_Female/speakers.pth",
651
+ "model_related/Bengali_Male/speakers.pth",
652
+ "model_related/Bhojpuri_Male/speakers.pth",
653
+ "model_related/Gujarati_Female/speakers.pth",
654
+ "model_related/Marathi_Female/speakers.pth",
655
+ "model_related/Hindi_Female/speakers.pth",
656
+ "model_related/Gujarati_Male/speakers.pth",
657
+ "model_related/Hindi_Male/speakers.pth",
658
+ "model_related/Magahi_Female/speakers.pth",
659
+ "model_related/English_Female/speakers.pth"
660
+ ],
661
+ "d_vector_dim": 512
662
+ }
models/language_ids.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bho": 0,
3
+ "bn": 1,
4
+ "en": 2,
5
+ "gu": 3,
6
+ "hi": 4,
7
+ "hne": 5,
8
+ "kn": 6,
9
+ "mag": 7,
10
+ "mai": 8,
11
+ "mr": 9,
12
+ "te": 10
13
+ }
models/speakers.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d56ede16a2fa6a1575002ce54919618748a8280c7ae529ebaf2767505016128
3
+ size 129
reference_audio/bengali_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f84af0a054bc5ba740d34a1e66bef87351f44ab1f3d512cec8f810a99b7ab6
3
+ size 297516
reference_audio/bengali_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:930dc0c17d6af6fa1985918e6e0bf56f88905cab46c3ec186c11af4f1096cae1
3
+ size 268332
reference_audio/bhojpuri_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01dabe9e3e1b3dbbf41d84c7c4d6e9fe852ae14e585d4d5fe969669681963e90
3
+ size 248108
reference_audio/bhojpuri_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd2aa4e3b4b29fb21c5327abbbf469afab8bc0d3844407d20142f0d00dd4a2a1
3
+ size 291372
reference_audio/chhattisgarhi_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2c3745dd76f07c36bcc4787e1fde6616bf206d79b5802e74743ea240cab8705
3
+ size 271916
reference_audio/chhattisgarhi_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e701dcc6ac9438b40009e3f5ae5514c29724b5ef65fe4401358e8bddc25c7bf
3
+ size 259884
reference_audio/english_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f6aa5f72c8810df348f05b63561a94e65b3f56211b571680be0aa2379502a8e
3
+ size 291884
reference_audio/english_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:293fa875e14b220dcfa2f634801a814c78a306205c398a4b5f06fd1291a8cf59
3
+ size 114732
reference_audio/gujarati_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed3f3dcdb4b8a593c42bee2b85ac5c37fb2f182b91ec2dbef7efcef3af42b7c2
3
+ size 1033260
reference_audio/gujarati_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0de01b4153576afdb1b7de4e72a299737f44c8ce67f73882e0278afaec90bcb
3
+ size 206892
reference_audio/hindi_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b629d66b52a63c3c9aeafeb1b19abf701969ce3d40ad0fb3019cee3d5b6cd167
3
+ size 252460
reference_audio/hindi_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9907ea9933f7700a72a852109c9e958ef57555f3d49de80ac8b4e0fe35a0338
3
+ size 215084
reference_audio/kannada_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8a2c9c19255e246b78aa968c3c3dcc01942e42f0e4bb10cfe31265b4a0ab698
3
+ size 638508
reference_audio/kannada_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0fada49154dae650adb4fbea0c83f16222eecd83591d11af55e8d68de91fba0
3
+ size 203308
reference_audio/magahi_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1cbb361ed678f9e37d7f54d763014c98d2935d3e371e7a8e327684029af7cea
3
+ size 212524
reference_audio/magahi_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d7a67d7379cb4c565e26b8c3b3b02e27c6c4df3577209684a732ac3c1ec1e7
3
+ size 229932
reference_audio/maithili_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4abbc686a785b50fe403cde53abc0993e0af0ccce899eb2bc5721807a20b08d0
3
+ size 124460
reference_audio/maithili_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0de0229bb6358008f6cafc02019d00fd820240a5b8c1314e8b67985ccd3215d1
3
+ size 198700
reference_audio/marathi_female.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4252210496fced3d6c744ec938b3bb235ba8d4ea7ead9174e883cf7b23d251b0
3
+ size 401452
reference_audio/marathi_male.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2091c5bdeafdba6166db62a64f2468453bc9249d1a1076b693c90c456baf03b
3
+ size 437292