Roxxas96 committed on
Commit
55c9644
·
unverified ·
1 Parent(s): daa9219

feat: add dataset generator

Browse files

Signed-off-by: Alexandre Gomez <gomez.a.corneille@gmail.com>

dataset-generator.ipynb ADDED
@@ -0,0 +1,138 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": null,
6
+ "metadata": {},
7
+ "outputs": [],
8
+ "source": [
9
+ "import os\n",
10
+ "import torch\n",
11
+ "\n",
12
+ "device = torch.device(\"cpu\")\n",
13
+ "torch.set_num_threads(4)\n",
14
+ "local_file = \"model.pt\"\n",
15
+ "\n",
16
+ "if not os.path.isfile(local_file):\n",
17
+ " torch.hub.download_url_to_file(\"https://models.silero.ai/models/tts/fr/v3_fr.pt\",\n",
18
+ " local_file) \n",
19
+ "\n",
20
+ "model = torch.package.PackageImporter(local_file).load_pickle(\"tts_models\", \"model\")\n",
21
+ "model.to(device)\n",
22
+ "\n",
23
+ "sample_rate = 48000\n",
24
+ "num_files = 10\n",
25
+ "texts = [\n",
26
+ " # Dis Cyril\n",
27
+ " {\n",
28
+ " \"text\": \"Dis Cyril\",\n",
29
+ " \"yes\": True\n",
30
+ " },\n",
31
+ " # Dis Cyril\n",
32
+ " {\n",
33
+ " \"text\": \"Dis Cyril\",\n",
34
+ " \"yes\": True\n",
35
+ " },\n",
36
+ " # Dis Cyril\n",
37
+ " {\n",
38
+ " \"text\": \"Dis Cyril\",\n",
39
+ " \"yes\": True\n",
40
+ " },\n",
41
+ " # Dis Cyril\n",
42
+ " {\n",
43
+ " \"text\": \"Dis Cyril\",\n",
44
+ " \"yes\": True\n",
45
+ " },\n",
46
+ " # Dis Cyril\n",
47
+ " {\n",
48
+ " \"text\": \"Dis Cyril\",\n",
49
+ " \"yes\": True\n",
50
+ " },\n",
51
+ " # Comment tu t'appelles ?\n",
52
+ " {\n",
53
+ " \"text\": \"Comment tu t'appelles ?\",\n",
54
+ " \"yes\": False\n",
55
+ " },\n",
56
+ " # Quel est ton nom ?\n",
57
+ " {\n",
58
+ " \"text\": \"Quel est ton nom ?\",\n",
59
+ " \"yes\": False\n",
60
+ " },\n",
61
+ " # Tu t'appelles comment ?\n",
62
+ " {\n",
63
+ " \"text\": \"Tu t'appelles comment ?\",\n",
64
+ " \"yes\": False\n",
65
+ " },\n",
66
+ " # Comment dois-je t'appeler ?\n",
67
+ " {\n",
68
+ " \"text\": \"Comment dois-je t'appeler ?\",\n",
69
+ " \"yes\": False\n",
70
+ " },\n",
71
+ " # Peux-tu me dire ton nom ?\n",
72
+ " {\n",
73
+ " \"text\": \"Peux-tu me dire ton nom ?\",\n",
74
+ " \"yes\": False\n",
75
+ " },\n",
76
+ " # Quelle heure est-il ?\n",
77
+ " {\n",
78
+ " \"text\": \"Quelle heure est-il ?\",\n",
79
+ " \"yes\": False\n",
80
+ " },\n",
81
+ " # Peux-tu me donner la météo de demain ?\n",
82
+ " {\n",
83
+ " \"text\": \"Peux-tu me donner la météo de demain ?\",\n",
84
+ " \"yes\": False\n",
85
+ " },\n",
86
+ " # Comment cuisiner une omelette ?\n",
87
+ " {\n",
88
+ " \"text\": \"Comment cuisiner une omelette ?\",\n",
89
+ " \"yes\": False\n",
90
+ " },\n",
91
+ " # Raconte-moi une blague.\n",
92
+ " {\n",
93
+ " \"text\": \"Raconte-moi une blague.\",\n",
94
+ " \"yes\": False\n",
95
+ " },\n",
96
+ " # Quel est le sens de la vie ?\n",
97
+ " {\n",
98
+ " \"text\": \"Quel est le sens de la vie ?\",\n",
99
+ " \"yes\": False\n",
100
+ " },\n",
101
+ " # Comment se rendre à Paris depuis Lyon ?\n",
102
+ " {\n",
103
+ " \"text\": \"Comment se rendre à Paris depuis Lyon ?\",\n",
104
+ " \"yes\": False\n",
105
+ " },\n",
106
+ " # Quels sont les meilleurs films de 2020 ?\n",
107
+ " {\n",
108
+ " \"text\": \"Quels sont les meilleurs films de 2020 ?\",\n",
109
+ " \"yes\": False\n",
110
+ " },\n",
111
+ "]\n",
112
+ "speaker = \"random\"\n",
113
+ "\n",
114
+ "for index, entry in enumerate(texts):\n",
115
+ "    for i in range(num_files):\n",
116
+ "        # Each entry is a dict: synthesize its \"text\" field, not the dict itself.\n",
117
+ "        model.save_wav(text=entry[\"text\"],\n",
118
+ "                       speaker=speaker,\n",
119
+ "                       sample_rate=sample_rate)\n",
120
+ "        # Move test.wav into yes/ or no/ per the entry's \"yes\" label, under a unique number.\n",
121
+ "        os.rename('test.wav', f'../dataset/{\"yes\" if entry[\"yes\"] else \"no\"}/{i + index * num_files}.wav')"
122
+ ]
123
+ }
124
+ ],
125
+ "metadata": {
126
+ "kernelspec": {
127
+ "display_name": ".venv",
128
+ "language": "python",
129
+ "name": "python3"
130
+ },
131
+ "language_info": {
132
+ "name": "python",
133
+ "version": "3.12.1"
134
+ }
135
+ },
136
+ "nbformat": 4,
137
+ "nbformat_minor": 2
138
+ }
dataset/no/.gitkeep ADDED
File without changes
dataset/yes/.gitkeep ADDED
File without changes