lighteternal commited on
Commit
626bc84
1 Parent(s): 75ed774

Added new model weights and info, trained on CV and CSS

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .ipynb_checkpoints/ASR_Inference-checkpoint.ipynb +498 -135
  2. ASR_Inference.ipynb +498 -135
  3. README.md +8 -6
  4. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429242.mp3 +0 -0
  5. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429243.mp3 +0 -0
  6. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429245.mp3 +0 -0
  7. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429246.mp3 +0 -0
  8. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429247.mp3 +0 -0
  9. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429253.mp3 +0 -0
  10. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429254.mp3 +0 -0
  11. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429255.mp3 +0 -0
  12. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429256.mp3 +0 -0
  13. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429257.mp3 +0 -0
  14. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429268.mp3 +0 -0
  15. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429269.mp3 +0 -0
  16. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429270.mp3 +0 -0
  17. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429271.mp3 +0 -0
  18. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429272.mp3 +0 -0
  19. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429278.mp3 +0 -0
  20. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429280.mp3 +0 -0
  21. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429283.mp3 +0 -0
  22. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429285.mp3 +0 -0
  23. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429288.mp3 +0 -0
  24. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429298.mp3 +0 -0
  25. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429299.mp3 +0 -0
  26. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429300.mp3 +0 -0
  27. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429301.mp3 +0 -0
  28. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429302.mp3 +0 -0
  29. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429308.mp3 +0 -0
  30. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429309.mp3 +0 -0
  31. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429310.mp3 +0 -0
  32. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429312.mp3 +0 -0
  33. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429314.mp3 +0 -0
  34. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429328.mp3 +0 -0
  35. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429329.mp3 +0 -0
  36. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429330.mp3 +0 -0
  37. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429331.mp3 +0 -0
  38. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429332.mp3 +0 -0
  39. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429407.mp3 +0 -0
  40. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429408.mp3 +0 -0
  41. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429410.mp3 +0 -0
  42. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429411.mp3 +0 -0
  43. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429412.mp3 +0 -0
  44. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429418.mp3 +0 -0
  45. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429419.mp3 +0 -0
  46. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429420.mp3 +0 -0
  47. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429421.mp3 +0 -0
  48. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429422.mp3 +0 -0
  49. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429438.mp3 +0 -0
  50. cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429439.mp3 +0 -0
.ipynb_checkpoints/ASR_Inference-checkpoint.ipynb CHANGED
@@ -5,8 +5,8 @@
5
  "execution_count": 1,
6
  "metadata": {
7
  "ExecuteTime": {
8
- "end_time": "2021-03-14T19:32:40.765119Z",
9
- "start_time": "2021-03-14T19:32:39.314790Z"
10
  }
11
  },
12
  "outputs": [
@@ -36,8 +36,8 @@
36
  "execution_count": 2,
37
  "metadata": {
38
  "ExecuteTime": {
39
- "end_time": "2021-03-14T19:32:40.774860Z",
40
- "start_time": "2021-03-14T19:32:40.771235Z"
41
  }
42
  },
43
  "outputs": [],
@@ -75,11 +75,11 @@
75
  },
76
  {
77
  "cell_type": "code",
78
- "execution_count": 3,
79
  "metadata": {
80
  "ExecuteTime": {
81
- "end_time": "2021-03-14T19:32:49.565850Z",
82
- "start_time": "2021-03-14T19:32:41.891601Z"
83
  }
84
  },
85
  "outputs": [
@@ -98,11 +98,11 @@
98
  },
99
  {
100
  "cell_type": "code",
101
- "execution_count": 4,
102
  "metadata": {
103
  "ExecuteTime": {
104
- "end_time": "2021-03-14T19:33:03.514113Z",
105
- "start_time": "2021-03-14T19:33:00.953049Z"
106
  }
107
  },
108
  "outputs": [
@@ -110,8 +110,120 @@
110
  "name": "stderr",
111
  "output_type": "stream",
112
  "text": [
113
- "Using custom data configuration el-afd0a157f05ee080\n",
114
- "Reusing dataset common_voice (/home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
  ]
116
  }
117
  ],
@@ -121,11 +233,11 @@
121
  },
122
  {
123
  "cell_type": "code",
124
- "execution_count": 5,
125
  "metadata": {
126
  "ExecuteTime": {
127
- "end_time": "2021-03-14T19:33:03.528699Z",
128
- "start_time": "2021-03-14T19:33:03.525034Z"
129
  }
130
  },
131
  "outputs": [],
@@ -135,19 +247,33 @@
135
  },
136
  {
137
  "cell_type": "code",
138
- "execution_count": 6,
139
  "metadata": {
140
  "ExecuteTime": {
141
- "end_time": "2021-03-14T19:33:03.542260Z",
142
- "start_time": "2021-03-14T19:33:03.538498Z"
143
  }
144
  },
145
  "outputs": [
146
  {
147
- "name": "stderr",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
148
  "output_type": "stream",
149
  "text": [
150
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-0ce2ebca66096fff.arrow\n"
151
  ]
152
  }
153
  ],
@@ -157,19 +283,33 @@
157
  },
158
  {
159
  "cell_type": "code",
160
- "execution_count": 7,
161
  "metadata": {
162
  "ExecuteTime": {
163
- "end_time": "2021-03-14T19:33:03.561798Z",
164
- "start_time": "2021-03-14T19:33:03.554256Z"
165
  }
166
  },
167
  "outputs": [
168
  {
169
- "name": "stderr",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  "output_type": "stream",
171
  "text": [
172
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-38a09981767eff59.arrow\n"
173
  ]
174
  }
175
  ],
@@ -179,11 +319,11 @@
179
  },
180
  {
181
  "cell_type": "code",
182
- "execution_count": 8,
183
  "metadata": {
184
  "ExecuteTime": {
185
- "end_time": "2021-03-14T19:33:04.357229Z",
186
- "start_time": "2021-03-14T19:33:03.570805Z"
187
  }
188
  },
189
  "outputs": [
@@ -191,112 +331,133 @@
191
  "name": "stdout",
192
  "output_type": "stream",
193
  "text": [
194
- " "
195
- ]
196
- },
197
- {
198
- "name": "stderr",
199
- "output_type": "stream",
200
- "text": [
201
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-ba8c6dd59eb8ccf2.arrow\n"
202
- ]
203
- },
204
- {
205
- "name": "stdout",
206
- "output_type": "stream",
207
- "text": [
208
- " "
209
- ]
210
- },
211
- {
212
- "name": "stderr",
213
- "output_type": "stream",
214
- "text": [
215
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-2e240883a5f827fd.arrow\n"
216
- ]
217
- },
218
- {
219
- "name": "stdout",
220
- "output_type": "stream",
221
- "text": [
222
- " "
223
- ]
224
- },
225
- {
226
- "name": "stderr",
227
- "output_type": "stream",
228
- "text": [
229
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-485c00dc9048ed50.arrow\n"
230
  ]
231
  },
232
  {
233
- "name": "stdout",
234
- "output_type": "stream",
235
- "text": [
236
- " "
237
- ]
 
 
 
 
 
 
 
238
  },
239
  {
240
- "name": "stderr",
241
- "output_type": "stream",
242
- "text": [
243
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-44bf1791baae8e2e.arrow\n"
244
- ]
 
 
 
 
 
 
 
245
  },
246
  {
247
- "name": "stdout",
248
- "output_type": "stream",
249
- "text": [
250
- " "
251
- ]
 
 
 
 
 
 
 
252
  },
253
  {
254
- "name": "stderr",
255
- "output_type": "stream",
256
- "text": [
257
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-ecc0dfac5615a58e.arrow\n"
258
- ]
 
 
 
 
 
 
 
259
  },
260
  {
261
- "name": "stdout",
262
- "output_type": "stream",
263
- "text": [
264
- " "
265
- ]
 
 
 
 
 
 
 
266
  },
267
  {
268
- "name": "stderr",
269
- "output_type": "stream",
270
- "text": [
271
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-923d905502a8661d.arrow\n"
272
- ]
 
 
 
 
 
 
 
273
  },
274
  {
275
- "name": "stdout",
276
- "output_type": "stream",
277
- "text": [
278
- " "
279
- ]
 
 
 
 
 
 
 
280
  },
281
  {
282
- "name": "stderr",
283
- "output_type": "stream",
284
- "text": [
285
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-bb54bb00dae79669.arrow\n"
286
- ]
 
 
 
 
 
 
 
287
  },
288
  {
289
  "name": "stdout",
290
  "output_type": "stream",
291
  "text": [
292
- " "
293
- ]
294
- },
295
- {
296
- "name": "stderr",
297
- "output_type": "stream",
298
- "text": [
299
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-062aeafc3b8816c1.arrow\n"
300
  ]
301
  }
302
  ],
@@ -306,11 +467,11 @@
306
  },
307
  {
308
  "cell_type": "code",
309
- "execution_count": 9,
310
  "metadata": {
311
  "ExecuteTime": {
312
- "end_time": "2021-03-14T19:33:11.205598Z",
313
- "start_time": "2021-03-14T19:33:04.368615Z"
314
  }
315
  },
316
  "outputs": [
@@ -332,12 +493,12 @@
332
  {
333
  "data": {
334
  "application/vnd.jupyter.widget-view+json": {
335
- "model_id": "b179696d93284b739cc550511ca28b78",
336
  "version_major": 2,
337
  "version_minor": 0
338
  },
339
  "text/plain": [
340
- "HBox(children=(IntProgress(value=0, description='#1', max=24, style=ProgressStyle(description_width='initial')…"
341
  ]
342
  },
343
  "metadata": {},
@@ -346,12 +507,12 @@
346
  {
347
  "data": {
348
  "application/vnd.jupyter.widget-view+json": {
349
- "model_id": "2aa538a2fdcb4d56a55cd612c879044f",
350
  "version_major": 2,
351
  "version_minor": 0
352
  },
353
  "text/plain": [
354
- "HBox(children=(IntProgress(value=0, description='#0', max=24, style=ProgressStyle(description_width='initial')…"
355
  ]
356
  },
357
  "metadata": {},
@@ -360,12 +521,12 @@
360
  {
361
  "data": {
362
  "application/vnd.jupyter.widget-view+json": {
363
- "model_id": "073b156d7b7541e08ad20ec377efb05b",
364
  "version_major": 2,
365
  "version_minor": 0
366
  },
367
  "text/plain": [
368
- "HBox(children=(IntProgress(value=0, description='#2', max=24, style=ProgressStyle(description_width='initial')…"
369
  ]
370
  },
371
  "metadata": {},
@@ -374,12 +535,12 @@
374
  {
375
  "data": {
376
  "application/vnd.jupyter.widget-view+json": {
377
- "model_id": "dcaa10621a674699a7bf17357cd75a4a",
378
  "version_major": 2,
379
  "version_minor": 0
380
  },
381
  "text/plain": [
382
- "HBox(children=(IntProgress(value=0, description='#4', max=24, style=ProgressStyle(description_width='initial')…"
383
  ]
384
  },
385
  "metadata": {},
@@ -388,12 +549,12 @@
388
  {
389
  "data": {
390
  "application/vnd.jupyter.widget-view+json": {
391
- "model_id": "9ee2184681db4e16802387bbc1acfef3",
392
  "version_major": 2,
393
  "version_minor": 0
394
  },
395
  "text/plain": [
396
- "HBox(children=(IntProgress(value=0, description='#3', max=24, style=ProgressStyle(description_width='initial')…"
397
  ]
398
  },
399
  "metadata": {},
@@ -402,12 +563,12 @@
402
  {
403
  "data": {
404
  "application/vnd.jupyter.widget-view+json": {
405
- "model_id": "36c3bcde96114167a1dc6942d9d551f1",
406
  "version_major": 2,
407
  "version_minor": 0
408
  },
409
  "text/plain": [
410
- "HBox(children=(IntProgress(value=0, description='#6', max=24, style=ProgressStyle(description_width='initial')…"
411
  ]
412
  },
413
  "metadata": {},
@@ -416,12 +577,12 @@
416
  {
417
  "data": {
418
  "application/vnd.jupyter.widget-view+json": {
419
- "model_id": "b0ad190f479d40a599e74cfa9deddec8",
420
  "version_major": 2,
421
  "version_minor": 0
422
  },
423
  "text/plain": [
424
- "HBox(children=(IntProgress(value=0, description='#5', max=24, style=ProgressStyle(description_width='initial')…"
425
  ]
426
  },
427
  "metadata": {},
@@ -430,7 +591,7 @@
430
  {
431
  "data": {
432
  "application/vnd.jupyter.widget-view+json": {
433
- "model_id": "138f7261158c4a9ab84414a20954de01",
434
  "version_major": 2,
435
  "version_minor": 0
436
  },
@@ -462,11 +623,11 @@
462
  },
463
  {
464
  "cell_type": "code",
465
- "execution_count": 10,
466
  "metadata": {
467
  "ExecuteTime": {
468
- "end_time": "2021-03-14T19:33:14.391497Z",
469
- "start_time": "2021-03-14T19:33:11.216118Z"
470
  }
471
  },
472
  "outputs": [
@@ -474,8 +635,120 @@
474
  "name": "stderr",
475
  "output_type": "stream",
476
  "text": [
477
- "Using custom data configuration el-ac779bf2c9f7c09b\n",
478
- "Reusing dataset common_voice (/home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
479
  ]
480
  }
481
  ],
@@ -536,6 +809,96 @@
536
  "# πού θέλεις να πάμε; ρώτησε φοβισμένα ο βασιλιάς."
537
  ]
538
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
539
  {
540
  "cell_type": "code",
541
  "execution_count": null,
5
  "execution_count": 1,
6
  "metadata": {
7
  "ExecuteTime": {
8
+ "end_time": "2021-03-17T11:10:25.794375Z",
9
+ "start_time": "2021-03-17T11:10:24.301013Z"
10
  }
11
  },
12
  "outputs": [
36
  "execution_count": 2,
37
  "metadata": {
38
  "ExecuteTime": {
39
+ "end_time": "2021-03-17T11:10:29.608803Z",
40
+ "start_time": "2021-03-17T11:10:29.599700Z"
41
  }
42
  },
43
  "outputs": [],
75
  },
76
  {
77
  "cell_type": "code",
78
+ "execution_count": 4,
79
  "metadata": {
80
  "ExecuteTime": {
81
+ "end_time": "2021-03-17T11:11:02.120225Z",
82
+ "start_time": "2021-03-17T11:10:56.182488Z"
83
  }
84
  },
85
  "outputs": [
98
  },
99
  {
100
  "cell_type": "code",
101
+ "execution_count": 6,
102
  "metadata": {
103
  "ExecuteTime": {
104
+ "end_time": "2021-03-17T11:12:18.847005Z",
105
+ "start_time": "2021-03-17T11:12:14.919077Z"
106
  }
107
  },
108
  "outputs": [
110
  "name": "stderr",
111
  "output_type": "stream",
112
  "text": [
113
+ "Using custom data configuration el-afd0a157f05ee080\n"
114
+ ]
115
+ },
116
+ {
117
+ "name": "stdout",
118
+ "output_type": "stream",
119
+ "text": [
120
+ "Downloading and preparing dataset common_voice/el (download: 363.89 MiB, generated: 4.75 MiB, post-processed: Unknown size, total: 368.64 MiB) to /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f...\n"
121
+ ]
122
+ },
123
+ {
124
+ "data": {
125
+ "application/vnd.jupyter.widget-view+json": {
126
+ "model_id": "",
127
+ "version_major": 2,
128
+ "version_minor": 0
129
+ },
130
+ "text/plain": [
131
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
132
+ ]
133
+ },
134
+ "metadata": {},
135
+ "output_type": "display_data"
136
+ },
137
+ {
138
+ "name": "stdout",
139
+ "output_type": "stream",
140
+ "text": [
141
+ "\r"
142
+ ]
143
+ },
144
+ {
145
+ "data": {
146
+ "application/vnd.jupyter.widget-view+json": {
147
+ "model_id": "",
148
+ "version_major": 2,
149
+ "version_minor": 0
150
+ },
151
+ "text/plain": [
152
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
153
+ ]
154
+ },
155
+ "metadata": {},
156
+ "output_type": "display_data"
157
+ },
158
+ {
159
+ "name": "stdout",
160
+ "output_type": "stream",
161
+ "text": [
162
+ "\r"
163
+ ]
164
+ },
165
+ {
166
+ "data": {
167
+ "application/vnd.jupyter.widget-view+json": {
168
+ "model_id": "",
169
+ "version_major": 2,
170
+ "version_minor": 0
171
+ },
172
+ "text/plain": [
173
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
174
+ ]
175
+ },
176
+ "metadata": {},
177
+ "output_type": "display_data"
178
+ },
179
+ {
180
+ "name": "stdout",
181
+ "output_type": "stream",
182
+ "text": [
183
+ "\r"
184
+ ]
185
+ },
186
+ {
187
+ "data": {
188
+ "application/vnd.jupyter.widget-view+json": {
189
+ "model_id": "",
190
+ "version_major": 2,
191
+ "version_minor": 0
192
+ },
193
+ "text/plain": [
194
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
195
+ ]
196
+ },
197
+ "metadata": {},
198
+ "output_type": "display_data"
199
+ },
200
+ {
201
+ "name": "stdout",
202
+ "output_type": "stream",
203
+ "text": [
204
+ "\r"
205
+ ]
206
+ },
207
+ {
208
+ "data": {
209
+ "application/vnd.jupyter.widget-view+json": {
210
+ "model_id": "",
211
+ "version_major": 2,
212
+ "version_minor": 0
213
+ },
214
+ "text/plain": [
215
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
216
+ ]
217
+ },
218
+ "metadata": {},
219
+ "output_type": "display_data"
220
+ },
221
+ {
222
+ "name": "stdout",
223
+ "output_type": "stream",
224
+ "text": [
225
+ "\r",
226
+ "Dataset common_voice downloaded and prepared to /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f. Subsequent calls will reuse this data.\n"
227
  ]
228
  }
229
  ],
233
  },
234
  {
235
  "cell_type": "code",
236
+ "execution_count": 7,
237
  "metadata": {
238
  "ExecuteTime": {
239
+ "end_time": "2021-03-17T11:12:18.860240Z",
240
+ "start_time": "2021-03-17T11:12:18.857252Z"
241
  }
242
  },
243
  "outputs": [],
247
  },
248
  {
249
  "cell_type": "code",
250
+ "execution_count": 8,
251
  "metadata": {
252
  "ExecuteTime": {
253
+ "end_time": "2021-03-17T11:12:18.928497Z",
254
+ "start_time": "2021-03-17T11:12:18.869198Z"
255
  }
256
  },
257
  "outputs": [
258
  {
259
+ "data": {
260
+ "application/vnd.jupyter.widget-view+json": {
261
+ "model_id": "9869698af86e44bca75c4252996ff1a3",
262
+ "version_major": 2,
263
+ "version_minor": 0
264
+ },
265
+ "text/plain": [
266
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
267
+ ]
268
+ },
269
+ "metadata": {},
270
+ "output_type": "display_data"
271
+ },
272
+ {
273
+ "name": "stdout",
274
  "output_type": "stream",
275
  "text": [
276
+ "\n"
277
  ]
278
  }
279
  ],
283
  },
284
  {
285
  "cell_type": "code",
286
+ "execution_count": 9,
287
  "metadata": {
288
  "ExecuteTime": {
289
+ "end_time": "2021-03-17T11:12:40.824595Z",
290
+ "start_time": "2021-03-17T11:12:18.937930Z"
291
  }
292
  },
293
  "outputs": [
294
  {
295
+ "data": {
296
+ "application/vnd.jupyter.widget-view+json": {
297
+ "model_id": "d232b2bb009543e0bb2542bce273c554",
298
+ "version_major": 2,
299
+ "version_minor": 0
300
+ },
301
+ "text/plain": [
302
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
303
+ ]
304
+ },
305
+ "metadata": {},
306
+ "output_type": "display_data"
307
+ },
308
+ {
309
+ "name": "stdout",
310
  "output_type": "stream",
311
  "text": [
312
+ "\n"
313
  ]
314
  }
315
  ],
319
  },
320
  {
321
  "cell_type": "code",
322
+ "execution_count": 10,
323
  "metadata": {
324
  "ExecuteTime": {
325
+ "end_time": "2021-03-17T11:13:18.078738Z",
326
+ "start_time": "2021-03-17T11:12:40.834398Z"
327
  }
328
  },
329
  "outputs": [
331
  "name": "stdout",
332
  "output_type": "stream",
333
  "text": [
334
+ " "
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
335
  ]
336
  },
337
  {
338
+ "data": {
339
+ "application/vnd.jupyter.widget-view+json": {
340
+ "model_id": "ffd787bc4ed048ae8f4977f2c539bedb",
341
+ "version_major": 2,
342
+ "version_minor": 0
343
+ },
344
+ "text/plain": [
345
+ "HBox(children=(IntProgress(value=0, description='#0', max=191, style=ProgressStyle(description_width='initial'…"
346
+ ]
347
+ },
348
+ "metadata": {},
349
+ "output_type": "display_data"
350
  },
351
  {
352
+ "data": {
353
+ "application/vnd.jupyter.widget-view+json": {
354
+ "model_id": "79c51995d4f84ad8812230480d14b8cd",
355
+ "version_major": 2,
356
+ "version_minor": 0
357
+ },
358
+ "text/plain": [
359
+ "HBox(children=(IntProgress(value=0, description='#2', max=190, style=ProgressStyle(description_width='initial'…"
360
+ ]
361
+ },
362
+ "metadata": {},
363
+ "output_type": "display_data"
364
  },
365
  {
366
+ "data": {
367
+ "application/vnd.jupyter.widget-view+json": {
368
+ "model_id": "52963d9cfd814346af070b2cc4e105cf",
369
+ "version_major": 2,
370
+ "version_minor": 0
371
+ },
372
+ "text/plain": [
373
+ "HBox(children=(IntProgress(value=0, description='#5', max=190, style=ProgressStyle(description_width='initial'…"
374
+ ]
375
+ },
376
+ "metadata": {},
377
+ "output_type": "display_data"
378
  },
379
  {
380
+ "data": {
381
+ "application/vnd.jupyter.widget-view+json": {
382
+ "model_id": "3b940160575143c7acfa142564e9f7d2",
383
+ "version_major": 2,
384
+ "version_minor": 0
385
+ },
386
+ "text/plain": [
387
+ "HBox(children=(IntProgress(value=0, description='#3', max=190, style=ProgressStyle(description_width='initial'…"
388
+ ]
389
+ },
390
+ "metadata": {},
391
+ "output_type": "display_data"
392
  },
393
  {
394
+ "data": {
395
+ "application/vnd.jupyter.widget-view+json": {
396
+ "model_id": "aa540f67ba894d7aa64e12fcdfab5ce0",
397
+ "version_major": 2,
398
+ "version_minor": 0
399
+ },
400
+ "text/plain": [
401
+ "HBox(children=(IntProgress(value=0, description='#1', max=191, style=ProgressStyle(description_width='initial'…"
402
+ ]
403
+ },
404
+ "metadata": {},
405
+ "output_type": "display_data"
406
  },
407
  {
408
+ "data": {
409
+ "application/vnd.jupyter.widget-view+json": {
410
+ "model_id": "4962bdefdbbc44a7a44591480d8d6406",
411
+ "version_major": 2,
412
+ "version_minor": 0
413
+ },
414
+ "text/plain": [
415
+ "HBox(children=(IntProgress(value=0, description='#4', max=190, style=ProgressStyle(description_width='initial'…"
416
+ ]
417
+ },
418
+ "metadata": {},
419
+ "output_type": "display_data"
420
  },
421
  {
422
+ "data": {
423
+ "application/vnd.jupyter.widget-view+json": {
424
+ "model_id": "e77f088bfe5644548fe2c4277d0c86da",
425
+ "version_major": 2,
426
+ "version_minor": 0
427
+ },
428
+ "text/plain": [
429
+ "HBox(children=(IntProgress(value=0, description='#7', max=190, style=ProgressStyle(description_width='initial'…"
430
+ ]
431
+ },
432
+ "metadata": {},
433
+ "output_type": "display_data"
434
  },
435
  {
436
+ "data": {
437
+ "application/vnd.jupyter.widget-view+json": {
438
+ "model_id": "5827f93e99994fe9919aac53f0fb9444",
439
+ "version_major": 2,
440
+ "version_minor": 0
441
+ },
442
+ "text/plain": [
443
+ "HBox(children=(IntProgress(value=0, description='#6', max=190, style=ProgressStyle(description_width='initial'…"
444
+ ]
445
+ },
446
+ "metadata": {},
447
+ "output_type": "display_data"
448
  },
449
  {
450
  "name": "stdout",
451
  "output_type": "stream",
452
  "text": [
453
+ "\n",
454
+ "\n",
455
+ "\n",
456
+ "\n",
457
+ "\n",
458
+ "\n",
459
+ "\n",
460
+ "\n"
461
  ]
462
  }
463
  ],
467
  },
468
  {
469
  "cell_type": "code",
470
+ "execution_count": 11,
471
  "metadata": {
472
  "ExecuteTime": {
473
+ "end_time": "2021-03-17T11:13:25.145155Z",
474
+ "start_time": "2021-03-17T11:13:18.091929Z"
475
  }
476
  },
477
  "outputs": [
493
  {
494
  "data": {
495
  "application/vnd.jupyter.widget-view+json": {
496
+ "model_id": "ae326a173a044b1494793e2a70d76a87",
497
  "version_major": 2,
498
  "version_minor": 0
499
  },
500
  "text/plain": [
501
+ "HBox(children=(IntProgress(value=0, description='#0', max=24, style=ProgressStyle(description_width='initial')…"
502
  ]
503
  },
504
  "metadata": {},
507
  {
508
  "data": {
509
  "application/vnd.jupyter.widget-view+json": {
510
+ "model_id": "21ab1ef2af5a4a4fb23c68b0c5cf32f8",
511
  "version_major": 2,
512
  "version_minor": 0
513
  },
514
  "text/plain": [
515
+ "HBox(children=(IntProgress(value=0, description='#1', max=24, style=ProgressStyle(description_width='initial')…"
516
  ]
517
  },
518
  "metadata": {},
521
  {
522
  "data": {
523
  "application/vnd.jupyter.widget-view+json": {
524
+ "model_id": "d331c5f4f888477daceffe370f6cd89f",
525
  "version_major": 2,
526
  "version_minor": 0
527
  },
528
  "text/plain": [
529
+ "HBox(children=(IntProgress(value=0, description='#3', max=24, style=ProgressStyle(description_width='initial')…"
530
  ]
531
  },
532
  "metadata": {},
535
  {
536
  "data": {
537
  "application/vnd.jupyter.widget-view+json": {
538
+ "model_id": "6fa790118aa340e4afb9f83e71403a13",
539
  "version_major": 2,
540
  "version_minor": 0
541
  },
542
  "text/plain": [
543
+ "HBox(children=(IntProgress(value=0, description='#2', max=24, style=ProgressStyle(description_width='initial')…"
544
  ]
545
  },
546
  "metadata": {},
549
  {
550
  "data": {
551
  "application/vnd.jupyter.widget-view+json": {
552
+ "model_id": "c8092e2f59a9404596dc2bab206edf2c",
553
  "version_major": 2,
554
  "version_minor": 0
555
  },
556
  "text/plain": [
557
+ "HBox(children=(IntProgress(value=0, description='#5', max=24, style=ProgressStyle(description_width='initial')…"
558
  ]
559
  },
560
  "metadata": {},
563
  {
564
  "data": {
565
  "application/vnd.jupyter.widget-view+json": {
566
+ "model_id": "20f913f0caf8401098743b9e5051fc52",
567
  "version_major": 2,
568
  "version_minor": 0
569
  },
570
  "text/plain": [
571
+ "HBox(children=(IntProgress(value=0, description='#4', max=24, style=ProgressStyle(description_width='initial')…"
572
  ]
573
  },
574
  "metadata": {},
577
  {
578
  "data": {
579
  "application/vnd.jupyter.widget-view+json": {
580
+ "model_id": "7c7e15e24384494cb49a72106ce41ccd",
581
  "version_major": 2,
582
  "version_minor": 0
583
  },
584
  "text/plain": [
585
+ "HBox(children=(IntProgress(value=0, description='#6', max=24, style=ProgressStyle(description_width='initial')…"
586
  ]
587
  },
588
  "metadata": {},
591
  {
592
  "data": {
593
  "application/vnd.jupyter.widget-view+json": {
594
+ "model_id": "73245add55e24ee2a6dbe0713d5073d9",
595
  "version_major": 2,
596
  "version_minor": 0
597
  },
623
  },
624
  {
625
  "cell_type": "code",
626
+ "execution_count": 12,
627
  "metadata": {
628
  "ExecuteTime": {
629
+ "end_time": "2021-03-17T11:14:12.721500Z",
630
+ "start_time": "2021-03-17T11:14:08.198478Z"
631
  }
632
  },
633
  "outputs": [
635
  "name": "stderr",
636
  "output_type": "stream",
637
  "text": [
638
+ "Using custom data configuration el-ac779bf2c9f7c09b\n"
639
+ ]
640
+ },
641
+ {
642
+ "name": "stdout",
643
+ "output_type": "stream",
644
+ "text": [
645
+ "Downloading and preparing dataset common_voice/el (download: 363.89 MiB, generated: 4.75 MiB, post-processed: Unknown size, total: 368.64 MiB) to /home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f...\n"
646
+ ]
647
+ },
648
+ {
649
+ "data": {
650
+ "application/vnd.jupyter.widget-view+json": {
651
+ "model_id": "",
652
+ "version_major": 2,
653
+ "version_minor": 0
654
+ },
655
+ "text/plain": [
656
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
657
+ ]
658
+ },
659
+ "metadata": {},
660
+ "output_type": "display_data"
661
+ },
662
+ {
663
+ "name": "stdout",
664
+ "output_type": "stream",
665
+ "text": [
666
+ "\r"
667
+ ]
668
+ },
669
+ {
670
+ "data": {
671
+ "application/vnd.jupyter.widget-view+json": {
672
+ "model_id": "",
673
+ "version_major": 2,
674
+ "version_minor": 0
675
+ },
676
+ "text/plain": [
677
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
678
+ ]
679
+ },
680
+ "metadata": {},
681
+ "output_type": "display_data"
682
+ },
683
+ {
684
+ "name": "stdout",
685
+ "output_type": "stream",
686
+ "text": [
687
+ "\r"
688
+ ]
689
+ },
690
+ {
691
+ "data": {
692
+ "application/vnd.jupyter.widget-view+json": {
693
+ "model_id": "",
694
+ "version_major": 2,
695
+ "version_minor": 0
696
+ },
697
+ "text/plain": [
698
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
699
+ ]
700
+ },
701
+ "metadata": {},
702
+ "output_type": "display_data"
703
+ },
704
+ {
705
+ "name": "stdout",
706
+ "output_type": "stream",
707
+ "text": [
708
+ "\r"
709
+ ]
710
+ },
711
+ {
712
+ "data": {
713
+ "application/vnd.jupyter.widget-view+json": {
714
+ "model_id": "",
715
+ "version_major": 2,
716
+ "version_minor": 0
717
+ },
718
+ "text/plain": [
719
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
720
+ ]
721
+ },
722
+ "metadata": {},
723
+ "output_type": "display_data"
724
+ },
725
+ {
726
+ "name": "stdout",
727
+ "output_type": "stream",
728
+ "text": [
729
+ "\r"
730
+ ]
731
+ },
732
+ {
733
+ "data": {
734
+ "application/vnd.jupyter.widget-view+json": {
735
+ "model_id": "",
736
+ "version_major": 2,
737
+ "version_minor": 0
738
+ },
739
+ "text/plain": [
740
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
741
+ ]
742
+ },
743
+ "metadata": {},
744
+ "output_type": "display_data"
745
+ },
746
+ {
747
+ "name": "stdout",
748
+ "output_type": "stream",
749
+ "text": [
750
+ "\r",
751
+ "Dataset common_voice downloaded and prepared to /home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f. Subsequent calls will reuse this data.\n"
752
  ]
753
  }
754
  ],
809
  "# πού θέλεις να πάμε; ρώτησε φοβισμένα ο βασιλιάς."
810
  ]
811
  },
812
+ {
813
+ "cell_type": "code",
814
+ "execution_count": 13,
815
+ "metadata": {
816
+ "ExecuteTime": {
817
+ "end_time": "2021-03-17T11:15:35.637739Z",
818
+ "start_time": "2021-03-17T11:14:14.689842Z"
819
+ }
820
+ },
821
+ "outputs": [
822
+ {
823
+ "data": {
824
+ "application/vnd.jupyter.widget-view+json": {
825
+ "model_id": "1f7ba9e12187401f870555d20a6a9458",
826
+ "version_major": 2,
827
+ "version_minor": 0
828
+ },
829
+ "text/plain": [
830
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
831
+ ]
832
+ },
833
+ "metadata": {},
834
+ "output_type": "display_data"
835
+ },
836
+ {
837
+ "name": "stdout",
838
+ "output_type": "stream",
839
+ "text": [
840
+ "\n"
841
+ ]
842
+ }
843
+ ],
844
+ "source": [
845
+ "def map_to_result(batch):\n",
846
+ " model.to(\"cuda\")\n",
847
+ " input_values = processor(\n",
848
+ " batch[\"input_values\"], \n",
849
+ " sampling_rate=16_000, \n",
850
+ " return_tensors=\"pt\"\n",
851
+ " ).input_values.to(\"cuda\")\n",
852
+ "\n",
853
+ " with torch.no_grad():\n",
854
+ " logits = model(input_values).logits\n",
855
+ "\n",
856
+ " pred_ids = torch.argmax(logits, dim=-1)\n",
857
+ " batch[\"pred_str\"] = processor.batch_decode(pred_ids)[0]\n",
858
+ "\n",
859
+ " return batch\n",
860
+ "\n",
861
+ "results = common_voice_test.map(map_to_result)\n"
862
+ ]
863
+ },
864
+ {
865
+ "cell_type": "code",
866
+ "execution_count": 16,
867
+ "metadata": {
868
+ "ExecuteTime": {
869
+ "end_time": "2021-03-17T11:17:11.951524Z",
870
+ "start_time": "2021-03-17T11:17:08.856552Z"
871
+ }
872
+ },
873
+ "outputs": [
874
+ {
875
+ "name": "stdout",
876
+ "output_type": "stream",
877
+ "text": [
878
+ "Test WER: 0.396\n"
879
+ ]
880
+ }
881
+ ],
882
+ "source": [
883
+ "def compute_metrics(pred):\n",
884
+ " pred_logits = pred.predictions\n",
885
+ " pred_ids = np.argmax(pred_logits, axis=-1)\n",
886
+ "\n",
887
+ " pred.label_ids[pred.label_ids == -100] = processor.tokenizer.pad_token_id\n",
888
+ "\n",
889
+ " pred_str = processor.batch_decode(pred_ids)\n",
890
+ " # we do not want to group tokens when computing the metrics\n",
891
+ " label_str = processor.batch_decode(pred.label_ids, group_tokens=False)\n",
892
+ "\n",
893
+ " wer = wer_metric.compute(predictions=pred_str, references=label_str)\n",
894
+ "\n",
895
+ " return {\"wer\": wer}\n",
896
+ "\n",
897
+ "wer_metric = load_metric(\"wer\")\n",
898
+ "\n",
899
+ "print(\"Test WER: {:.3f}\".format(wer_metric.compute(predictions=results[\"pred_str\"], references= [item.lower() for item in common_voice_test_transcription['sentence']])))"
900
+ ]
901
+ },
902
  {
903
  "cell_type": "code",
904
  "execution_count": null,
ASR_Inference.ipynb CHANGED
@@ -5,8 +5,8 @@
5
  "execution_count": 1,
6
  "metadata": {
7
  "ExecuteTime": {
8
- "end_time": "2021-03-14T19:32:40.765119Z",
9
- "start_time": "2021-03-14T19:32:39.314790Z"
10
  }
11
  },
12
  "outputs": [
@@ -36,8 +36,8 @@
36
  "execution_count": 2,
37
  "metadata": {
38
  "ExecuteTime": {
39
- "end_time": "2021-03-14T19:32:40.774860Z",
40
- "start_time": "2021-03-14T19:32:40.771235Z"
41
  }
42
  },
43
  "outputs": [],
@@ -75,11 +75,11 @@
75
  },
76
  {
77
  "cell_type": "code",
78
- "execution_count": 3,
79
  "metadata": {
80
  "ExecuteTime": {
81
- "end_time": "2021-03-14T19:32:49.565850Z",
82
- "start_time": "2021-03-14T19:32:41.891601Z"
83
  }
84
  },
85
  "outputs": [
@@ -98,11 +98,11 @@
98
  },
99
  {
100
  "cell_type": "code",
101
- "execution_count": 4,
102
  "metadata": {
103
  "ExecuteTime": {
104
- "end_time": "2021-03-14T19:33:03.514113Z",
105
- "start_time": "2021-03-14T19:33:00.953049Z"
106
  }
107
  },
108
  "outputs": [
@@ -110,8 +110,120 @@
110
  "name": "stderr",
111
  "output_type": "stream",
112
  "text": [
113
- "Using custom data configuration el-afd0a157f05ee080\n",
114
- "Reusing dataset common_voice (/home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
  ]
116
  }
117
  ],
@@ -121,11 +233,11 @@
121
  },
122
  {
123
  "cell_type": "code",
124
- "execution_count": 5,
125
  "metadata": {
126
  "ExecuteTime": {
127
- "end_time": "2021-03-14T19:33:03.528699Z",
128
- "start_time": "2021-03-14T19:33:03.525034Z"
129
  }
130
  },
131
  "outputs": [],
@@ -135,19 +247,33 @@
135
  },
136
  {
137
  "cell_type": "code",
138
- "execution_count": 6,
139
  "metadata": {
140
  "ExecuteTime": {
141
- "end_time": "2021-03-14T19:33:03.542260Z",
142
- "start_time": "2021-03-14T19:33:03.538498Z"
143
  }
144
  },
145
  "outputs": [
146
  {
147
- "name": "stderr",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
148
  "output_type": "stream",
149
  "text": [
150
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-0ce2ebca66096fff.arrow\n"
151
  ]
152
  }
153
  ],
@@ -157,19 +283,33 @@
157
  },
158
  {
159
  "cell_type": "code",
160
- "execution_count": 7,
161
  "metadata": {
162
  "ExecuteTime": {
163
- "end_time": "2021-03-14T19:33:03.561798Z",
164
- "start_time": "2021-03-14T19:33:03.554256Z"
165
  }
166
  },
167
  "outputs": [
168
  {
169
- "name": "stderr",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  "output_type": "stream",
171
  "text": [
172
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-38a09981767eff59.arrow\n"
173
  ]
174
  }
175
  ],
@@ -179,11 +319,11 @@
179
  },
180
  {
181
  "cell_type": "code",
182
- "execution_count": 8,
183
  "metadata": {
184
  "ExecuteTime": {
185
- "end_time": "2021-03-14T19:33:04.357229Z",
186
- "start_time": "2021-03-14T19:33:03.570805Z"
187
  }
188
  },
189
  "outputs": [
@@ -191,112 +331,133 @@
191
  "name": "stdout",
192
  "output_type": "stream",
193
  "text": [
194
- " "
195
- ]
196
- },
197
- {
198
- "name": "stderr",
199
- "output_type": "stream",
200
- "text": [
201
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-ba8c6dd59eb8ccf2.arrow\n"
202
- ]
203
- },
204
- {
205
- "name": "stdout",
206
- "output_type": "stream",
207
- "text": [
208
- " "
209
- ]
210
- },
211
- {
212
- "name": "stderr",
213
- "output_type": "stream",
214
- "text": [
215
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-2e240883a5f827fd.arrow\n"
216
- ]
217
- },
218
- {
219
- "name": "stdout",
220
- "output_type": "stream",
221
- "text": [
222
- " "
223
- ]
224
- },
225
- {
226
- "name": "stderr",
227
- "output_type": "stream",
228
- "text": [
229
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-485c00dc9048ed50.arrow\n"
230
  ]
231
  },
232
  {
233
- "name": "stdout",
234
- "output_type": "stream",
235
- "text": [
236
- " "
237
- ]
 
 
 
 
 
 
 
238
  },
239
  {
240
- "name": "stderr",
241
- "output_type": "stream",
242
- "text": [
243
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-44bf1791baae8e2e.arrow\n"
244
- ]
 
 
 
 
 
 
 
245
  },
246
  {
247
- "name": "stdout",
248
- "output_type": "stream",
249
- "text": [
250
- " "
251
- ]
 
 
 
 
 
 
 
252
  },
253
  {
254
- "name": "stderr",
255
- "output_type": "stream",
256
- "text": [
257
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-ecc0dfac5615a58e.arrow\n"
258
- ]
 
 
 
 
 
 
 
259
  },
260
  {
261
- "name": "stdout",
262
- "output_type": "stream",
263
- "text": [
264
- " "
265
- ]
 
 
 
 
 
 
 
266
  },
267
  {
268
- "name": "stderr",
269
- "output_type": "stream",
270
- "text": [
271
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-923d905502a8661d.arrow\n"
272
- ]
 
 
 
 
 
 
 
273
  },
274
  {
275
- "name": "stdout",
276
- "output_type": "stream",
277
- "text": [
278
- " "
279
- ]
 
 
 
 
 
 
 
280
  },
281
  {
282
- "name": "stderr",
283
- "output_type": "stream",
284
- "text": [
285
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-bb54bb00dae79669.arrow\n"
286
- ]
 
 
 
 
 
 
 
287
  },
288
  {
289
  "name": "stdout",
290
  "output_type": "stream",
291
  "text": [
292
- " "
293
- ]
294
- },
295
- {
296
- "name": "stderr",
297
- "output_type": "stream",
298
- "text": [
299
- "Loading cached processed dataset at /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564/cache-062aeafc3b8816c1.arrow\n"
300
  ]
301
  }
302
  ],
@@ -306,11 +467,11 @@
306
  },
307
  {
308
  "cell_type": "code",
309
- "execution_count": 9,
310
  "metadata": {
311
  "ExecuteTime": {
312
- "end_time": "2021-03-14T19:33:11.205598Z",
313
- "start_time": "2021-03-14T19:33:04.368615Z"
314
  }
315
  },
316
  "outputs": [
@@ -332,12 +493,12 @@
332
  {
333
  "data": {
334
  "application/vnd.jupyter.widget-view+json": {
335
- "model_id": "b179696d93284b739cc550511ca28b78",
336
  "version_major": 2,
337
  "version_minor": 0
338
  },
339
  "text/plain": [
340
- "HBox(children=(IntProgress(value=0, description='#1', max=24, style=ProgressStyle(description_width='initial')…"
341
  ]
342
  },
343
  "metadata": {},
@@ -346,12 +507,12 @@
346
  {
347
  "data": {
348
  "application/vnd.jupyter.widget-view+json": {
349
- "model_id": "2aa538a2fdcb4d56a55cd612c879044f",
350
  "version_major": 2,
351
  "version_minor": 0
352
  },
353
  "text/plain": [
354
- "HBox(children=(IntProgress(value=0, description='#0', max=24, style=ProgressStyle(description_width='initial')…"
355
  ]
356
  },
357
  "metadata": {},
@@ -360,12 +521,12 @@
360
  {
361
  "data": {
362
  "application/vnd.jupyter.widget-view+json": {
363
- "model_id": "073b156d7b7541e08ad20ec377efb05b",
364
  "version_major": 2,
365
  "version_minor": 0
366
  },
367
  "text/plain": [
368
- "HBox(children=(IntProgress(value=0, description='#2', max=24, style=ProgressStyle(description_width='initial')…"
369
  ]
370
  },
371
  "metadata": {},
@@ -374,12 +535,12 @@
374
  {
375
  "data": {
376
  "application/vnd.jupyter.widget-view+json": {
377
- "model_id": "dcaa10621a674699a7bf17357cd75a4a",
378
  "version_major": 2,
379
  "version_minor": 0
380
  },
381
  "text/plain": [
382
- "HBox(children=(IntProgress(value=0, description='#4', max=24, style=ProgressStyle(description_width='initial')…"
383
  ]
384
  },
385
  "metadata": {},
@@ -388,12 +549,12 @@
388
  {
389
  "data": {
390
  "application/vnd.jupyter.widget-view+json": {
391
- "model_id": "9ee2184681db4e16802387bbc1acfef3",
392
  "version_major": 2,
393
  "version_minor": 0
394
  },
395
  "text/plain": [
396
- "HBox(children=(IntProgress(value=0, description='#3', max=24, style=ProgressStyle(description_width='initial')…"
397
  ]
398
  },
399
  "metadata": {},
@@ -402,12 +563,12 @@
402
  {
403
  "data": {
404
  "application/vnd.jupyter.widget-view+json": {
405
- "model_id": "36c3bcde96114167a1dc6942d9d551f1",
406
  "version_major": 2,
407
  "version_minor": 0
408
  },
409
  "text/plain": [
410
- "HBox(children=(IntProgress(value=0, description='#6', max=24, style=ProgressStyle(description_width='initial')…"
411
  ]
412
  },
413
  "metadata": {},
@@ -416,12 +577,12 @@
416
  {
417
  "data": {
418
  "application/vnd.jupyter.widget-view+json": {
419
- "model_id": "b0ad190f479d40a599e74cfa9deddec8",
420
  "version_major": 2,
421
  "version_minor": 0
422
  },
423
  "text/plain": [
424
- "HBox(children=(IntProgress(value=0, description='#5', max=24, style=ProgressStyle(description_width='initial')…"
425
  ]
426
  },
427
  "metadata": {},
@@ -430,7 +591,7 @@
430
  {
431
  "data": {
432
  "application/vnd.jupyter.widget-view+json": {
433
- "model_id": "138f7261158c4a9ab84414a20954de01",
434
  "version_major": 2,
435
  "version_minor": 0
436
  },
@@ -462,11 +623,11 @@
462
  },
463
  {
464
  "cell_type": "code",
465
- "execution_count": 10,
466
  "metadata": {
467
  "ExecuteTime": {
468
- "end_time": "2021-03-14T19:33:14.391497Z",
469
- "start_time": "2021-03-14T19:33:11.216118Z"
470
  }
471
  },
472
  "outputs": [
@@ -474,8 +635,120 @@
474
  "name": "stderr",
475
  "output_type": "stream",
476
  "text": [
477
- "Using custom data configuration el-ac779bf2c9f7c09b\n",
478
- "Reusing dataset common_voice (/home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/32954a9015faa0d840f6c6894938545c5d12bc5d8936a80079af74bf50d71564)\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
479
  ]
480
  }
481
  ],
@@ -536,6 +809,96 @@
536
  "# πού θέλεις να πάμε; ρώτησε φοβισμένα ο βασιλιάς."
537
  ]
538
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
539
  {
540
  "cell_type": "code",
541
  "execution_count": null,
5
  "execution_count": 1,
6
  "metadata": {
7
  "ExecuteTime": {
8
+ "end_time": "2021-03-17T11:10:25.794375Z",
9
+ "start_time": "2021-03-17T11:10:24.301013Z"
10
  }
11
  },
12
  "outputs": [
36
  "execution_count": 2,
37
  "metadata": {
38
  "ExecuteTime": {
39
+ "end_time": "2021-03-17T11:10:29.608803Z",
40
+ "start_time": "2021-03-17T11:10:29.599700Z"
41
  }
42
  },
43
  "outputs": [],
75
  },
76
  {
77
  "cell_type": "code",
78
+ "execution_count": 4,
79
  "metadata": {
80
  "ExecuteTime": {
81
+ "end_time": "2021-03-17T11:11:02.120225Z",
82
+ "start_time": "2021-03-17T11:10:56.182488Z"
83
  }
84
  },
85
  "outputs": [
98
  },
99
  {
100
  "cell_type": "code",
101
+ "execution_count": 6,
102
  "metadata": {
103
  "ExecuteTime": {
104
+ "end_time": "2021-03-17T11:12:18.847005Z",
105
+ "start_time": "2021-03-17T11:12:14.919077Z"
106
  }
107
  },
108
  "outputs": [
110
  "name": "stderr",
111
  "output_type": "stream",
112
  "text": [
113
+ "Using custom data configuration el-afd0a157f05ee080\n"
114
+ ]
115
+ },
116
+ {
117
+ "name": "stdout",
118
+ "output_type": "stream",
119
+ "text": [
120
+ "Downloading and preparing dataset common_voice/el (download: 363.89 MiB, generated: 4.75 MiB, post-processed: Unknown size, total: 368.64 MiB) to /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f...\n"
121
+ ]
122
+ },
123
+ {
124
+ "data": {
125
+ "application/vnd.jupyter.widget-view+json": {
126
+ "model_id": "",
127
+ "version_major": 2,
128
+ "version_minor": 0
129
+ },
130
+ "text/plain": [
131
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
132
+ ]
133
+ },
134
+ "metadata": {},
135
+ "output_type": "display_data"
136
+ },
137
+ {
138
+ "name": "stdout",
139
+ "output_type": "stream",
140
+ "text": [
141
+ "\r"
142
+ ]
143
+ },
144
+ {
145
+ "data": {
146
+ "application/vnd.jupyter.widget-view+json": {
147
+ "model_id": "",
148
+ "version_major": 2,
149
+ "version_minor": 0
150
+ },
151
+ "text/plain": [
152
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
153
+ ]
154
+ },
155
+ "metadata": {},
156
+ "output_type": "display_data"
157
+ },
158
+ {
159
+ "name": "stdout",
160
+ "output_type": "stream",
161
+ "text": [
162
+ "\r"
163
+ ]
164
+ },
165
+ {
166
+ "data": {
167
+ "application/vnd.jupyter.widget-view+json": {
168
+ "model_id": "",
169
+ "version_major": 2,
170
+ "version_minor": 0
171
+ },
172
+ "text/plain": [
173
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
174
+ ]
175
+ },
176
+ "metadata": {},
177
+ "output_type": "display_data"
178
+ },
179
+ {
180
+ "name": "stdout",
181
+ "output_type": "stream",
182
+ "text": [
183
+ "\r"
184
+ ]
185
+ },
186
+ {
187
+ "data": {
188
+ "application/vnd.jupyter.widget-view+json": {
189
+ "model_id": "",
190
+ "version_major": 2,
191
+ "version_minor": 0
192
+ },
193
+ "text/plain": [
194
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
195
+ ]
196
+ },
197
+ "metadata": {},
198
+ "output_type": "display_data"
199
+ },
200
+ {
201
+ "name": "stdout",
202
+ "output_type": "stream",
203
+ "text": [
204
+ "\r"
205
+ ]
206
+ },
207
+ {
208
+ "data": {
209
+ "application/vnd.jupyter.widget-view+json": {
210
+ "model_id": "",
211
+ "version_major": 2,
212
+ "version_minor": 0
213
+ },
214
+ "text/plain": [
215
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
216
+ ]
217
+ },
218
+ "metadata": {},
219
+ "output_type": "display_data"
220
+ },
221
+ {
222
+ "name": "stdout",
223
+ "output_type": "stream",
224
+ "text": [
225
+ "\r",
226
+ "Dataset common_voice downloaded and prepared to /home/earendil/.cache/huggingface/datasets/common_voice/el-afd0a157f05ee080/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f. Subsequent calls will reuse this data.\n"
227
  ]
228
  }
229
  ],
233
  },
234
  {
235
  "cell_type": "code",
236
+ "execution_count": 7,
237
  "metadata": {
238
  "ExecuteTime": {
239
+ "end_time": "2021-03-17T11:12:18.860240Z",
240
+ "start_time": "2021-03-17T11:12:18.857252Z"
241
  }
242
  },
243
  "outputs": [],
247
  },
248
  {
249
  "cell_type": "code",
250
+ "execution_count": 8,
251
  "metadata": {
252
  "ExecuteTime": {
253
+ "end_time": "2021-03-17T11:12:18.928497Z",
254
+ "start_time": "2021-03-17T11:12:18.869198Z"
255
  }
256
  },
257
  "outputs": [
258
  {
259
+ "data": {
260
+ "application/vnd.jupyter.widget-view+json": {
261
+ "model_id": "9869698af86e44bca75c4252996ff1a3",
262
+ "version_major": 2,
263
+ "version_minor": 0
264
+ },
265
+ "text/plain": [
266
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
267
+ ]
268
+ },
269
+ "metadata": {},
270
+ "output_type": "display_data"
271
+ },
272
+ {
273
+ "name": "stdout",
274
  "output_type": "stream",
275
  "text": [
276
+ "\n"
277
  ]
278
  }
279
  ],
283
  },
284
  {
285
  "cell_type": "code",
286
+ "execution_count": 9,
287
  "metadata": {
288
  "ExecuteTime": {
289
+ "end_time": "2021-03-17T11:12:40.824595Z",
290
+ "start_time": "2021-03-17T11:12:18.937930Z"
291
  }
292
  },
293
  "outputs": [
294
  {
295
+ "data": {
296
+ "application/vnd.jupyter.widget-view+json": {
297
+ "model_id": "d232b2bb009543e0bb2542bce273c554",
298
+ "version_major": 2,
299
+ "version_minor": 0
300
+ },
301
+ "text/plain": [
302
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
303
+ ]
304
+ },
305
+ "metadata": {},
306
+ "output_type": "display_data"
307
+ },
308
+ {
309
+ "name": "stdout",
310
  "output_type": "stream",
311
  "text": [
312
+ "\n"
313
  ]
314
  }
315
  ],
319
  },
320
  {
321
  "cell_type": "code",
322
+ "execution_count": 10,
323
  "metadata": {
324
  "ExecuteTime": {
325
+ "end_time": "2021-03-17T11:13:18.078738Z",
326
+ "start_time": "2021-03-17T11:12:40.834398Z"
327
  }
328
  },
329
  "outputs": [
331
  "name": "stdout",
332
  "output_type": "stream",
333
  "text": [
334
+ " "
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
335
  ]
336
  },
337
  {
338
+ "data": {
339
+ "application/vnd.jupyter.widget-view+json": {
340
+ "model_id": "ffd787bc4ed048ae8f4977f2c539bedb",
341
+ "version_major": 2,
342
+ "version_minor": 0
343
+ },
344
+ "text/plain": [
345
+ "HBox(children=(IntProgress(value=0, description='#0', max=191, style=ProgressStyle(description_width='initial'…"
346
+ ]
347
+ },
348
+ "metadata": {},
349
+ "output_type": "display_data"
350
  },
351
  {
352
+ "data": {
353
+ "application/vnd.jupyter.widget-view+json": {
354
+ "model_id": "79c51995d4f84ad8812230480d14b8cd",
355
+ "version_major": 2,
356
+ "version_minor": 0
357
+ },
358
+ "text/plain": [
359
+ "HBox(children=(IntProgress(value=0, description='#2', max=190, style=ProgressStyle(description_width='initial'…"
360
+ ]
361
+ },
362
+ "metadata": {},
363
+ "output_type": "display_data"
364
  },
365
  {
366
+ "data": {
367
+ "application/vnd.jupyter.widget-view+json": {
368
+ "model_id": "52963d9cfd814346af070b2cc4e105cf",
369
+ "version_major": 2,
370
+ "version_minor": 0
371
+ },
372
+ "text/plain": [
373
+ "HBox(children=(IntProgress(value=0, description='#5', max=190, style=ProgressStyle(description_width='initial'…"
374
+ ]
375
+ },
376
+ "metadata": {},
377
+ "output_type": "display_data"
378
  },
379
  {
380
+ "data": {
381
+ "application/vnd.jupyter.widget-view+json": {
382
+ "model_id": "3b940160575143c7acfa142564e9f7d2",
383
+ "version_major": 2,
384
+ "version_minor": 0
385
+ },
386
+ "text/plain": [
387
+ "HBox(children=(IntProgress(value=0, description='#3', max=190, style=ProgressStyle(description_width='initial'…"
388
+ ]
389
+ },
390
+ "metadata": {},
391
+ "output_type": "display_data"
392
  },
393
  {
394
+ "data": {
395
+ "application/vnd.jupyter.widget-view+json": {
396
+ "model_id": "aa540f67ba894d7aa64e12fcdfab5ce0",
397
+ "version_major": 2,
398
+ "version_minor": 0
399
+ },
400
+ "text/plain": [
401
+ "HBox(children=(IntProgress(value=0, description='#1', max=191, style=ProgressStyle(description_width='initial'…"
402
+ ]
403
+ },
404
+ "metadata": {},
405
+ "output_type": "display_data"
406
  },
407
  {
408
+ "data": {
409
+ "application/vnd.jupyter.widget-view+json": {
410
+ "model_id": "4962bdefdbbc44a7a44591480d8d6406",
411
+ "version_major": 2,
412
+ "version_minor": 0
413
+ },
414
+ "text/plain": [
415
+ "HBox(children=(IntProgress(value=0, description='#4', max=190, style=ProgressStyle(description_width='initial'…"
416
+ ]
417
+ },
418
+ "metadata": {},
419
+ "output_type": "display_data"
420
  },
421
  {
422
+ "data": {
423
+ "application/vnd.jupyter.widget-view+json": {
424
+ "model_id": "e77f088bfe5644548fe2c4277d0c86da",
425
+ "version_major": 2,
426
+ "version_minor": 0
427
+ },
428
+ "text/plain": [
429
+ "HBox(children=(IntProgress(value=0, description='#7', max=190, style=ProgressStyle(description_width='initial'…"
430
+ ]
431
+ },
432
+ "metadata": {},
433
+ "output_type": "display_data"
434
  },
435
  {
436
+ "data": {
437
+ "application/vnd.jupyter.widget-view+json": {
438
+ "model_id": "5827f93e99994fe9919aac53f0fb9444",
439
+ "version_major": 2,
440
+ "version_minor": 0
441
+ },
442
+ "text/plain": [
443
+ "HBox(children=(IntProgress(value=0, description='#6', max=190, style=ProgressStyle(description_width='initial'…"
444
+ ]
445
+ },
446
+ "metadata": {},
447
+ "output_type": "display_data"
448
  },
449
  {
450
  "name": "stdout",
451
  "output_type": "stream",
452
  "text": [
453
+ "\n",
454
+ "\n",
455
+ "\n",
456
+ "\n",
457
+ "\n",
458
+ "\n",
459
+ "\n",
460
+ "\n"
461
  ]
462
  }
463
  ],
467
  },
468
  {
469
  "cell_type": "code",
470
+ "execution_count": 11,
471
  "metadata": {
472
  "ExecuteTime": {
473
+ "end_time": "2021-03-17T11:13:25.145155Z",
474
+ "start_time": "2021-03-17T11:13:18.091929Z"
475
  }
476
  },
477
  "outputs": [
493
  {
494
  "data": {
495
  "application/vnd.jupyter.widget-view+json": {
496
+ "model_id": "ae326a173a044b1494793e2a70d76a87",
497
  "version_major": 2,
498
  "version_minor": 0
499
  },
500
  "text/plain": [
501
+ "HBox(children=(IntProgress(value=0, description='#0', max=24, style=ProgressStyle(description_width='initial')…"
502
  ]
503
  },
504
  "metadata": {},
507
  {
508
  "data": {
509
  "application/vnd.jupyter.widget-view+json": {
510
+ "model_id": "21ab1ef2af5a4a4fb23c68b0c5cf32f8",
511
  "version_major": 2,
512
  "version_minor": 0
513
  },
514
  "text/plain": [
515
+ "HBox(children=(IntProgress(value=0, description='#1', max=24, style=ProgressStyle(description_width='initial')…"
516
  ]
517
  },
518
  "metadata": {},
521
  {
522
  "data": {
523
  "application/vnd.jupyter.widget-view+json": {
524
+ "model_id": "d331c5f4f888477daceffe370f6cd89f",
525
  "version_major": 2,
526
  "version_minor": 0
527
  },
528
  "text/plain": [
529
+ "HBox(children=(IntProgress(value=0, description='#3', max=24, style=ProgressStyle(description_width='initial')…"
530
  ]
531
  },
532
  "metadata": {},
535
  {
536
  "data": {
537
  "application/vnd.jupyter.widget-view+json": {
538
+ "model_id": "6fa790118aa340e4afb9f83e71403a13",
539
  "version_major": 2,
540
  "version_minor": 0
541
  },
542
  "text/plain": [
543
+ "HBox(children=(IntProgress(value=0, description='#2', max=24, style=ProgressStyle(description_width='initial')…"
544
  ]
545
  },
546
  "metadata": {},
549
  {
550
  "data": {
551
  "application/vnd.jupyter.widget-view+json": {
552
+ "model_id": "c8092e2f59a9404596dc2bab206edf2c",
553
  "version_major": 2,
554
  "version_minor": 0
555
  },
556
  "text/plain": [
557
+ "HBox(children=(IntProgress(value=0, description='#5', max=24, style=ProgressStyle(description_width='initial')…"
558
  ]
559
  },
560
  "metadata": {},
563
  {
564
  "data": {
565
  "application/vnd.jupyter.widget-view+json": {
566
+ "model_id": "20f913f0caf8401098743b9e5051fc52",
567
  "version_major": 2,
568
  "version_minor": 0
569
  },
570
  "text/plain": [
571
+ "HBox(children=(IntProgress(value=0, description='#4', max=24, style=ProgressStyle(description_width='initial')…"
572
  ]
573
  },
574
  "metadata": {},
577
  {
578
  "data": {
579
  "application/vnd.jupyter.widget-view+json": {
580
+ "model_id": "7c7e15e24384494cb49a72106ce41ccd",
581
  "version_major": 2,
582
  "version_minor": 0
583
  },
584
  "text/plain": [
585
+ "HBox(children=(IntProgress(value=0, description='#6', max=24, style=ProgressStyle(description_width='initial')…"
586
  ]
587
  },
588
  "metadata": {},
591
  {
592
  "data": {
593
  "application/vnd.jupyter.widget-view+json": {
594
+ "model_id": "73245add55e24ee2a6dbe0713d5073d9",
595
  "version_major": 2,
596
  "version_minor": 0
597
  },
623
  },
624
  {
625
  "cell_type": "code",
626
+ "execution_count": 12,
627
  "metadata": {
628
  "ExecuteTime": {
629
+ "end_time": "2021-03-17T11:14:12.721500Z",
630
+ "start_time": "2021-03-17T11:14:08.198478Z"
631
  }
632
  },
633
  "outputs": [
635
  "name": "stderr",
636
  "output_type": "stream",
637
  "text": [
638
+ "Using custom data configuration el-ac779bf2c9f7c09b\n"
639
+ ]
640
+ },
641
+ {
642
+ "name": "stdout",
643
+ "output_type": "stream",
644
+ "text": [
645
+ "Downloading and preparing dataset common_voice/el (download: 363.89 MiB, generated: 4.75 MiB, post-processed: Unknown size, total: 368.64 MiB) to /home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f...\n"
646
+ ]
647
+ },
648
+ {
649
+ "data": {
650
+ "application/vnd.jupyter.widget-view+json": {
651
+ "model_id": "",
652
+ "version_major": 2,
653
+ "version_minor": 0
654
+ },
655
+ "text/plain": [
656
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
657
+ ]
658
+ },
659
+ "metadata": {},
660
+ "output_type": "display_data"
661
+ },
662
+ {
663
+ "name": "stdout",
664
+ "output_type": "stream",
665
+ "text": [
666
+ "\r"
667
+ ]
668
+ },
669
+ {
670
+ "data": {
671
+ "application/vnd.jupyter.widget-view+json": {
672
+ "model_id": "",
673
+ "version_major": 2,
674
+ "version_minor": 0
675
+ },
676
+ "text/plain": [
677
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
678
+ ]
679
+ },
680
+ "metadata": {},
681
+ "output_type": "display_data"
682
+ },
683
+ {
684
+ "name": "stdout",
685
+ "output_type": "stream",
686
+ "text": [
687
+ "\r"
688
+ ]
689
+ },
690
+ {
691
+ "data": {
692
+ "application/vnd.jupyter.widget-view+json": {
693
+ "model_id": "",
694
+ "version_major": 2,
695
+ "version_minor": 0
696
+ },
697
+ "text/plain": [
698
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
699
+ ]
700
+ },
701
+ "metadata": {},
702
+ "output_type": "display_data"
703
+ },
704
+ {
705
+ "name": "stdout",
706
+ "output_type": "stream",
707
+ "text": [
708
+ "\r"
709
+ ]
710
+ },
711
+ {
712
+ "data": {
713
+ "application/vnd.jupyter.widget-view+json": {
714
+ "model_id": "",
715
+ "version_major": 2,
716
+ "version_minor": 0
717
+ },
718
+ "text/plain": [
719
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
720
+ ]
721
+ },
722
+ "metadata": {},
723
+ "output_type": "display_data"
724
+ },
725
+ {
726
+ "name": "stdout",
727
+ "output_type": "stream",
728
+ "text": [
729
+ "\r"
730
+ ]
731
+ },
732
+ {
733
+ "data": {
734
+ "application/vnd.jupyter.widget-view+json": {
735
+ "model_id": "",
736
+ "version_major": 2,
737
+ "version_minor": 0
738
+ },
739
+ "text/plain": [
740
+ "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))"
741
+ ]
742
+ },
743
+ "metadata": {},
744
+ "output_type": "display_data"
745
+ },
746
+ {
747
+ "name": "stdout",
748
+ "output_type": "stream",
749
+ "text": [
750
+ "\r",
751
+ "Dataset common_voice downloaded and prepared to /home/earendil/.cache/huggingface/datasets/common_voice/el-ac779bf2c9f7c09b/6.1.0/0041e06ab061b91d0a23234a2221e87970a19cf3a81b20901474cffffeb7869f. Subsequent calls will reuse this data.\n"
752
  ]
753
  }
754
  ],
809
  "# πού θέλεις να πάμε; ρώτησε φοβισμένα ο βασιλιάς."
810
  ]
811
  },
812
+ {
813
+ "cell_type": "code",
814
+ "execution_count": 13,
815
+ "metadata": {
816
+ "ExecuteTime": {
817
+ "end_time": "2021-03-17T11:15:35.637739Z",
818
+ "start_time": "2021-03-17T11:14:14.689842Z"
819
+ }
820
+ },
821
+ "outputs": [
822
+ {
823
+ "data": {
824
+ "application/vnd.jupyter.widget-view+json": {
825
+ "model_id": "1f7ba9e12187401f870555d20a6a9458",
826
+ "version_major": 2,
827
+ "version_minor": 0
828
+ },
829
+ "text/plain": [
830
+ "HBox(children=(IntProgress(value=0, max=1522), HTML(value='')))"
831
+ ]
832
+ },
833
+ "metadata": {},
834
+ "output_type": "display_data"
835
+ },
836
+ {
837
+ "name": "stdout",
838
+ "output_type": "stream",
839
+ "text": [
840
+ "\n"
841
+ ]
842
+ }
843
+ ],
844
+ "source": [
845
+ "def map_to_result(batch):\n",
846
+ " model.to(\"cuda\")\n",
847
+ " input_values = processor(\n",
848
+ " batch[\"input_values\"], \n",
849
+ " sampling_rate=16_000, \n",
850
+ " return_tensors=\"pt\"\n",
851
+ " ).input_values.to(\"cuda\")\n",
852
+ "\n",
853
+ " with torch.no_grad():\n",
854
+ " logits = model(input_values).logits\n",
855
+ "\n",
856
+ " pred_ids = torch.argmax(logits, dim=-1)\n",
857
+ " batch[\"pred_str\"] = processor.batch_decode(pred_ids)[0]\n",
858
+ "\n",
859
+ " return batch\n",
860
+ "\n",
861
+ "results = common_voice_test.map(map_to_result)\n"
862
+ ]
863
+ },
864
+ {
865
+ "cell_type": "code",
866
+ "execution_count": 16,
867
+ "metadata": {
868
+ "ExecuteTime": {
869
+ "end_time": "2021-03-17T11:17:11.951524Z",
870
+ "start_time": "2021-03-17T11:17:08.856552Z"
871
+ }
872
+ },
873
+ "outputs": [
874
+ {
875
+ "name": "stdout",
876
+ "output_type": "stream",
877
+ "text": [
878
+ "Test WER: 0.396\n"
879
+ ]
880
+ }
881
+ ],
882
+ "source": [
883
+ "def compute_metrics(pred):\n",
884
+ " pred_logits = pred.predictions\n",
885
+ " pred_ids = np.argmax(pred_logits, axis=-1)\n",
886
+ "\n",
887
+ " pred.label_ids[pred.label_ids == -100] = processor.tokenizer.pad_token_id\n",
888
+ "\n",
889
+ " pred_str = processor.batch_decode(pred_ids)\n",
890
+ " # we do not want to group tokens when computing the metrics\n",
891
+ " label_str = processor.batch_decode(pred.label_ids, group_tokens=False)\n",
892
+ "\n",
893
+ " wer = wer_metric.compute(predictions=pred_str, references=label_str)\n",
894
+ "\n",
895
+ " return {\"wer\": wer}\n",
896
+ "\n",
897
+ "wer_metric = load_metric(\"wer\")\n",
898
+ "\n",
899
+ "print(\"Test WER: {:.3f}\".format(wer_metric.compute(predictions=results[\"pred_str\"], references= [item.lower() for item in common_voice_test_transcription['sentence']])))"
900
+ ]
901
+ },
902
  {
903
  "cell_type": "code",
904
  "execution_count": null,
README.md CHANGED
@@ -21,7 +21,7 @@ model-index:
21
  metrics:
22
  - name: Test WER
23
  type: wer
24
- value: 31.05
25
  ---
26
 
27
  # Greek (el) version of the XLSR-Wav2Vec2 automatic speech recognition (ASR) model
@@ -29,12 +29,14 @@ model-index:
29
 
30
  * language: el
31
  * licence: apache-2.0
32
- * dataset: CommonVoice (EL), 364MB: https://commonvoice.mozilla.org/el/datasets
33
- * model: XLSR-Wav2Vec2, trained for 60 epochs
34
  * metrics: Word Error Rate (WER)
35
 
36
  ## Model description
37
 
 
 
38
  Wav2Vec2 is a pretrained model for Automatic Speech Recognition (ASR) and was released in September 2020 by Alexei Baevski, Michael Auli, and Alex Conneau. Soon after the superior performance of Wav2Vec2 was demonstrated on the English ASR dataset LibriSpeech, Facebook AI presented XLSR-Wav2Vec2. XLSR stands for cross-lingual speech representations and refers to XLSR-Wav2Vec2's ability to learn speech representations that are useful across multiple languages.
39
 
40
  Similar to Wav2Vec2, XLSR-Wav2Vec2 learns powerful speech representations from hundreds of thousands of hours of unlabeled speech in more than 50 languages. Similar to BERT's masked language modeling, the model learns contextualized speech representations by randomly masking feature vectors before passing them to a transformer network.
@@ -189,7 +191,7 @@ result = test_dataset.map(evaluate, batched=True, batch_size=8)
189
  print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"], references=result["sentence"])))
190
  ```
191
 
192
- **Test Result**: 31.05 %
193
 
194
  ### How to use for training:
195
 
@@ -200,9 +202,9 @@ Instructions and code to replicate the process are provided in the Fine_Tune_XLS
200
 
201
  | Metric | Value |
202
  | ----------- | ----------- |
203
- | Training Loss | 0.0287 |
204
  | Validation Loss | 0.6062 |
205
- | WER on CommonVoice Test *| 0.3105 |
206
  * Reference transcripts were lower-cased and stripped of punctuation and special characters.
207
 
208
  Full metrics log here:
21
  metrics:
22
  - name: Test WER
23
  type: wer
24
+ value: 10.497628
25
  ---
26
 
27
  # Greek (el) version of the XLSR-Wav2Vec2 automatic speech recognition (ASR) model
29
 
30
  * language: el
31
  * licence: apache-2.0
32
+ * dataset: CommonVoice (EL), 364MB: https://commonvoice.mozilla.org/el/datasets + CSS10 (EL), 1.22GB: https://github.com/Kyubyong/css10
33
+ * model: XLSR-Wav2Vec2, trained for 50 epochs
34
  * metrics: Word Error Rate (WER)
35
 
36
  ## Model description
37
 
38
+ UPDATE: We repeated the fine-tuning process using an additional 1.22GB dataset from CSS10.
39
+
40
  Wav2Vec2 is a pretrained model for Automatic Speech Recognition (ASR) and was released in September 2020 by Alexei Baevski, Michael Auli, and Alex Conneau. Soon after the superior performance of Wav2Vec2 was demonstrated on the English ASR dataset LibriSpeech, Facebook AI presented XLSR-Wav2Vec2. XLSR stands for cross-lingual speech representations and refers to XLSR-Wav2Vec2's ability to learn speech representations that are useful across multiple languages.
41
 
42
  Similar to Wav2Vec2, XLSR-Wav2Vec2 learns powerful speech representations from hundreds of thousands of hours of unlabeled speech in more than 50 languages. Similar to BERT's masked language modeling, the model learns contextualized speech representations by randomly masking feature vectors before passing them to a transformer network.
191
  print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"], references=result["sentence"])))
192
  ```
193
 
194
+ **Test Result**: 10.497628 %
195
 
196
  ### How to use for training:
197
 
202
 
203
  | Metric | Value |
204
  | ----------- | ----------- |
205
+ | Training Loss | 0.0545 |
206
  | Validation Loss | 0.6062 |
207
+ | WER on CommonVoice Test (%) *| 10.497628 |
208
  * Reference transcripts were lower-cased and stripped of punctuation and special characters.
209
 
210
  Full metrics log here:
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429242.mp3 DELETED
Binary file (55.5 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429243.mp3 DELETED
Binary file (50.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429245.mp3 DELETED
Binary file (46.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429246.mp3 DELETED
Binary file (34.4 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429247.mp3 DELETED
Binary file (48.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429253.mp3 DELETED
Binary file (45.9 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429254.mp3 DELETED
Binary file (32.5 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429255.mp3 DELETED
Binary file (33.5 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429256.mp3 DELETED
Binary file (48.8 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429257.mp3 DELETED
Binary file (47.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429268.mp3 DELETED
Binary file (43.4 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429269.mp3 DELETED
Binary file (27.1 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429270.mp3 DELETED
Binary file (36.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429271.mp3 DELETED
Binary file (25.8 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429272.mp3 DELETED
Binary file (27.1 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429278.mp3 DELETED
Binary file (33.5 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429280.mp3 DELETED
Binary file (24.8 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429283.mp3 DELETED
Binary file (22.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429285.mp3 DELETED
Binary file (26.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429288.mp3 DELETED
Binary file (36.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429298.mp3 DELETED
Binary file (31 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429299.mp3 DELETED
Binary file (37.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429300.mp3 DELETED
Binary file (26.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429301.mp3 DELETED
Binary file (30.6 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429302.mp3 DELETED
Binary file (20 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429308.mp3 DELETED
Binary file (27.1 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429309.mp3 DELETED
Binary file (35.8 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429310.mp3 DELETED
Binary file (36.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429312.mp3 DELETED
Binary file (44 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429314.mp3 DELETED
Binary file (34.4 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429328.mp3 DELETED
Binary file (27.1 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429329.mp3 DELETED
Binary file (25.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429330.mp3 DELETED
Binary file (37.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429331.mp3 DELETED
Binary file (28.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429332.mp3 DELETED
Binary file (41.5 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429407.mp3 DELETED
Binary file (38.6 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429408.mp3 DELETED
Binary file (41.1 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429410.mp3 DELETED
Binary file (45.9 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429411.mp3 DELETED
Binary file (36.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429412.mp3 DELETED
Binary file (40.6 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429418.mp3 DELETED
Binary file (46.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429419.mp3 DELETED
Binary file (25.2 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429420.mp3 DELETED
Binary file (46.3 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429421.mp3 DELETED
Binary file (27.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429422.mp3 DELETED
Binary file (38.6 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429438.mp3 DELETED
Binary file (27.7 kB)
cv-corpus-6.1-2020-12-11/el/clips/common_voice_el_20429439.mp3 DELETED
Binary file (30 kB)