emilios commited on
Commit
d6004cb
1 Parent(s): d0a02bf

End of training

Browse files
Files changed (17) hide show
  1. e5_interleaving-cl.ipynb +137 -253
  2. e5_interleaving-resume.ipynb +0 -0
  3. pytorch_model.bin +1 -1
  4. runs/Dec13_21-29-08_129-146-102-49/1670966960.518305/events.out.tfevents.1670966960.129-146-102-49.882304.1 +3 -0
  5. runs/Dec13_21-29-08_129-146-102-49/events.out.tfevents.1670966960.129-146-102-49.882304.0 +3 -0
  6. runs/Dec13_21-57-38_129-146-102-49/1670968669.9597044/events.out.tfevents.1670968669.129-146-102-49.882304.3 +3 -0
  7. runs/Dec13_21-57-38_129-146-102-49/events.out.tfevents.1670968669.129-146-102-49.882304.2 +3 -0
  8. runs/Dec13_22-18-00_129-146-102-49/1670969892.775061/events.out.tfevents.1670969892.129-146-102-49.1014402.1 +3 -0
  9. runs/Dec13_22-18-00_129-146-102-49/1670995449.379962/events.out.tfevents.1670995449.129-146-102-49.1014402.2 +3 -0
  10. runs/Dec13_22-18-00_129-146-102-49/events.out.tfevents.1670969892.129-146-102-49.1014402.0 +3 -0
  11. runs/Dec14_05-46-08_129-146-102-49/1670996781.2697837/events.out.tfevents.1670996781.129-146-102-49.1113148.1 +3 -0
  12. runs/Dec14_05-46-08_129-146-102-49/events.out.tfevents.1670996781.129-146-102-49.1113148.0 +3 -0
  13. runs/Dec14_09-33-49_129-146-102-49/1671010439.939292/events.out.tfevents.1671010439.129-146-102-49.1212260.1 +3 -0
  14. runs/Dec14_09-33-49_129-146-102-49/events.out.tfevents.1671010439.129-146-102-49.1212260.0 +3 -0
  15. runs/Dec14_10-24-09_129-146-102-49/1671013461.8981154/events.out.tfevents.1671013461.129-146-102-49.1508853.1 +3 -0
  16. runs/Dec14_10-24-09_129-146-102-49/events.out.tfevents.1671013461.129-146-102-49.1508853.0 +3 -0
  17. training_args.bin +1 -1
e5_interleaving-cl.ipynb CHANGED
@@ -125,20 +125,20 @@
125
  "Requirement already satisfied: torch in ./.local/lib/python3.8/site-packages (1.13.0)\n",
126
  "Requirement already satisfied: torchaudio in ./.local/lib/python3.8/site-packages (0.13.0)\n",
127
  "Requirement already satisfied: torchvision in ./.local/lib/python3.8/site-packages (0.14.0)\n",
 
 
128
  "Requirement already satisfied: nvidia-cublas-cu11==11.10.3.66 in ./.local/lib/python3.8/site-packages (from torch) (11.10.3.66)\n",
129
- "Requirement already satisfied: nvidia-cuda-nvrtc-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
130
  "Requirement already satisfied: typing-extensions in ./.local/lib/python3.8/site-packages (from torch) (4.4.0)\n",
131
- "Requirement already satisfied: nvidia-cudnn-cu11==8.5.0.96 in ./.local/lib/python3.8/site-packages (from torch) (8.5.0.96)\n",
132
- "Requirement already satisfied: nvidia-cuda-runtime-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
133
- "Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (45.2.0)\n",
134
  "Requirement already satisfied: wheel in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (0.34.2)\n",
135
- "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from torchvision) (2.28.1)\n",
136
  "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/lib/python3/dist-packages (from torchvision) (7.0.0)\n",
 
137
  "Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from torchvision) (1.23.5)\n",
138
- "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (1.26.13)\n",
139
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->torchvision) (2019.11.28)\n",
140
- "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->torchvision) (2.8)\n",
141
- "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (2.1.1)\n"
 
142
  ]
143
  }
144
  ],
@@ -200,7 +200,7 @@
200
  "name": "stdout",
201
  "output_type": "stream",
202
  "text": [
203
- "Tue Dec 13 19:10:09 2022 \n",
204
  "+-----------------------------------------------------------------------------+\n",
205
  "| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
206
  "|-------------------------------+----------------------+----------------------+\n",
@@ -209,7 +209,7 @@
209
  "| | | MIG M. |\n",
210
  "|===============================+======================+======================|\n",
211
  "| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
212
- "| N/A 31C P0 46W / 400W | 0MiB / 40960MiB | 0% Default |\n",
213
  "| | | Disabled |\n",
214
  "+-------------------------------+----------------------+----------------------+\n",
215
  " \n",
@@ -260,42 +260,43 @@
260
  "name": "stdout",
261
  "output_type": "stream",
262
  "text": [
263
- "Hit:1 https://download.docker.com/linux/ubuntu focal InRelease\n",
264
- "Get:2 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
265
- "Hit:3 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
266
- "Get:4 https://packages.cloud.google.com/apt cloud-sdk InRelease [6751 B] \n",
267
- "Hit:5 http://archive.lambdalabs.com/ubuntu focal InRelease \n",
268
- "Get:6 http://security.ubuntu.com/ubuntu focal-security InRelease [114 kB] \n",
269
- "Hit:7 https://packages.microsoft.com/repos/azure-cli focal InRelease \n",
270
- "Get:8 https://packages.cloud.google.com/apt cloud-sdk/main amd64 Packages [368 kB]\n",
271
  "Ign:9 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \n",
272
- "Hit:10 http://archive.ubuntu.com/ubuntu focal InRelease \n",
273
  "Hit:11 https://pkg.cloudflare.com/cloudflared focal InRelease \n",
274
- "Get:12 http://archive.ubuntu.com/ubuntu focal-updates InRelease [114 kB] \n",
275
- "Err:13 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release \n",
276
  " 404 Not Found [IP: 185.125.190.52 80]\n",
277
- "Hit:14 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease \n",
278
- "Get:15 http://archive.ubuntu.com/ubuntu focal-backports InRelease [108 kB]\n",
279
- "Reading package lists... Done \n",
 
 
280
  "E: The repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\n",
281
  "N: Updating from such a repository can't be done securely, and is therefore disabled by default.\n",
282
  "N: See apt-secure(8) manpage for repository creation and user configuration details.\n",
283
- "Hit:1 https://download.docker.com/linux/ubuntu focal InRelease\n",
284
- "Get:2 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
285
- "Hit:3 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
286
  "Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \u001b[0m\n",
287
- "Get:5 http://security.ubuntu.com/ubuntu focal-security InRelease [114 kB] \u001b[0m\u001b[33m\n",
288
- "Hit:6 https://packages.microsoft.com/repos/azure-cli focal InRelease \u001b[0m\u001b[33m\n",
289
- "Hit:7 https://packages.cloud.google.com/apt cloud-sdk InRelease \u001b[0m\u001b[33m\n",
290
- "Ign:8 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \u001b[0m\n",
291
- "Hit:9 http://archive.ubuntu.com/ubuntu focal InRelease \u001b[0m\u001b[33m\n",
292
- "Hit:10 https://pkg.cloudflare.com/cloudflared focal InRelease \u001b[0m\u001b[33m\n",
293
- "Get:11 http://archive.ubuntu.com/ubuntu focal-updates InRelease [114 kB] \u001b[0m\n",
294
- "Err:12 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release \u001b[0m\u001b[33m\u001b[33m\u001b[33m\n",
 
295
  " 404 Not Found [IP: 185.125.190.52 80]\n",
296
- "Hit:13 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease \n",
297
- "Get:14 http://archive.ubuntu.com/ubuntu focal-backports InRelease [108 kB]\n",
298
- "Reading package lists... Done \u001b[0m33m\u001b[33m\u001b[33m\n",
299
  "\u001b[1;31mE: \u001b[0mThe repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\u001b[0m\n",
300
  "\u001b[33mN: \u001b[0mUpdating from such a repository can't be done securely, and is therefore disabled by default.\u001b[0m\n",
301
  "\u001b[33mN: \u001b[0mSee apt-secure(8) manpage for repository creation and user configuration details.\u001b[0m\n",
@@ -346,33 +347,33 @@
346
  "text": [
347
  "Defaulting to user installation because normal site-packages is not writeable\n",
348
  "Collecting git+https://github.com/huggingface/datasets\n",
349
- " Cloning https://github.com/huggingface/datasets to /tmp/pip-req-build-4yfcrkqv\n",
350
- " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/datasets /tmp/pip-req-build-4yfcrkqv\n",
351
  " Resolved https://github.com/huggingface/datasets to commit c902456677116a081f762fa2b4aad13a0aa04d6e\n",
352
  " Installing build dependencies ... \u001b[?25ldone\n",
353
  "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
354
  "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
355
  "\u001b[?25hRequirement already satisfied: dill<0.3.7 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.3.6)\n",
 
 
 
356
  "Requirement already satisfied: packaging in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (22.0)\n",
357
  "Requirement already satisfied: xxhash in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.1.0)\n",
358
- "Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.8.3)\n",
359
- "Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.23.5)\n",
360
- "Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.5.1)\n",
361
- "Requirement already satisfied: fsspec[http]>=2021.11.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2022.11.0)\n",
362
- "Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from datasets==2.7.1.dev0) (5.3.1)\n",
363
  "Requirement already satisfied: responses<0.19 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.18.0)\n",
 
 
 
364
  "Requirement already satisfied: tqdm>=4.62.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (4.64.1)\n",
365
- "Requirement already satisfied: pyarrow>=6.0.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (10.0.1)\n",
366
- "Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2.28.1)\n",
367
  "Requirement already satisfied: huggingface-hub<1.0.0,>=0.2.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.11.1)\n",
368
- "Requirement already satisfied: multiprocess in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.70.14)\n",
369
- "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (2.1.1)\n",
370
- "Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (6.0.3)\n",
371
- "Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.3)\n",
372
- "Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.1)\n",
373
  "Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.8.2)\n",
374
- "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (4.0.2)\n",
 
375
  "Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->datasets==2.7.1.dev0) (19.3.0)\n",
 
 
 
376
  "Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (3.0.12)\n",
377
  "Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (4.4.0)\n",
378
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->datasets==2.7.1.dev0) (2019.11.28)\n",
@@ -383,49 +384,49 @@
383
  "Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.8.1->pandas->datasets==2.7.1.dev0) (1.14.0)\n",
384
  "Defaulting to user installation because normal site-packages is not writeable\n",
385
  "Collecting git+https://github.com/huggingface/transformers\n",
386
- " Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-kaly439h\n",
387
- " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-kaly439h\n",
388
- " Resolved https://github.com/huggingface/transformers to commit ba9da49aa298345022f35a0b7be44ce4c72b85c2\n",
389
  " Installing build dependencies ... \u001b[?25ldone\n",
390
  "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
391
  "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
392
- "\u001b[?25hRequirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (22.0)\n",
393
- "Requirement already satisfied: regex!=2019.12.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2022.10.31)\n",
394
- "Requirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.13.2)\n",
395
  "Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (1.23.5)\n",
 
396
  "Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (5.3.1)\n",
397
  "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2.28.1)\n",
398
- "Requirement already satisfied: huggingface-hub<1.0,>=0.10.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.11.1)\n",
399
  "Requirement already satisfied: tqdm>=4.27 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (4.64.1)\n",
400
- "Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (3.0.12)\n",
401
  "Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.10.0->transformers==4.26.0.dev0) (4.4.0)\n",
402
- "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (1.26.13)\n",
403
- "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2019.11.28)\n",
404
- "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2.8)\n",
405
  "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (2.1.1)\n",
 
 
 
406
  "Defaulting to user installation because normal site-packages is not writeable\n",
407
  "Requirement already satisfied: librosa in ./.local/lib/python3.8/site-packages (0.9.2)\n",
 
408
  "Requirement already satisfied: joblib>=0.14 in ./.local/lib/python3.8/site-packages (from librosa) (1.2.0)\n",
 
 
 
409
  "Requirement already satisfied: decorator>=4.0.10 in /usr/lib/python3/dist-packages (from librosa) (4.4.2)\n",
410
- "Requirement already satisfied: scipy>=1.2.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.9.3)\n",
411
- "Requirement already satisfied: numba>=0.45.1 in ./.local/lib/python3.8/site-packages (from librosa) (0.56.4)\n",
412
  "Requirement already satisfied: audioread>=2.1.9 in ./.local/lib/python3.8/site-packages (from librosa) (3.0.0)\n",
413
- "Requirement already satisfied: pooch>=1.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.6.0)\n",
 
414
  "Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from librosa) (22.0)\n",
415
- "Requirement already satisfied: numpy>=1.17.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.23.5)\n",
416
- "Requirement already satisfied: scikit-learn>=0.19.1 in /usr/lib/python3/dist-packages (from librosa) (0.22.2.post1)\n",
417
  "Requirement already satisfied: resampy>=0.2.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.4.2)\n",
418
- "Requirement already satisfied: soundfile>=0.10.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.11.0)\n",
419
  "Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from numba>=0.45.1->librosa) (45.2.0)\n",
420
- "Requirement already satisfied: importlib-metadata in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (5.0.0)\n",
421
  "Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (0.39.1)\n",
422
- "Requirement already satisfied: appdirs>=1.3.0 in /usr/lib/python3/dist-packages (from pooch>=1.0->librosa) (1.4.3)\n",
423
  "Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.28.1)\n",
 
424
  "Requirement already satisfied: cffi>=1.0 in /usr/lib/python3/dist-packages (from soundfile>=0.10.2->librosa) (1.14.0)\n",
425
- "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.26.13)\n",
426
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2019.11.28)\n",
427
- "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.1.1)\n",
428
  "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.8)\n",
 
 
429
  "Requirement already satisfied: zipp>=0.5 in /usr/lib/python3/dist-packages (from importlib-metadata->numba>=0.45.1->librosa) (1.0.0)\n",
430
  "Defaulting to user installation because normal site-packages is not writeable\n",
431
  "Requirement already satisfied: jiwer in ./.local/lib/python3.8/site-packages (2.5.1)\n",
@@ -433,59 +434,59 @@
433
  "Requirement already satisfied: rapidfuzz<3.0.0,>=2.3.0 in ./.local/lib/python3.8/site-packages (from levenshtein==0.20.2->jiwer) (2.13.6)\n",
434
  "Defaulting to user installation because normal site-packages is not writeable\n",
435
  "Requirement already satisfied: gradio in ./.local/lib/python3.8/site-packages (3.13.0)\n",
436
- "Requirement already satisfied: fastapi in ./.local/lib/python3.8/site-packages (from gradio) (0.88.0)\n",
437
- "Requirement already satisfied: uvicorn in ./.local/lib/python3.8/site-packages (from gradio) (0.20.0)\n",
438
- "Requirement already satisfied: markdown-it-py[linkify,plugins] in ./.local/lib/python3.8/site-packages (from gradio) (2.1.0)\n",
439
- "Requirement already satisfied: pillow in /usr/lib/python3/dist-packages (from gradio) (7.0.0)\n",
440
- "Requirement already satisfied: paramiko in ./.local/lib/python3.8/site-packages (from gradio) (2.12.0)\n",
441
  "Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
442
- "Requirement already satisfied: matplotlib in ./.local/lib/python3.8/site-packages (from gradio) (3.5.3)\n",
443
- "Requirement already satisfied: fsspec in ./.local/lib/python3.8/site-packages (from gradio) (2022.11.0)\n",
444
- "Requirement already satisfied: websockets>=10.0 in ./.local/lib/python3.8/site-packages (from gradio) (10.4)\n",
445
  "Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from gradio) (1.5.1)\n",
446
- "Requirement already satisfied: httpx in ./.local/lib/python3.8/site-packages (from gradio) (0.23.1)\n",
447
- "Requirement already satisfied: python-multipart in ./.local/lib/python3.8/site-packages (from gradio) (0.0.5)\n",
448
- "Requirement already satisfied: jinja2 in ./.local/lib/python3.8/site-packages (from gradio) (3.1.2)\n",
449
- "Requirement already satisfied: orjson in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
450
- "Requirement already satisfied: ffmpy in ./.local/lib/python3.8/site-packages (from gradio) (0.3.0)\n",
451
- "Requirement already satisfied: pydantic in ./.local/lib/python3.8/site-packages (from gradio) (1.10.2)\n",
452
  "Requirement already satisfied: pydub in ./.local/lib/python3.8/site-packages (from gradio) (0.25.1)\n",
 
 
 
 
 
 
453
  "Requirement already satisfied: h11<0.13,>=0.11 in ./.local/lib/python3.8/site-packages (from gradio) (0.12.0)\n",
454
- "Requirement already satisfied: pyyaml in /usr/lib/python3/dist-packages (from gradio) (5.3.1)\n",
455
  "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from gradio) (2.28.1)\n",
 
 
 
 
 
 
 
 
 
456
  "Requirement already satisfied: pycryptodome in ./.local/lib/python3.8/site-packages (from gradio) (3.16.0)\n",
457
- "Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from gradio) (1.23.5)\n",
458
- "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (2.1.1)\n",
459
- "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (4.0.2)\n",
460
  "Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.3)\n",
461
  "Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->gradio) (19.3.0)\n",
462
- "Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (6.0.3)\n",
 
463
  "Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.8.2)\n",
464
- "Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.1)\n",
465
  "Requirement already satisfied: starlette==0.22.0 in ./.local/lib/python3.8/site-packages (from fastapi->gradio) (0.22.0)\n",
466
  "Requirement already satisfied: typing-extensions>=3.10.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (4.4.0)\n",
467
  "Requirement already satisfied: anyio<5,>=3.4.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (3.6.2)\n",
468
- "Requirement already satisfied: httpcore<0.17.0,>=0.15.0 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (0.15.0)\n",
469
- "Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from httpx->gradio) (2019.11.28)\n",
470
  "Requirement already satisfied: rfc3986[idna2008]<2,>=1.3 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.5.0)\n",
471
  "Requirement already satisfied: sniffio in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.3.0)\n",
 
 
472
  "Requirement already satisfied: MarkupSafe>=2.0 in ./.local/lib/python3.8/site-packages (from jinja2->gradio) (2.1.1)\n",
473
  "Requirement already satisfied: mdurl~=0.1 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.1.2)\n",
474
- "Requirement already satisfied: mdit-py-plugins in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.3.3)\n",
475
  "Requirement already satisfied: linkify-it-py~=1.0 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (1.0.3)\n",
476
- "Requirement already satisfied: fonttools>=4.22.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (4.38.0)\n",
 
477
  "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (1.0.1)\n",
478
- "Requirement already satisfied: pyparsing>=2.2.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (2.4.6)\n",
479
  "Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (22.0)\n",
480
- "Requirement already satisfied: python-dateutil>=2.7 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (2.8.2)\n",
481
  "Requirement already satisfied: cycler>=0.10 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (0.10.0)\n",
 
 
482
  "Requirement already satisfied: pytz>=2020.1 in ./.local/lib/python3.8/site-packages (from pandas->gradio) (2022.5)\n",
 
483
  "Requirement already satisfied: six in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.14.0)\n",
484
  "Requirement already satisfied: pynacl>=1.0.1 in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.3.0)\n",
485
- "Requirement already satisfied: bcrypt>=3.1.3 in ./.local/lib/python3.8/site-packages (from paramiko->gradio) (4.0.1)\n",
486
  "Requirement already satisfied: cryptography>=2.5 in /usr/lib/python3/dist-packages (from paramiko->gradio) (2.8)\n",
487
- "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->gradio) (2.8)\n",
488
  "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->gradio) (1.26.13)\n",
 
489
  "Requirement already satisfied: click>=7.0 in /usr/lib/python3/dist-packages (from uvicorn->gradio) (7.0)\n",
490
  "Requirement already satisfied: uc-micro-py in ./.local/lib/python3.8/site-packages (from linkify-it-py~=1.0->markdown-it-py[linkify,plugins]->gradio) (1.0.1)\n",
491
  "Defaulting to user installation because normal site-packages is not writeable\n",
@@ -554,7 +555,7 @@
554
  {
555
  "data": {
556
  "application/vnd.jupyter.widget-view+json": {
557
- "model_id": "1ac74505b6d84e499c03b22286c4baa9",
558
  "version_major": 2,
559
  "version_minor": 0
560
  },
@@ -713,7 +714,7 @@
713
  " all_datasets = []\n",
714
  " # iterate over the datasets we want to interleave\n",
715
  " for i, dataset_name in enumerate(dataset_names):\n",
716
- " dataset = load_dataset(dataset_name, dataset_config_names[i], split=splits[i], streaming=True, **kwargs)\n",
717
  " # resample to specified sampling rate\n",
718
  " dataset = dataset.cast_column(\"audio\", Audio(sampling_rate))\n",
719
  " # normalise columns to [\"audio\", \"sentence\"]\n",
@@ -738,16 +739,7 @@
738
  "id": "qOwlctMhNmCG",
739
  "tags": []
740
  },
741
- "outputs": [
742
- {
743
- "name": "stderr",
744
- "output_type": "stream",
745
- "text": [
746
- "Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n",
747
- "Found cached dataset fleurs (/home/ubuntu/.cache/huggingface/datasets/google___fleurs/el_gr/2.0.0/aabb39fb29739c495517ac904e2886819b6e344702f0a5b5283cb178b087c94a)\n"
748
- ]
749
- }
750
- ],
751
  "source": [
752
  "ds = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
753
  "\n"
@@ -770,23 +762,13 @@
770
  "metadata": {
771
  "id": "imRHJOpm4V_j"
772
  },
773
- "outputs": [
774
- {
775
- "name": "stderr",
776
- "output_type": "stream",
777
- "text": [
778
- "Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n",
779
- "Found cached dataset fleurs (/home/ubuntu/.cache/huggingface/datasets/google___fleurs/el_gr/2.0.0/aabb39fb29739c495517ac904e2886819b6e344702f0a5b5283cb178b087c94a)\n",
780
- "Found cached dataset common_voice_11_0 (/home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f)\n"
781
- ]
782
- }
783
- ],
784
  "source": [
785
  "from datasets import IterableDatasetDict\n",
786
  "raw_datasets = IterableDatasetDict()\n",
787
  "\n",
788
  "raw_datasets[\"train\"] = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
789
- "raw_datasets[\"test\"] = load_dataset(\"mozilla-foundation/common_voice_11_0\", \"el\", split=\"test\", streaming=True, use_auth_token=True)\n",
790
  "\n",
791
  "\n",
792
  "#raw_datasets = raw_datasets.remove_columns([\"accent\", \"age\", \"client_id\", \"down_votes\", \"gender\", \"locale\", \"path\", \"segment\", \"up_votes\"])\n",
@@ -1013,29 +995,7 @@
1013
  "metadata": {
1014
  "id": "a37a7cdb-9013-427f-8de9-6a8d0e9dc684"
1015
  },
1016
- "outputs": [
1017
- {
1018
- "data": {
1019
- "application/vnd.jupyter.widget-view+json": {
1020
- "model_id": "5eb200f925f84e14bc08341ee8620fd9",
1021
- "version_major": 2,
1022
- "version_minor": 0
1023
- },
1024
- "text/plain": [
1025
- " 0%| | 0/6430 [00:00<?, ?ex/s]"
1026
- ]
1027
- },
1028
- "metadata": {},
1029
- "output_type": "display_data"
1030
- },
1031
- {
1032
- "name": "stderr",
1033
- "output_type": "stream",
1034
- "text": [
1035
- "Loading cached processed dataset at /home/ubuntu/.cache/huggingface/datasets/mozilla-foundation___common_voice_11_0/el/11.0.0/f8e47235d9b4e68fa24ed71d63266a02018ccf7194b2a8c9c598a5f3ab304d9f/cache-52a8b70c074fdab6.arrow\n"
1036
- ]
1037
- }
1038
- ],
1039
  "source": [
1040
  "vectorized_datasets = raw_datasets.map(prepare_dataset, remove_columns=list(next(iter(raw_datasets.values())).features)).with_format(\"torch\")"
1041
  ]
@@ -1052,32 +1012,12 @@
1052
  },
1053
  {
1054
  "cell_type": "code",
1055
- "execution_count": 24,
1056
  "id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c",
1057
  "metadata": {
1058
  "id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c"
1059
  },
1060
- "outputs": [
1061
- {
1062
- "name": "stdout",
1063
- "output_type": "stream",
1064
- "text": [
1065
- "{'input_features': tensor([[-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
1066
- " [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
1067
- " [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
1068
- " ...,\n",
1069
- " [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
1070
- " [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154],\n",
1071
- " [-0.8154, -0.8154, -0.8154, ..., -0.8154, -0.8154, -0.8154]]), 'input_length': tensor(6.6000), 'labels': tensor([50258, 50281, 50359, 50363, 7068, 26263, 11383, 3596, 2080, 3659,\n",
1072
- " 10073, 30599, 5691, 6744, 8828, 11658, 3371, 17321, 30320, 11383,\n",
1073
- " 3659, 5337, 4339, 20511, 4915, 3371, 33908, 44035, 3721, 19264,\n",
1074
- " 25090, 7597, 17928, 24841, 8385, 3835, 4903, 2080, 2805, 8385,\n",
1075
- " 3721, 39320, 8335, 3596, 21457, 4339, 5074, 1800, 8715, 6956,\n",
1076
- " 1800, 5958, 14836, 8385, 1800, 34079, 8385, 16946, 8066, 5733,\n",
1077
- " 24296, 9137, 9903, 50257])}\n"
1078
- ]
1079
- }
1080
- ],
1081
  "source": [
1082
  "vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].shuffle(\n",
1083
  " #buffer_size=500,\n",
@@ -1100,7 +1040,7 @@
1100
  },
1101
  {
1102
  "cell_type": "code",
1103
- "execution_count": 25,
1104
  "id": "01cb25ef-4bb0-4325-9461-f59198acadf6",
1105
  "metadata": {
1106
  "id": "01cb25ef-4bb0-4325-9461-f59198acadf6"
@@ -1125,27 +1065,12 @@
1125
  },
1126
  {
1127
  "cell_type": "code",
1128
- "execution_count": 26,
1129
  "id": "333f7f6e-6053-4d3b-8924-c733c79b82ac",
1130
  "metadata": {
1131
  "id": "333f7f6e-6053-4d3b-8924-c733c79b82ac"
1132
  },
1133
- "outputs": [
1134
- {
1135
- "data": {
1136
- "application/vnd.jupyter.widget-view+json": {
1137
- "model_id": "aefbdf517ed24020b4fd372739f37e5f",
1138
- "version_major": 2,
1139
- "version_minor": 0
1140
- },
1141
- "text/plain": [
1142
- " 0%| | 0/7 [00:00<?, ?ba/s]"
1143
- ]
1144
- },
1145
- "metadata": {},
1146
- "output_type": "display_data"
1147
- }
1148
- ],
1149
  "source": [
1150
  "vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].filter(\n",
1151
  " is_audio_in_length_range,\n",
@@ -1220,7 +1145,7 @@
1220
  },
1221
  {
1222
  "cell_type": "code",
1223
- "execution_count": 27,
1224
  "id": "8326221e-ec13-4731-bb4e-51e5fc1486c5",
1225
  "metadata": {
1226
  "id": "8326221e-ec13-4731-bb4e-51e5fc1486c5"
@@ -1272,7 +1197,7 @@
1272
  },
1273
  {
1274
  "cell_type": "code",
1275
- "execution_count": 28,
1276
  "id": "fc834702-c0d3-4a96-b101-7b87be32bf42",
1277
  "metadata": {
1278
  "id": "fc834702-c0d3-4a96-b101-7b87be32bf42"
@@ -1305,7 +1230,7 @@
1305
  },
1306
  {
1307
  "cell_type": "code",
1308
- "execution_count": 29,
1309
  "id": "b22b4011-f31f-4b57-b684-c52332f92890",
1310
  "metadata": {
1311
  "colab": {
@@ -1356,7 +1281,7 @@
1356
  },
1357
  {
1358
  "cell_type": "code",
1359
- "execution_count": 30,
1360
  "id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb",
1361
  "metadata": {
1362
  "id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb"
@@ -1405,7 +1330,7 @@
1405
  },
1406
  {
1407
  "cell_type": "code",
1408
- "execution_count": 31,
1409
  "id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
1410
  "metadata": {
1411
  "colab": {
@@ -1443,21 +1368,7 @@
1443
  {
1444
  "data": {
1445
  "application/vnd.jupyter.widget-view+json": {
1446
- "model_id": "27fec52020a2407fa93dd57e98de8fc9",
1447
- "version_major": 2,
1448
- "version_minor": 0
1449
- },
1450
- "text/plain": [
1451
- "Downloading: 0%| | 0.00/1.04k [00:00<?, ?B/s]"
1452
- ]
1453
- },
1454
- "metadata": {},
1455
- "output_type": "display_data"
1456
- },
1457
- {
1458
- "data": {
1459
- "application/vnd.jupyter.widget-view+json": {
1460
- "model_id": "f8c10225aa194c909eeb19170ac75d1f",
1461
  "version_major": 2,
1462
  "version_minor": 0
1463
  },
@@ -1490,7 +1401,7 @@
1490
  },
1491
  {
1492
  "cell_type": "code",
1493
- "execution_count": 32,
1494
  "id": "62038ba3-88ed-4fce-84db-338f50dcd04f",
1495
  "metadata": {
1496
  "id": "62038ba3-88ed-4fce-84db-338f50dcd04f"
@@ -1527,7 +1438,7 @@
1527
  },
1528
  {
1529
  "cell_type": "code",
1530
- "execution_count": 33,
1531
  "id": "0ae3e9af-97b7-4aa0-ae85-20b23b5bcb3a",
1532
  "metadata": {
1533
  "colab": {
@@ -1570,7 +1481,7 @@
1570
  },
1571
  {
1572
  "cell_type": "code",
1573
- "execution_count": 34,
1574
  "id": "o72eOpGzD_sK",
1575
  "metadata": {
1576
  "colab": {
@@ -1584,7 +1495,7 @@
1584
  "name": "stdout",
1585
  "output_type": "stream",
1586
  "text": [
1587
- "Tue Dec 13 19:33:07 2022 \n",
1588
  "+-----------------------------------------------------------------------------+\n",
1589
  "| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
1590
  "|-------------------------------+----------------------+----------------------+\n",
@@ -1593,7 +1504,7 @@
1593
  "| | | MIG M. |\n",
1594
  "|===============================+======================+======================|\n",
1595
  "| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
1596
- "| N/A 31C P0 46W / 400W | 2MiB / 40960MiB | 0% Default |\n",
1597
  "| | | Disabled |\n",
1598
  "+-------------------------------+----------------------+----------------------+\n",
1599
  " \n",
@@ -1634,7 +1545,7 @@
1634
  },
1635
  {
1636
  "cell_type": "code",
1637
- "execution_count": 35,
1638
  "id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2",
1639
  "metadata": {
1640
  "id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2"
@@ -1667,7 +1578,7 @@
1667
  },
1668
  {
1669
  "cell_type": "code",
1670
- "execution_count": 36,
1671
  "id": "d546d7fe-0543-479a-b708-2ebabec19493",
1672
  "metadata": {
1673
  "colab": {
@@ -2281,7 +2192,7 @@
2281
  },
2282
  {
2283
  "cell_type": "code",
2284
- "execution_count": 37,
2285
  "id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672",
2286
  "metadata": {
2287
  "id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672"
@@ -2374,21 +2285,22 @@
2374
  "name": "stderr",
2375
  "output_type": "stream",
2376
  "text": [
2377
- "Loading model from ./whisper-medium-el/checkpoint-3000.\n",
2378
- "The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
2379
  "/home/ubuntu/.local/lib/python3.8/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
2380
  " warnings.warn(\n",
2381
  "***** Running training *****\n",
2382
- " Num examples = 6428\n",
2383
- " Num Epochs = 25\n",
2384
  " Instantaneous batch size per device = 32\n",
2385
  " Total train batch size (w. parallel, distributed & accumulation) = 32\n",
2386
  " Gradient Accumulation steps = 1\n",
2387
  " Total optimization steps = 5000\n",
2388
  " Number of trainable parameters = 763857920\n",
2389
  " Continuing training from checkpoint, will skip to saved global_step\n",
2390
- " Continuing training from epoch 14\n",
2391
- " Continuing training from global step 3000\n"
 
 
2392
  ]
2393
  },
2394
  {
@@ -2397,8 +2309,8 @@
2397
  "\n",
2398
  " <div>\n",
2399
  " \n",
2400
- " <progress value='4122' max='5000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
2401
- " [4122/5000 1:52:06 < 1:27:52, 0.17 it/s, Epoch 19.58/25]\n",
2402
  " </div>\n",
2403
  " <table border=\"1\" class=\"dataframe\">\n",
2404
  " <thead>\n",
@@ -2406,16 +2318,9 @@
2406
  " <th>Step</th>\n",
2407
  " <th>Training Loss</th>\n",
2408
  " <th>Validation Loss</th>\n",
2409
- " <th>Wer</th>\n",
2410
  " </tr>\n",
2411
  " </thead>\n",
2412
  " <tbody>\n",
2413
- " <tr>\n",
2414
- " <td>4000</td>\n",
2415
- " <td>0.000300</td>\n",
2416
- " <td>0.367278</td>\n",
2417
- " <td>11.534175</td>\n",
2418
- " </tr>\n",
2419
  " </tbody>\n",
2420
  "</table><p>"
2421
  ],
@@ -2425,27 +2330,6 @@
2425
  },
2426
  "metadata": {},
2427
  "output_type": "display_data"
2428
- },
2429
- {
2430
- "name": "stderr",
2431
- "output_type": "stream",
2432
- "text": [
2433
- "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: path, input_length, gender, accent, up_votes, client_id, locale, age, segment, down_votes. If path, input_length, gender, accent, up_votes, client_id, locale, age, segment, down_votes are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
2434
- "***** Running Evaluation *****\n",
2435
- " Num examples = 1696\n",
2436
- " Batch size = 16\n",
2437
- "Saving model checkpoint to ./whisper-medium-el/checkpoint-4000\n",
2438
- "Configuration saved in ./whisper-medium-el/checkpoint-4000/config.json\n",
2439
- "Model weights saved in ./whisper-medium-el/checkpoint-4000/pytorch_model.bin\n",
2440
- "Feature extractor saved in ./whisper-medium-el/checkpoint-4000/preprocessor_config.json\n",
2441
- "tokenizer config file saved in ./whisper-medium-el/checkpoint-4000/tokenizer_config.json\n",
2442
- "Special tokens file saved in ./whisper-medium-el/checkpoint-4000/special_tokens_map.json\n",
2443
- "added tokens file saved in ./whisper-medium-el/checkpoint-4000/added_tokens.json\n",
2444
- "Feature extractor saved in ./whisper-medium-el/preprocessor_config.json\n",
2445
- "tokenizer config file saved in ./whisper-medium-el/tokenizer_config.json\n",
2446
- "Special tokens file saved in ./whisper-medium-el/special_tokens_map.json\n",
2447
- "added tokens file saved in ./whisper-medium-el/added_tokens.json\n"
2448
- ]
2449
  }
2450
  ],
2451
  "source": [
 
125
  "Requirement already satisfied: torch in ./.local/lib/python3.8/site-packages (1.13.0)\n",
126
  "Requirement already satisfied: torchaudio in ./.local/lib/python3.8/site-packages (0.13.0)\n",
127
  "Requirement already satisfied: torchvision in ./.local/lib/python3.8/site-packages (0.14.0)\n",
128
+ "Requirement already satisfied: nvidia-cuda-runtime-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
129
+ "Requirement already satisfied: nvidia-cudnn-cu11==8.5.0.96 in ./.local/lib/python3.8/site-packages (from torch) (8.5.0.96)\n",
130
  "Requirement already satisfied: nvidia-cublas-cu11==11.10.3.66 in ./.local/lib/python3.8/site-packages (from torch) (11.10.3.66)\n",
 
131
  "Requirement already satisfied: typing-extensions in ./.local/lib/python3.8/site-packages (from torch) (4.4.0)\n",
132
+ "Requirement already satisfied: nvidia-cuda-nvrtc-cu11==11.7.99 in ./.local/lib/python3.8/site-packages (from torch) (11.7.99)\n",
 
 
133
  "Requirement already satisfied: wheel in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (0.34.2)\n",
134
+ "Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from nvidia-cublas-cu11==11.10.3.66->torch) (45.2.0)\n",
135
  "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /usr/lib/python3/dist-packages (from torchvision) (7.0.0)\n",
136
+ "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from torchvision) (2.28.1)\n",
137
  "Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from torchvision) (1.23.5)\n",
 
138
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->torchvision) (2019.11.28)\n",
139
+ "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (2.1.1)\n",
140
+ "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->torchvision) (1.26.13)\n",
141
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->torchvision) (2.8)\n"
142
  ]
143
  }
144
  ],
 
200
  "name": "stdout",
201
  "output_type": "stream",
202
  "text": [
203
+ "Tue Dec 13 21:26:01 2022 \n",
204
  "+-----------------------------------------------------------------------------+\n",
205
  "| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
206
  "|-------------------------------+----------------------+----------------------+\n",
 
209
  "| | | MIG M. |\n",
210
  "|===============================+======================+======================|\n",
211
  "| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
212
+ "| N/A 41C P0 50W / 400W | 0MiB / 40960MiB | 0% Default |\n",
213
  "| | | Disabled |\n",
214
  "+-------------------------------+----------------------+----------------------+\n",
215
  " \n",
 
260
  "name": "stdout",
261
  "output_type": "stream",
262
  "text": [
263
+ "Get:1 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
264
+ "Hit:2 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
265
+ "Get:3 https://packages.cloud.google.com/apt cloud-sdk InRelease [6751 B] \n",
266
+ "Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \n",
267
+ "Hit:5 https://download.docker.com/linux/ubuntu focal InRelease \n",
268
+ "Hit:6 https://packages.microsoft.com/repos/azure-cli focal InRelease \n",
269
+ "Hit:7 http://archive.ubuntu.com/ubuntu focal InRelease \n",
270
+ "Get:8 http://security.ubuntu.com/ubuntu focal-security InRelease [114 kB] \n",
271
  "Ign:9 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \n",
272
+ "Get:10 http://archive.ubuntu.com/ubuntu focal-updates InRelease [114 kB] \n",
273
  "Hit:11 https://pkg.cloudflare.com/cloudflared focal InRelease \n",
274
+ "Err:12 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release \n",
 
275
  " 404 Not Found [IP: 185.125.190.52 80]\n",
276
+ "Hit:13 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease \n",
277
+ "Get:14 http://archive.ubuntu.com/ubuntu focal-backports InRelease [108 kB] \n",
278
+ "Get:15 http://archive.ubuntu.com/ubuntu focal-updates/main amd64 Packages [2269 kB]\n",
279
+ "Get:16 http://archive.ubuntu.com/ubuntu focal-updates/universe amd64 Packages [1009 kB]\n",
280
+ "Reading package lists... Done \n",
281
  "E: The repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\n",
282
  "N: Updating from such a repository can't be done securely, and is therefore disabled by default.\n",
283
  "N: See apt-secure(8) manpage for repository creation and user configuration details.\n",
284
+ "Get:1 https://nvidia.github.io/libnvidia-container/stable/ubuntu18.04/amd64 InRelease [1484 B]\n",
285
+ "Hit:2 https://nvidia.github.io/nvidia-container-runtime/stable/ubuntu18.04/amd64 InRelease\n",
286
+ "Hit:3 https://packages.cloud.google.com/apt cloud-sdk InRelease \u001b[0m\u001b[33m\n",
287
  "Hit:4 http://archive.lambdalabs.com/ubuntu focal InRelease \u001b[0m\n",
288
+ "Hit:5 https://download.docker.com/linux/ubuntu focal InRelease \u001b[0m\n",
289
+ "Ign:6 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal InRelease \u001b[0m\u001b[33m\u001b[33m\u001b[33m\n",
290
+ "Hit:7 http://archive.ubuntu.com/ubuntu focal InRelease \u001b[0m\n",
291
+ "Hit:8 https://packages.microsoft.com/repos/azure-cli focal InRelease \u001b[0m\n",
292
+ "Hit:9 http://security.ubuntu.com/ubuntu focal-security InRelease \u001b[0m\n",
293
+ "Hit:10 https://pkg.cloudflare.com/cloudflared focal InRelease \u001b[0m\u001b[33m\u001b[33m\n",
294
+ "Hit:11 http://archive.ubuntu.com/ubuntu focal-updates InRelease \u001b[0m\n",
295
+ "Hit:12 http://archive.ubuntu.com/ubuntu focal-backports InRelease \u001b[0m \u001b[0m\u001b[33m\u001b[33m\u001b[33m\n",
296
+ "Err:13 http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release\n",
297
  " 404 Not Found [IP: 185.125.190.52 80]\n",
298
+ "Hit:14 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu focal InRelease\n",
299
+ "Reading package lists... Done\u001b[33m\u001b[33m\n",
 
300
  "\u001b[1;31mE: \u001b[0mThe repository 'http://ppa.launchpad.net/jonathonf/ffmpeg-4/ubuntu focal Release' does not have a Release file.\u001b[0m\n",
301
  "\u001b[33mN: \u001b[0mUpdating from such a repository can't be done securely, and is therefore disabled by default.\u001b[0m\n",
302
  "\u001b[33mN: \u001b[0mSee apt-secure(8) manpage for repository creation and user configuration details.\u001b[0m\n",
 
347
  "text": [
348
  "Defaulting to user installation because normal site-packages is not writeable\n",
349
  "Collecting git+https://github.com/huggingface/datasets\n",
350
+ " Cloning https://github.com/huggingface/datasets to /tmp/pip-req-build-ju8bkpld\n",
351
+ " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/datasets /tmp/pip-req-build-ju8bkpld\n",
352
  " Resolved https://github.com/huggingface/datasets to commit c902456677116a081f762fa2b4aad13a0aa04d6e\n",
353
  " Installing build dependencies ... \u001b[?25ldone\n",
354
  "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
355
  "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
356
  "\u001b[?25hRequirement already satisfied: dill<0.3.7 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.3.6)\n",
357
+ "Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2.28.1)\n",
358
+ "Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.23.5)\n",
359
+ "Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.8.3)\n",
360
  "Requirement already satisfied: packaging in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (22.0)\n",
361
  "Requirement already satisfied: xxhash in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (3.1.0)\n",
362
+ "Requirement already satisfied: pyarrow>=6.0.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (10.0.1)\n",
 
 
 
 
363
  "Requirement already satisfied: responses<0.19 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.18.0)\n",
364
+ "Requirement already satisfied: multiprocess in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.70.14)\n",
365
+ "Requirement already satisfied: fsspec[http]>=2021.11.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (2022.11.0)\n",
366
+ "Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (1.5.1)\n",
367
  "Requirement already satisfied: tqdm>=4.62.1 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (4.64.1)\n",
368
+ "Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from datasets==2.7.1.dev0) (5.3.1)\n",
 
369
  "Requirement already satisfied: huggingface-hub<1.0.0,>=0.2.0 in ./.local/lib/python3.8/site-packages (from datasets==2.7.1.dev0) (0.11.1)\n",
 
 
 
 
 
370
  "Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.8.2)\n",
371
+ "Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.1)\n",
372
+ "Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (6.0.3)\n",
373
  "Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->datasets==2.7.1.dev0) (19.3.0)\n",
374
+ "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (4.0.2)\n",
375
+ "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (2.1.1)\n",
376
+ "Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->datasets==2.7.1.dev0) (1.3.3)\n",
377
  "Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (3.0.12)\n",
378
  "Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.2.0->datasets==2.7.1.dev0) (4.4.0)\n",
379
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->datasets==2.7.1.dev0) (2019.11.28)\n",
 
384
  "Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.8.1->pandas->datasets==2.7.1.dev0) (1.14.0)\n",
385
  "Defaulting to user installation because normal site-packages is not writeable\n",
386
  "Collecting git+https://github.com/huggingface/transformers\n",
387
+ " Cloning https://github.com/huggingface/transformers to /tmp/pip-req-build-9scgt3ru\n",
388
+ " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers /tmp/pip-req-build-9scgt3ru\n",
389
+ " Resolved https://github.com/huggingface/transformers to commit d994473b05a83ea398d9f10ca458855df095e22d\n",
390
  " Installing build dependencies ... \u001b[?25ldone\n",
391
  "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n",
392
  "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n",
393
+ "\u001b[?25hRequirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.13.2)\n",
394
+ "Requirement already satisfied: huggingface-hub<1.0,>=0.10.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (0.11.1)\n",
395
+ "Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (22.0)\n",
396
  "Requirement already satisfied: numpy>=1.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (1.23.5)\n",
397
+ "Requirement already satisfied: filelock in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (3.0.12)\n",
398
  "Requirement already satisfied: pyyaml>=5.1 in /usr/lib/python3/dist-packages (from transformers==4.26.0.dev0) (5.3.1)\n",
399
  "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2.28.1)\n",
400
+ "Requirement already satisfied: regex!=2019.12.17 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (2022.10.31)\n",
401
  "Requirement already satisfied: tqdm>=4.27 in ./.local/lib/python3.8/site-packages (from transformers==4.26.0.dev0) (4.64.1)\n",
 
402
  "Requirement already satisfied: typing-extensions>=3.7.4.3 in ./.local/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.10.0->transformers==4.26.0.dev0) (4.4.0)\n",
 
 
 
403
  "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (2.1.1)\n",
404
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2.8)\n",
405
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests->transformers==4.26.0.dev0) (2019.11.28)\n",
406
+ "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->transformers==4.26.0.dev0) (1.26.13)\n",
407
  "Defaulting to user installation because normal site-packages is not writeable\n",
408
  "Requirement already satisfied: librosa in ./.local/lib/python3.8/site-packages (0.9.2)\n",
409
+ "Requirement already satisfied: scikit-learn>=0.19.1 in /usr/lib/python3/dist-packages (from librosa) (0.22.2.post1)\n",
410
  "Requirement already satisfied: joblib>=0.14 in ./.local/lib/python3.8/site-packages (from librosa) (1.2.0)\n",
411
+ "Requirement already satisfied: soundfile>=0.10.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.11.0)\n",
412
+ "Requirement already satisfied: numpy>=1.17.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.23.5)\n",
413
+ "Requirement already satisfied: pooch>=1.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.6.0)\n",
414
  "Requirement already satisfied: decorator>=4.0.10 in /usr/lib/python3/dist-packages (from librosa) (4.4.2)\n",
 
 
415
  "Requirement already satisfied: audioread>=2.1.9 in ./.local/lib/python3.8/site-packages (from librosa) (3.0.0)\n",
416
+ "Requirement already satisfied: numba>=0.45.1 in ./.local/lib/python3.8/site-packages (from librosa) (0.56.4)\n",
417
+ "Requirement already satisfied: scipy>=1.2.0 in ./.local/lib/python3.8/site-packages (from librosa) (1.9.3)\n",
418
  "Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from librosa) (22.0)\n",
 
 
419
  "Requirement already satisfied: resampy>=0.2.2 in ./.local/lib/python3.8/site-packages (from librosa) (0.4.2)\n",
 
420
  "Requirement already satisfied: setuptools in /usr/lib/python3/dist-packages (from numba>=0.45.1->librosa) (45.2.0)\n",
 
421
  "Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (0.39.1)\n",
422
+ "Requirement already satisfied: importlib-metadata in ./.local/lib/python3.8/site-packages (from numba>=0.45.1->librosa) (5.0.0)\n",
423
  "Requirement already satisfied: requests>=2.19.0 in ./.local/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.28.1)\n",
424
+ "Requirement already satisfied: appdirs>=1.3.0 in /usr/lib/python3/dist-packages (from pooch>=1.0->librosa) (1.4.3)\n",
425
  "Requirement already satisfied: cffi>=1.0 in /usr/lib/python3/dist-packages (from soundfile>=0.10.2->librosa) (1.14.0)\n",
 
426
  "Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2019.11.28)\n",
 
427
  "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.8)\n",
428
+ "Requirement already satisfied: charset-normalizer<3,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.1.1)\n",
429
+ "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.26.13)\n",
430
  "Requirement already satisfied: zipp>=0.5 in /usr/lib/python3/dist-packages (from importlib-metadata->numba>=0.45.1->librosa) (1.0.0)\n",
431
  "Defaulting to user installation because normal site-packages is not writeable\n",
432
  "Requirement already satisfied: jiwer in ./.local/lib/python3.8/site-packages (2.5.1)\n",
 
434
  "Requirement already satisfied: rapidfuzz<3.0.0,>=2.3.0 in ./.local/lib/python3.8/site-packages (from levenshtein==0.20.2->jiwer) (2.13.6)\n",
435
  "Defaulting to user installation because normal site-packages is not writeable\n",
436
  "Requirement already satisfied: gradio in ./.local/lib/python3.8/site-packages (3.13.0)\n",
437
+ "Requirement already satisfied: pyyaml in /usr/lib/python3/dist-packages (from gradio) (5.3.1)\n",
 
 
 
 
438
  "Requirement already satisfied: aiohttp in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
 
 
 
439
  "Requirement already satisfied: pandas in ./.local/lib/python3.8/site-packages (from gradio) (1.5.1)\n",
 
 
 
 
 
 
440
  "Requirement already satisfied: pydub in ./.local/lib/python3.8/site-packages (from gradio) (0.25.1)\n",
441
+ "Requirement already satisfied: websockets>=10.0 in ./.local/lib/python3.8/site-packages (from gradio) (10.4)\n",
442
+ "Requirement already satisfied: httpx in ./.local/lib/python3.8/site-packages (from gradio) (0.23.1)\n",
443
+ "Requirement already satisfied: pillow in /usr/lib/python3/dist-packages (from gradio) (7.0.0)\n",
444
+ "Requirement already satisfied: uvicorn in ./.local/lib/python3.8/site-packages (from gradio) (0.20.0)\n",
445
+ "Requirement already satisfied: paramiko in ./.local/lib/python3.8/site-packages (from gradio) (2.12.0)\n",
446
+ "Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from gradio) (1.23.5)\n",
447
  "Requirement already satisfied: h11<0.13,>=0.11 in ./.local/lib/python3.8/site-packages (from gradio) (0.12.0)\n",
 
448
  "Requirement already satisfied: requests in ./.local/lib/python3.8/site-packages (from gradio) (2.28.1)\n",
449
+ "Requirement already satisfied: fsspec in ./.local/lib/python3.8/site-packages (from gradio) (2022.11.0)\n",
450
+ "Requirement already satisfied: orjson in ./.local/lib/python3.8/site-packages (from gradio) (3.8.3)\n",
451
+ "Requirement already satisfied: python-multipart in ./.local/lib/python3.8/site-packages (from gradio) (0.0.5)\n",
452
+ "Requirement already satisfied: pydantic in ./.local/lib/python3.8/site-packages (from gradio) (1.10.2)\n",
453
+ "Requirement already satisfied: markdown-it-py[linkify,plugins] in ./.local/lib/python3.8/site-packages (from gradio) (2.1.0)\n",
454
+ "Requirement already satisfied: ffmpy in ./.local/lib/python3.8/site-packages (from gradio) (0.3.0)\n",
455
+ "Requirement already satisfied: fastapi in ./.local/lib/python3.8/site-packages (from gradio) (0.88.0)\n",
456
+ "Requirement already satisfied: jinja2 in ./.local/lib/python3.8/site-packages (from gradio) (3.1.2)\n",
457
+ "Requirement already satisfied: matplotlib in ./.local/lib/python3.8/site-packages (from gradio) (3.5.3)\n",
458
  "Requirement already satisfied: pycryptodome in ./.local/lib/python3.8/site-packages (from gradio) (3.16.0)\n",
459
+ "Requirement already satisfied: aiosignal>=1.1.2 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.1)\n",
460
+ "Requirement already satisfied: multidict<7.0,>=4.5 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (6.0.3)\n",
 
461
  "Requirement already satisfied: frozenlist>=1.1.1 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.3.3)\n",
462
  "Requirement already satisfied: attrs>=17.3.0 in /usr/lib/python3/dist-packages (from aiohttp->gradio) (19.3.0)\n",
463
+ "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (4.0.2)\n",
464
+ "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (2.1.1)\n",
465
  "Requirement already satisfied: yarl<2.0,>=1.0 in ./.local/lib/python3.8/site-packages (from aiohttp->gradio) (1.8.2)\n",
 
466
  "Requirement already satisfied: starlette==0.22.0 in ./.local/lib/python3.8/site-packages (from fastapi->gradio) (0.22.0)\n",
467
  "Requirement already satisfied: typing-extensions>=3.10.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (4.4.0)\n",
468
  "Requirement already satisfied: anyio<5,>=3.4.0 in ./.local/lib/python3.8/site-packages (from starlette==0.22.0->fastapi->gradio) (3.6.2)\n",
 
 
469
  "Requirement already satisfied: rfc3986[idna2008]<2,>=1.3 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.5.0)\n",
470
  "Requirement already satisfied: sniffio in ./.local/lib/python3.8/site-packages (from httpx->gradio) (1.3.0)\n",
471
+ "Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from httpx->gradio) (2019.11.28)\n",
472
+ "Requirement already satisfied: httpcore<0.17.0,>=0.15.0 in ./.local/lib/python3.8/site-packages (from httpx->gradio) (0.15.0)\n",
473
  "Requirement already satisfied: MarkupSafe>=2.0 in ./.local/lib/python3.8/site-packages (from jinja2->gradio) (2.1.1)\n",
474
  "Requirement already satisfied: mdurl~=0.1 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.1.2)\n",
 
475
  "Requirement already satisfied: linkify-it-py~=1.0 in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (1.0.3)\n",
476
+ "Requirement already satisfied: mdit-py-plugins in ./.local/lib/python3.8/site-packages (from markdown-it-py[linkify,plugins]->gradio) (0.3.3)\n",
477
+ "Requirement already satisfied: python-dateutil>=2.7 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (2.8.2)\n",
478
  "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (1.0.1)\n",
 
479
  "Requirement already satisfied: packaging>=20.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (22.0)\n",
 
480
  "Requirement already satisfied: cycler>=0.10 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (0.10.0)\n",
481
+ "Requirement already satisfied: pyparsing>=2.2.1 in /usr/lib/python3/dist-packages (from matplotlib->gradio) (2.4.6)\n",
482
+ "Requirement already satisfied: fonttools>=4.22.0 in ./.local/lib/python3.8/site-packages (from matplotlib->gradio) (4.38.0)\n",
483
  "Requirement already satisfied: pytz>=2020.1 in ./.local/lib/python3.8/site-packages (from pandas->gradio) (2022.5)\n",
484
+ "Requirement already satisfied: bcrypt>=3.1.3 in ./.local/lib/python3.8/site-packages (from paramiko->gradio) (4.0.1)\n",
485
  "Requirement already satisfied: six in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.14.0)\n",
486
  "Requirement already satisfied: pynacl>=1.0.1 in /usr/lib/python3/dist-packages (from paramiko->gradio) (1.3.0)\n",
 
487
  "Requirement already satisfied: cryptography>=2.5 in /usr/lib/python3/dist-packages (from paramiko->gradio) (2.8)\n",
 
488
  "Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./.local/lib/python3.8/site-packages (from requests->gradio) (1.26.13)\n",
489
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests->gradio) (2.8)\n",
490
  "Requirement already satisfied: click>=7.0 in /usr/lib/python3/dist-packages (from uvicorn->gradio) (7.0)\n",
491
  "Requirement already satisfied: uc-micro-py in ./.local/lib/python3.8/site-packages (from linkify-it-py~=1.0->markdown-it-py[linkify,plugins]->gradio) (1.0.1)\n",
492
  "Defaulting to user installation because normal site-packages is not writeable\n",
 
555
  {
556
  "data": {
557
  "application/vnd.jupyter.widget-view+json": {
558
+ "model_id": "ad867c59abb44253a78ca06b8853a84d",
559
  "version_major": 2,
560
  "version_minor": 0
561
  },
 
714
  " all_datasets = []\n",
715
  " # iterate over the datasets we want to interleave\n",
716
  " for i, dataset_name in enumerate(dataset_names):\n",
717
+ " dataset = load_dataset(dataset_name, dataset_config_names[i], split=splits[i], streaming=False, **kwargs)\n",
718
  " # resample to specified sampling rate\n",
719
  " dataset = dataset.cast_column(\"audio\", Audio(sampling_rate))\n",
720
  " # normalise columns to [\"audio\", \"sentence\"]\n",
 
739
  "id": "qOwlctMhNmCG",
740
  "tags": []
741
  },
742
+ "outputs": [],
 
 
 
 
 
 
 
 
 
743
  "source": [
744
  "ds = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
745
  "\n"
 
762
  "metadata": {
763
  "id": "imRHJOpm4V_j"
764
  },
765
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
766
  "source": [
767
  "from datasets import IterableDatasetDict\n",
768
  "raw_datasets = IterableDatasetDict()\n",
769
  "\n",
770
  "raw_datasets[\"train\"] = load_multiple_streaming_datasets(dataset_names, dataset_config_names=dataset_config_names, text_column_names=text_column_names, use_auth_token=True)\n",
771
+ "raw_datasets[\"test\"] = load_dataset(\"mozilla-foundation/common_voice_11_0\", \"el\", split=\"test\", streaming=False, use_auth_token=True)\n",
772
  "\n",
773
  "\n",
774
  "#raw_datasets = raw_datasets.remove_columns([\"accent\", \"age\", \"client_id\", \"down_votes\", \"gender\", \"locale\", \"path\", \"segment\", \"up_votes\"])\n",
 
995
  "metadata": {
996
  "id": "a37a7cdb-9013-427f-8de9-6a8d0e9dc684"
997
  },
998
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
999
  "source": [
1000
  "vectorized_datasets = raw_datasets.map(prepare_dataset, remove_columns=list(next(iter(raw_datasets.values())).features)).with_format(\"torch\")"
1001
  ]
 
1012
  },
1013
  {
1014
  "cell_type": "code",
1015
+ "execution_count": 17,
1016
  "id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c",
1017
  "metadata": {
1018
  "id": "1b145699-acfc-4b1d-93a2-a2ad3d62674c"
1019
  },
1020
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1021
  "source": [
1022
  "vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].shuffle(\n",
1023
  " #buffer_size=500,\n",
 
1040
  },
1041
  {
1042
  "cell_type": "code",
1043
+ "execution_count": 18,
1044
  "id": "01cb25ef-4bb0-4325-9461-f59198acadf6",
1045
  "metadata": {
1046
  "id": "01cb25ef-4bb0-4325-9461-f59198acadf6"
 
1065
  },
1066
  {
1067
  "cell_type": "code",
1068
+ "execution_count": 19,
1069
  "id": "333f7f6e-6053-4d3b-8924-c733c79b82ac",
1070
  "metadata": {
1071
  "id": "333f7f6e-6053-4d3b-8924-c733c79b82ac"
1072
  },
1073
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1074
  "source": [
1075
  "vectorized_datasets[\"train\"] = vectorized_datasets[\"train\"].filter(\n",
1076
  " is_audio_in_length_range,\n",
 
1145
  },
1146
  {
1147
  "cell_type": "code",
1148
+ "execution_count": 20,
1149
  "id": "8326221e-ec13-4731-bb4e-51e5fc1486c5",
1150
  "metadata": {
1151
  "id": "8326221e-ec13-4731-bb4e-51e5fc1486c5"
 
1197
  },
1198
  {
1199
  "cell_type": "code",
1200
+ "execution_count": 21,
1201
  "id": "fc834702-c0d3-4a96-b101-7b87be32bf42",
1202
  "metadata": {
1203
  "id": "fc834702-c0d3-4a96-b101-7b87be32bf42"
 
1230
  },
1231
  {
1232
  "cell_type": "code",
1233
+ "execution_count": 22,
1234
  "id": "b22b4011-f31f-4b57-b684-c52332f92890",
1235
  "metadata": {
1236
  "colab": {
 
1281
  },
1282
  {
1283
  "cell_type": "code",
1284
+ "execution_count": 23,
1285
  "id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb",
1286
  "metadata": {
1287
  "id": "a11d1bfc-9e28-460f-a287-72d8f7bc1acb"
 
1330
  },
1331
  {
1332
  "cell_type": "code",
1333
+ "execution_count": 24,
1334
  "id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
1335
  "metadata": {
1336
  "colab": {
 
1368
  {
1369
  "data": {
1370
  "application/vnd.jupyter.widget-view+json": {
1371
+ "model_id": "18e0d00451ec4e10b1cea9b9d3748384",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1372
  "version_major": 2,
1373
  "version_minor": 0
1374
  },
 
1401
  },
1402
  {
1403
  "cell_type": "code",
1404
+ "execution_count": 25,
1405
  "id": "62038ba3-88ed-4fce-84db-338f50dcd04f",
1406
  "metadata": {
1407
  "id": "62038ba3-88ed-4fce-84db-338f50dcd04f"
 
1438
  },
1439
  {
1440
  "cell_type": "code",
1441
+ "execution_count": 26,
1442
  "id": "0ae3e9af-97b7-4aa0-ae85-20b23b5bcb3a",
1443
  "metadata": {
1444
  "colab": {
 
1481
  },
1482
  {
1483
  "cell_type": "code",
1484
+ "execution_count": 27,
1485
  "id": "o72eOpGzD_sK",
1486
  "metadata": {
1487
  "colab": {
 
1495
  "name": "stdout",
1496
  "output_type": "stream",
1497
  "text": [
1498
+ "Tue Dec 13 21:29:08 2022 \n",
1499
  "+-----------------------------------------------------------------------------+\n",
1500
  "| NVIDIA-SMI 515.65.01 Driver Version: 515.65.01 CUDA Version: 11.7 |\n",
1501
  "|-------------------------------+----------------------+----------------------+\n",
 
1504
  "| | | MIG M. |\n",
1505
  "|===============================+======================+======================|\n",
1506
  "| 0 NVIDIA A100-SXM... On | 00000000:06:00.0 Off | 0 |\n",
1507
+ "| N/A 32C P0 47W / 400W | 2MiB / 40960MiB | 0% Default |\n",
1508
  "| | | Disabled |\n",
1509
  "+-------------------------------+----------------------+----------------------+\n",
1510
  " \n",
 
1545
  },
1546
  {
1547
  "cell_type": "code",
1548
+ "execution_count": 28,
1549
  "id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2",
1550
  "metadata": {
1551
  "id": "3ac16b62-b3c0-4c68-8f3d-9ecf471534b2"
 
1578
  },
1579
  {
1580
  "cell_type": "code",
1581
+ "execution_count": 29,
1582
  "id": "d546d7fe-0543-479a-b708-2ebabec19493",
1583
  "metadata": {
1584
  "colab": {
 
2192
  },
2193
  {
2194
  "cell_type": "code",
2195
+ "execution_count": 30,
2196
  "id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672",
2197
  "metadata": {
2198
  "id": "a1ccb9ed-cbc8-4419-91c0-651e9424b672"
 
2285
  "name": "stderr",
2286
  "output_type": "stream",
2287
  "text": [
2288
+ "Loading model from ./whisper-medium-el/checkpoint-4000.\n",
 
2289
  "/home/ubuntu/.local/lib/python3.8/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
2290
  " warnings.warn(\n",
2291
  "***** Running training *****\n",
2292
+ " Num examples = 160000\n",
2293
+ " Num Epochs = 9223372036854775807\n",
2294
  " Instantaneous batch size per device = 32\n",
2295
  " Total train batch size (w. parallel, distributed & accumulation) = 32\n",
2296
  " Gradient Accumulation steps = 1\n",
2297
  " Total optimization steps = 5000\n",
2298
  " Number of trainable parameters = 763857920\n",
2299
  " Continuing training from checkpoint, will skip to saved global_step\n",
2300
+ " Continuing training from epoch 0\n",
2301
+ " Continuing training from global step 4000\n",
2302
+ "Reading metadata...: 1914it [00:00, 4074.06it/s]\n",
2303
+ "The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
2304
  ]
2305
  },
2306
  {
 
2309
  "\n",
2310
  " <div>\n",
2311
  " \n",
2312
+ " <progress value='4012' max='5000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
2313
+ " [4012/5000 01:11 < 1:57:29, 0.14 it/s, Epoch 0.00/9223372036854775807]\n",
2314
  " </div>\n",
2315
  " <table border=\"1\" class=\"dataframe\">\n",
2316
  " <thead>\n",
 
2318
  " <th>Step</th>\n",
2319
  " <th>Training Loss</th>\n",
2320
  " <th>Validation Loss</th>\n",
 
2321
  " </tr>\n",
2322
  " </thead>\n",
2323
  " <tbody>\n",
 
 
 
 
 
 
2324
  " </tbody>\n",
2325
  "</table><p>"
2326
  ],
 
2330
  },
2331
  "metadata": {},
2332
  "output_type": "display_data"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2333
  }
2334
  ],
2335
  "source": [
e5_interleaving-resume.ipynb ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb25d05dcb2d400df9f2d8b8019e39d601abd96db1d8851edcb5dea2546d6882
3
  size 3055754841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f7fdd05661053c2949f2de6138c02cb1fe501fbe43efcf806797c3e43cbf808
3
  size 3055754841
runs/Dec13_21-29-08_129-146-102-49/1670966960.518305/events.out.tfevents.1670966960.129-146-102-49.882304.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:652c159c0a7bbc04d6c208c74e4668602cb677b0fc2d296735cd23cd3d391b2b
3
+ size 5916
runs/Dec13_21-29-08_129-146-102-49/events.out.tfevents.1670966960.129-146-102-49.882304.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c6d5d76a7999c988e99742cae5b57c5aa438dc6403c604611d0c8fd18754328
3
+ size 5603
runs/Dec13_21-57-38_129-146-102-49/1670968669.9597044/events.out.tfevents.1670968669.129-146-102-49.882304.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8668bd5e2470303db22eb81688526a881371c3506fdfeed7a6b32abc5192a1e
3
+ size 5916
runs/Dec13_21-57-38_129-146-102-49/events.out.tfevents.1670968669.129-146-102-49.882304.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37a61ed2fa7d6d2ac64d6e063e35f8b5541406347236af61ace7e3f08422daea
3
+ size 4348
runs/Dec13_22-18-00_129-146-102-49/1670969892.775061/events.out.tfevents.1670969892.129-146-102-49.1014402.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51450fedd70a8ed8e04dbdda335b86fff15a62346527cf67bef861a20bf39cde
3
+ size 5916
runs/Dec13_22-18-00_129-146-102-49/1670995449.379962/events.out.tfevents.1670995449.129-146-102-49.1014402.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9ad24d679255e97efd512a0e6ec44b3d1b3f9d6b9fd69a929d4f4b65635093f
3
+ size 5916
runs/Dec13_22-18-00_129-146-102-49/events.out.tfevents.1670969892.129-146-102-49.1014402.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af928d9b3e795892da6df5ac604d6bb4c9799d8fbae2048212044a62e879c0fc
3
+ size 15254
runs/Dec14_05-46-08_129-146-102-49/1670996781.2697837/events.out.tfevents.1670996781.129-146-102-49.1113148.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b3e632cba6fe6e654853b87efedea97668491d8e6906fb42ebf1c6b1f013cc
3
+ size 5916
runs/Dec14_05-46-08_129-146-102-49/events.out.tfevents.1670996781.129-146-102-49.1113148.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:243ca82c57c99466d5246efd3eb4dd017e04c059b7b31d2befe0ea6f22a39214
3
+ size 10946
runs/Dec14_09-33-49_129-146-102-49/1671010439.939292/events.out.tfevents.1671010439.129-146-102-49.1212260.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3fea8291dc179c7503abc25f7377b71002351df3b2639e4e6228b997b64d90
3
+ size 5916
runs/Dec14_09-33-49_129-146-102-49/events.out.tfevents.1671010439.129-146-102-49.1212260.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ccb9309b9bb866e6e16f7627e4a4b88a932cd62d0f847514e94d0e2208d3716
3
+ size 4347
runs/Dec14_10-24-09_129-146-102-49/1671013461.8981154/events.out.tfevents.1671013461.129-146-102-49.1508853.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af188c00a280a385bf7ede8ce3aea5fdf554d81e0aa7cab21884c04bcf42eb5e
3
+ size 5916
runs/Dec14_10-24-09_129-146-102-49/events.out.tfevents.1671013461.129-146-102-49.1508853.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b10f8350f1923948412c9c14188fa5cb649b2bf9081f63941e3fcf5ba378701a
3
+ size 10945
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6bd23b820fb512afe9dc750c92419a54a859d6f1861d7b20b0b9f155340657b
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeadae68908ede5e3241ff2195c01ad92b5ee3a7db47d3a44b664270809ad8db
3
  size 3643