diff --git "a/Untitled.ipynb" "b/Untitled.ipynb" --- "a/Untitled.ipynb" +++ "b/Untitled.ipynb" @@ -3,7 +3,7 @@ { "cell_type": "code", "execution_count": 1, - "id": "3ae82d97", + "id": "719bec25", "metadata": { "collapsed": true, "jupyter": { @@ -17,6 +17,8 @@ "text": [ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", @@ -26,6 +28,8 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", @@ -39,39 +43,9 @@ "name": "stdout", "output_type": "stream", "text": [ - "Collecting datasets==1.13.3\n", - " Using cached datasets-1.13.3-py3-none-any.whl (287 kB)\n", - "Requirement already satisfied: numpy>=1.17 in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (1.19.2)\n", - "Requirement already satisfied: multiprocess in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (0.70.12.2)\n", - "Requirement already satisfied: xxhash in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (2.0.2)\n", - "Requirement already satisfied: pandas in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (1.4.0)\n", - "Requirement already satisfied: fsspec[http]>=2021.05.0 in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (2022.1.0)\n", - "Requirement already satisfied: tqdm>=4.62.1 in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (4.62.3)\n", - "Requirement already satisfied: pyarrow!=4.0.0,>=1.0.0 in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (6.0.1)\n", - "Requirement already satisfied: dill in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (0.3.4)\n", - "Collecting huggingface-hub<0.1.0,>=0.0.19\n", - " Using cached huggingface_hub-0.0.19-py3-none-any.whl (56 kB)\n", - "Requirement already satisfied: aiohttp in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (3.8.1)\n", - "Requirement already satisfied: requests>=2.19.0 in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (2.24.0)\n", - "Requirement already satisfied: packaging in /opt/conda/lib/python3.8/site-packages (from datasets==1.13.3) (21.3)\n", - "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<0.1.0,>=0.0.19->datasets==1.13.3) (3.0.12)\n", - "Requirement already satisfied: typing-extensions in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<0.1.0,>=0.0.19->datasets==1.13.3) (4.0.1)\n", - "Requirement already satisfied: pyyaml in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<0.1.0,>=0.0.19->datasets==1.13.3) (5.4.1)\n", - "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging->datasets==1.13.3) (3.0.7)\n", - "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets==1.13.3) (3.0.4)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets==1.13.3) (1.25.11)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets==1.13.3) (2020.12.5)\n", - "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets==1.13.3) (2.10)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (4.0.2)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (1.3.0)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (1.2.0)\n", - "Requirement already satisfied: attrs>=17.3.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (21.4.0)\n", - "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (2.0.10)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (6.0.2)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets==1.13.3) (1.7.2)\n", - "Requirement already satisfied: python-dateutil>=2.8.1 in /opt/conda/lib/python3.8/site-packages (from pandas->datasets==1.13.3) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /opt/conda/lib/python3.8/site-packages (from pandas->datasets==1.13.3) (2021.1)\n", - "Requirement already satisfied: six>=1.5 in /opt/conda/lib/python3.8/site-packages (from python-dateutil>=2.8.1->pandas->datasets==1.13.3) (1.15.0)\n" + "Requirement already satisfied: torchaudio in /opt/conda/lib/python3.8/site-packages (0.10.2)\n", + "Requirement already satisfied: torch==1.10.2 in /opt/conda/lib/python3.8/site-packages (from torchaudio) (1.10.2)\n", + "Requirement already satisfied: typing-extensions in /opt/conda/lib/python3.8/site-packages (from torch==1.10.2->torchaudio) (4.0.1)\n" ] }, { @@ -80,55 +54,19 @@ "text": [ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Installing collected packages: huggingface-hub, datasets\n", - " Attempting uninstall: huggingface-hub\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " Found existing installation: huggingface-hub 0.4.0\n", - " Uninstalling huggingface-hub-0.4.0:\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "ERROR: Could not install packages due to an OSError: [Errno 13] Permission denied: 'INSTALLER'\n", - "Consider using the `--user` option or check the permissions.\n", - "\n", + "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", @@ -138,6 +76,8 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", @@ -147,6 +87,8 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", @@ -158,6 +100,7 @@ "You should consider upgrading via the '/opt/conda/bin/python -m pip install --upgrade pip' command.\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -168,6 +111,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -182,28 +126,31 @@ "name": "stdout", "output_type": "stream", "text": [ - "Collecting transformers==4.11.3\n", - " Using cached transformers-4.11.3-py3-none-any.whl (2.9 MB)\n", - "Requirement already satisfied: tqdm>=4.27 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (4.62.3)\n", - "Requirement already satisfied: pyyaml>=5.1 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (5.4.1)\n", - "Requirement already satisfied: requests in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (2.24.0)\n", - "Requirement already satisfied: numpy>=1.17 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (1.19.2)\n", - "Requirement already satisfied: huggingface-hub>=0.0.17 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (0.4.0)\n", - "Collecting tokenizers<0.11,>=0.10.1\n", - " Using cached tokenizers-0.10.3-cp38-cp38-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (3.3 MB)\n", - "Requirement already satisfied: packaging>=20.0 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (21.3)\n", - "Requirement already satisfied: sacremoses in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (0.0.47)\n", - "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (3.0.12)\n", - "Requirement already satisfied: regex!=2019.12.17 in /opt/conda/lib/python3.8/site-packages (from transformers==4.11.3) (2022.1.18)\n", - "Requirement already satisfied: typing-extensions>=3.7.4.3 in /opt/conda/lib/python3.8/site-packages (from huggingface-hub>=0.0.17->transformers==4.11.3) (4.0.1)\n", - "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.0->transformers==4.11.3) (3.0.7)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests->transformers==4.11.3) (2020.12.5)\n", - "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests->transformers==4.11.3) (2.10)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests->transformers==4.11.3) (1.25.11)\n", - "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests->transformers==4.11.3) (3.0.4)\n", - "Requirement already satisfied: six in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers==4.11.3) (1.15.0)\n", - "Requirement already satisfied: click in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers==4.11.3) (8.0.3)\n", - "Requirement already satisfied: joblib in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers==4.11.3) (1.1.0)\n" + "Requirement already satisfied: librosa in /opt/conda/lib/python3.8/site-packages (0.8.1)\n", + "Requirement already satisfied: soundfile>=0.10.2 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.10.3.post1)\n", + "Requirement already satisfied: numba>=0.43.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.55.1)\n", + "Requirement already satisfied: decorator>=3.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (4.4.2)\n", + "Requirement already satisfied: numpy>=1.15.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.19.2)\n", + "Requirement already satisfied: packaging>=20.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (21.3)\n", + "Requirement already satisfied: scipy>=1.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.7.3)\n", + "Requirement already satisfied: resampy>=0.2.2 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.2.2)\n", + "Requirement already satisfied: audioread>=2.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (2.1.9)\n", + "Requirement already satisfied: pooch>=1.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.6.0)\n", + "Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.0.2)\n", + "Requirement already satisfied: joblib>=0.14 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.1.0)\n", + "Requirement already satisfied: llvmlite<0.39,>=0.38.0rc1 in /opt/conda/lib/python3.8/site-packages (from numba>=0.43.0->librosa) (0.38.0)\n", + "Requirement already satisfied: setuptools in /opt/conda/lib/python3.8/site-packages (from numba>=0.43.0->librosa) (50.3.1.post20201107)\n", + "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.0->librosa) (3.0.7)\n", + "Requirement already satisfied: appdirs>=1.3.0 in /opt/conda/lib/python3.8/site-packages (from pooch>=1.0->librosa) (1.4.4)\n", + "Requirement already satisfied: requests>=2.19.0 in /opt/conda/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.24.0)\n", + "Requirement already satisfied: six>=1.3 in /opt/conda/lib/python3.8/site-packages (from resampy>=0.2.2->librosa) (1.15.0)\n", + "Requirement already satisfied: threadpoolctl>=2.0.0 in /opt/conda/lib/python3.8/site-packages (from scikit-learn!=0.19.0,>=0.14.0->librosa) (3.0.0)\n", + "Requirement already satisfied: cffi>=1.0 in /opt/conda/lib/python3.8/site-packages (from soundfile>=0.10.2->librosa) (1.14.3)\n", + "Requirement already satisfied: pycparser in /opt/conda/lib/python3.8/site-packages (from cffi>=1.0->soundfile>=0.10.2->librosa) (2.20)\n", + "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.10)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.25.11)\n", + "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2020.12.5)\n" ] }, { @@ -212,6 +159,7 @@ "text": [ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -219,50 +167,10 @@ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Installing collected packages: tokenizers, transformers\n", - " Attempting uninstall: tokenizers\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " Found existing installation: tokenizers 0.11.4\n", - " Uninstalling tokenizers-0.11.4:\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "ERROR: Could not install packages due to an OSError: [Errno 13] Permission denied: 'INSTALLER'\n", - "Consider using the `--user` option or check the permissions.\n", - "\n", + "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -273,6 +181,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -283,6 +192,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -295,6 +205,7 @@ "You should consider upgrading via the '/opt/conda/bin/python -m pip install --upgrade pip' command.\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -305,6 +216,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -319,19 +231,9 @@ "name": "stdout", "output_type": "stream", "text": [ - "Collecting huggingface_hub==0.1\n", - " Using cached huggingface_hub-0.1.0-py3-none-any.whl (59 kB)\n", - "Requirement already satisfied: packaging>=20.9 in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (21.3)\n", - "Requirement already satisfied: pyyaml in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (5.4.1)\n", - "Requirement already satisfied: tqdm in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (4.62.3)\n", - "Requirement already satisfied: requests in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (2.24.0)\n", - "Requirement already satisfied: typing-extensions in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (4.0.1)\n", - "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from huggingface_hub==0.1) (3.0.12)\n", - "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.9->huggingface_hub==0.1) (3.0.7)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub==0.1) (1.25.11)\n", - "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub==0.1) (2.10)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub==0.1) (2020.12.5)\n", - "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub==0.1) (3.0.4)\n" + "Requirement already satisfied: jiwer in /opt/conda/lib/python3.8/site-packages (2.3.0)\n", + "Requirement already satisfied: python-Levenshtein==0.12.2 in /opt/conda/lib/python3.8/site-packages (from jiwer) (0.12.2)\n", + "Requirement already satisfied: setuptools in /opt/conda/lib/python3.8/site-packages (from python-Levenshtein==0.12.2->jiwer) (50.3.1.post20201107)\n" ] }, { @@ -340,6 +242,7 @@ "text": [ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -347,50 +250,10 @@ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Installing collected packages: huggingface-hub\n", - " Attempting uninstall: huggingface-hub\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -okenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -0ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", - " WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - " Found existing installation: huggingface-hub 0.4.0\n", - " Uninstalling huggingface-hub-0.4.0:\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "ERROR: Could not install packages due to an OSError: [Errno 13] Permission denied: 'INSTALLER'\n", - "Consider using the `--user` option or check the permissions.\n", - "\n", + "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -401,6 +264,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -411,6 +275,7 @@ "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", + "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -2ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -1ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -uggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -420,7 +285,35 @@ "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution - (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: You are using pip version 21.3.1; however, version 22.0.2 is available.\n", - "You should consider upgrading via the '/opt/conda/bin/python -m pip install --upgrade pip' command.\n", + "You should consider upgrading via the '/opt/conda/bin/python -m pip install --upgrade pip' command.\n" + ] + } + ], + "source": [ + "%%bash\n", + "# pip install datasets==1.13.3\n", + "# pip install transformers==4.11.3\n", + "# pip install huggingface_hub==0.1\n", + "pip install torchaudio\n", + "pip install librosa\n", + "pip install jiwer" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "1a85d4f9", + "metadata": { + "collapsed": true, + "jupyter": { + "outputs_hidden": true + } + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ "WARNING: Ignoring invalid distribution -kenizers (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", "WARNING: Ignoring invalid distribution -3ggingface-hub (/opt/conda/lib/python3.8/site-packages)\n", @@ -449,9 +342,37 @@ "name": "stdout", "output_type": "stream", "text": [ - "Requirement already satisfied: torchaudio in /opt/conda/lib/python3.8/site-packages (0.10.2)\n", - "Requirement already satisfied: torch==1.10.2 in /opt/conda/lib/python3.8/site-packages (from torchaudio) (1.10.2)\n", - "Requirement already satisfied: typing-extensions in /opt/conda/lib/python3.8/site-packages (from torch==1.10.2->torchaudio) (4.0.1)\n" + "Requirement already satisfied: datasets in /opt/conda/lib/python3.8/site-packages (1.18.2.dev0)\n", + "Requirement already satisfied: dill in /opt/conda/lib/python3.8/site-packages (from datasets) (0.3.4)\n", + "Requirement already satisfied: multiprocess in /opt/conda/lib/python3.8/site-packages (from datasets) (0.70.12.2)\n", + "Requirement already satisfied: huggingface-hub<1.0.0,>=0.1.0 in /opt/conda/lib/python3.8/site-packages (from datasets) (0.4.0)\n", + "Requirement already satisfied: tqdm>=4.62.1 in /opt/conda/lib/python3.8/site-packages (from datasets) (4.62.3)\n", + "Requirement already satisfied: numpy>=1.17 in /opt/conda/lib/python3.8/site-packages (from datasets) (1.19.2)\n", + "Requirement already satisfied: packaging in /opt/conda/lib/python3.8/site-packages (from datasets) (21.3)\n", + "Requirement already satisfied: pandas in /opt/conda/lib/python3.8/site-packages (from datasets) (1.4.0)\n", + "Requirement already satisfied: xxhash in /opt/conda/lib/python3.8/site-packages (from datasets) (2.0.2)\n", + "Requirement already satisfied: fsspec[http]>=2021.05.0 in /opt/conda/lib/python3.8/site-packages (from datasets) (2022.1.0)\n", + "Requirement already satisfied: aiohttp in /opt/conda/lib/python3.8/site-packages (from datasets) (3.8.1)\n", + "Requirement already satisfied: requests>=2.19.0 in /opt/conda/lib/python3.8/site-packages (from datasets) (2.24.0)\n", + "Requirement already satisfied: pyarrow!=4.0.0,>=3.0.0 in /opt/conda/lib/python3.8/site-packages (from datasets) (6.0.1)\n", + "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (3.0.12)\n", + "Requirement already satisfied: typing-extensions>=3.7.4.3 in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (4.0.1)\n", + "Requirement already satisfied: pyyaml in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (5.4.1)\n", + "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging->datasets) (3.0.7)\n", + "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets) (3.0.4)\n", + "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets) (2.10)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets) (1.25.11)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->datasets) (2020.12.5)\n", + "Requirement already satisfied: multidict<7.0,>=4.5 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (6.0.2)\n", + "Requirement already satisfied: frozenlist>=1.1.1 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (1.3.0)\n", + "Requirement already satisfied: attrs>=17.3.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (21.4.0)\n", + "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (2.0.10)\n", + "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (4.0.2)\n", + "Requirement already satisfied: aiosignal>=1.1.2 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (1.2.0)\n", + "Requirement already satisfied: yarl<2.0,>=1.0 in /opt/conda/lib/python3.8/site-packages (from aiohttp->datasets) (1.7.2)\n", + "Requirement already satisfied: pytz>=2020.1 in /opt/conda/lib/python3.8/site-packages (from pandas->datasets) (2021.1)\n", + "Requirement already satisfied: python-dateutil>=2.8.1 in /opt/conda/lib/python3.8/site-packages (from pandas->datasets) (2.8.2)\n", + "Requirement already satisfied: six>=1.5 in /opt/conda/lib/python3.8/site-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.15.0)\n" ] }, { @@ -532,31 +453,26 @@ "name": "stdout", "output_type": "stream", "text": [ - "Requirement already satisfied: librosa in /opt/conda/lib/python3.8/site-packages (0.8.1)\n", - "Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.0.2)\n", - "Requirement already satisfied: scipy>=1.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.7.3)\n", - "Requirement already satisfied: numpy>=1.15.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.19.2)\n", - "Requirement already satisfied: pooch>=1.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.6.0)\n", - "Requirement already satisfied: audioread>=2.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (2.1.9)\n", - "Requirement already satisfied: decorator>=3.0.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (4.4.2)\n", - "Requirement already satisfied: resampy>=0.2.2 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.2.2)\n", - "Requirement already satisfied: numba>=0.43.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.55.1)\n", - "Requirement already satisfied: soundfile>=0.10.2 in /opt/conda/lib/python3.8/site-packages (from librosa) (0.10.3.post1)\n", - "Requirement already satisfied: packaging>=20.0 in /opt/conda/lib/python3.8/site-packages (from librosa) (21.3)\n", - "Requirement already satisfied: joblib>=0.14 in /opt/conda/lib/python3.8/site-packages (from librosa) (1.1.0)\n", - "Requirement already satisfied: llvmlite<0.39,>=0.38.0rc1 in /opt/conda/lib/python3.8/site-packages (from numba>=0.43.0->librosa) (0.38.0)\n", - "Requirement already satisfied: setuptools in /opt/conda/lib/python3.8/site-packages (from numba>=0.43.0->librosa) (50.3.1.post20201107)\n", - "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.0->librosa) (3.0.7)\n", - "Requirement already satisfied: requests>=2.19.0 in /opt/conda/lib/python3.8/site-packages (from pooch>=1.0->librosa) (2.24.0)\n", - "Requirement already satisfied: appdirs>=1.3.0 in /opt/conda/lib/python3.8/site-packages (from pooch>=1.0->librosa) (1.4.4)\n", - "Requirement already satisfied: six>=1.3 in /opt/conda/lib/python3.8/site-packages (from resampy>=0.2.2->librosa) (1.15.0)\n", - "Requirement already satisfied: threadpoolctl>=2.0.0 in /opt/conda/lib/python3.8/site-packages (from scikit-learn!=0.19.0,>=0.14.0->librosa) (3.0.0)\n", - "Requirement already satisfied: cffi>=1.0 in /opt/conda/lib/python3.8/site-packages (from soundfile>=0.10.2->librosa) (1.14.3)\n", - "Requirement already satisfied: pycparser in /opt/conda/lib/python3.8/site-packages (from cffi>=1.0->soundfile>=0.10.2->librosa) (2.20)\n", - "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.10)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.25.11)\n", - "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.0.4)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2020.12.5)\n" + "Requirement already satisfied: transformers in /opt/conda/lib/python3.8/site-packages (4.17.0.dev0)\n", + "Requirement already satisfied: requests in /opt/conda/lib/python3.8/site-packages (from transformers) (2.24.0)\n", + "Requirement already satisfied: regex!=2019.12.17 in /opt/conda/lib/python3.8/site-packages (from transformers) (2022.1.18)\n", + "Requirement already satisfied: tqdm>=4.27 in /opt/conda/lib/python3.8/site-packages (from transformers) (4.62.3)\n", + "Requirement already satisfied: packaging>=20.0 in /opt/conda/lib/python3.8/site-packages (from transformers) (21.3)\n", + "Requirement already satisfied: pyyaml>=5.1 in /opt/conda/lib/python3.8/site-packages (from transformers) (5.4.1)\n", + "Requirement already satisfied: sacremoses in /opt/conda/lib/python3.8/site-packages (from transformers) (0.0.47)\n", + "Requirement already satisfied: huggingface-hub<1.0,>=0.1.0 in /opt/conda/lib/python3.8/site-packages (from transformers) (0.4.0)\n", + "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from transformers) (3.0.12)\n", + "Requirement already satisfied: numpy>=1.17 in /opt/conda/lib/python3.8/site-packages (from transformers) (1.19.2)\n", + "Requirement already satisfied: tokenizers!=0.11.3,>=0.10.1 in /opt/conda/lib/python3.8/site-packages (from transformers) (0.11.4)\n", + "Requirement already satisfied: typing-extensions>=3.7.4.3 in /opt/conda/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.1.0->transformers) (4.0.1)\n", + "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.0->transformers) (3.0.7)\n", + "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests->transformers) (3.0.4)\n", + "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests->transformers) (2.10)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests->transformers) (2020.12.5)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests->transformers) (1.25.11)\n", + "Requirement already satisfied: click in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers) (8.0.3)\n", + "Requirement already satisfied: six in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers) (1.15.0)\n", + "Requirement already satisfied: joblib in /opt/conda/lib/python3.8/site-packages (from sacremoses->transformers) (1.1.0)\n" ] }, { @@ -637,9 +553,18 @@ "name": "stdout", "output_type": "stream", "text": [ - "Requirement already satisfied: jiwer in /opt/conda/lib/python3.8/site-packages (2.3.0)\n", - "Requirement already satisfied: python-Levenshtein==0.12.2 in /opt/conda/lib/python3.8/site-packages (from jiwer) (0.12.2)\n", - "Requirement already satisfied: setuptools in /opt/conda/lib/python3.8/site-packages (from python-Levenshtein==0.12.2->jiwer) (50.3.1.post20201107)\n" + "Requirement already satisfied: huggingface_hub in /opt/conda/lib/python3.8/site-packages (0.4.0)\n", + "Requirement already satisfied: typing-extensions>=3.7.4.3 in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (4.0.1)\n", + "Requirement already satisfied: packaging>=20.9 in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (21.3)\n", + "Requirement already satisfied: requests in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (2.24.0)\n", + "Requirement already satisfied: filelock in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (3.0.12)\n", + "Requirement already satisfied: tqdm in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (4.62.3)\n", + "Requirement already satisfied: pyyaml in /opt/conda/lib/python3.8/site-packages (from huggingface_hub) (5.4.1)\n", + "Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /opt/conda/lib/python3.8/site-packages (from packaging>=20.9->huggingface_hub) (3.0.7)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub) (2020.12.5)\n", + "Requirement already satisfied: idna<3,>=2.5 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub) (2.10)\n", + "Requirement already satisfied: chardet<4,>=3.0.2 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub) (3.0.4)\n", + "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /opt/conda/lib/python3.8/site-packages (from requests->huggingface_hub) (1.25.11)\n" ] }, { @@ -696,19 +621,16 @@ } ], "source": [ - "%%bash\n", - "pip install datasets==1.13.3\n", - "pip install transformers==4.11.3\n", - "pip install huggingface_hub==0.1\n", - "pip install torchaudio\n", - "pip install librosa\n", - "pip install jiwer" + "%%bash \n", + "pip install datasets\n", + "pip install transformers\n", + "pip install huggingface_hub" ] }, { "cell_type": "code", - "execution_count": 2, - "id": "5082f3ca", + "execution_count": 3, + "id": "de0f5463", "metadata": {}, "outputs": [], "source": [ @@ -721,7 +643,7 @@ { "cell_type": "code", "execution_count": null, - "id": "c5838f22", + "id": "63173007", "metadata": { "collapsed": true, "jupyter": { @@ -13481,10 +13403,18 @@ "unzip km_kh_male.zip" ] }, + { + "cell_type": "markdown", + "id": "0654902f", + "metadata": {}, + "source": [ + "### Load KH Data" + ] + }, { "cell_type": "code", - "execution_count": 3, - "id": "94fea955", + "execution_count": 75, + "id": "98a02203", "metadata": {}, "outputs": [], "source": [ @@ -13504,18 +13434,100 @@ }, { "cell_type": "code", - "execution_count": 32, - "id": "0bdb4556", + "execution_count": 76, + "id": "bae5c1a6", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "Using custom data configuration default-217f48c3bbd91dba\n", - "Reusing dataset csv (/workspace/.cache/huggingface/datasets/csv/default-217f48c3bbd91dba/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)\n", - "Using custom data configuration default-b7fdb19422ec70d7\n", - "Reusing dataset csv (/workspace/.cache/huggingface/datasets/csv/default-b7fdb19422ec70d7/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e)\n" + "Using custom data configuration default-b51ead59fc2a879b\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Downloading and preparing dataset csv/default to /workspace/.cache/huggingface/datasets/csv/default-b51ead59fc2a879b/0.0.0/6b9057d9e23d9d8a2f05b985917a0da84d70c5dae3d22ddd8a3f22fb01c69d9e...\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "61f2d169012e407ba87f1b358ac4ff5b", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:00\n", - " \n", + " \n", " Your browser does not support the audio element.\n", " \n", " " @@ -13880,7 +13995,7 @@ "" ] }, - "execution_count": 51, + "execution_count": 22, "metadata": {}, "output_type": "execute_result" } @@ -13900,8 +14015,8 @@ }, { "cell_type": "code", - "execution_count": 52, - "id": "b10b6aa1", + "execution_count": 23, + "id": "c0af61ca", "metadata": {}, "outputs": [], "source": [ @@ -13922,10 +14037,33 @@ }, { "cell_type": "code", - "execution_count": 53, - "id": "a1776bef", + "execution_count": 24, + "id": "527e89eb", "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-e3ff506f96ec6817.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-00a0dacd1c387ee8.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-89839f1a29958c06.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-ea97d53e6e03248b.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-74c31e1ede89718b.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-b4485d5ec10af59a.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-87741a8a8705e488.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-2aa5c421e49dbb8a.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-6fa3756abc090cb1.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-7082faf01a7536d9.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-dbf56923bad5550e.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-cfa541d30ccf3270.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-9f28af78c8d178d8.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-4fc740b07e55a01b.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-ec4bd65c3d0c2b80.arrow\n", + "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/common_voice/tr/6.1.0/5693bfc0feeade582a78c2fb250bc88f52bd86f0a7f1bb22bfee67e715de30fd/cache-033c2e0fab0f0e8a.arrow\n" + ] + } + ], "source": [ "common_voice_train = common_voice_train.map(prepare_dataset, remove_columns=common_voice_train.column_names, num_proc=16)\n", "common_voice_test = common_voice_test.map(prepare_dataset, remove_columns=common_voice_test.column_names, num_proc=16)" @@ -13934,7 +14072,7 @@ { "cell_type": "code", "execution_count": 41, - "id": "8eea6563", + "id": "b73b00a8", "metadata": {}, "outputs": [], "source": [ @@ -13945,8 +14083,8 @@ }, { "cell_type": "code", - "execution_count": 54, - "id": "f15bec0a", + "execution_count": 25, + "id": "0d157cd6", "metadata": {}, "outputs": [], "source": [ @@ -13987,6 +14125,7 @@ " padding=self.padding,\n", " return_tensors=\"pt\",\n", " )\n", + "\n", " with self.processor.as_target_processor():\n", " labels_batch = self.processor.pad(\n", " label_features,\n", @@ -14004,8 +14143,8 @@ }, { "cell_type": "code", - "execution_count": 55, - "id": "d30dafe4", + "execution_count": 26, + "id": "848984c4", "metadata": {}, "outputs": [], "source": [ @@ -14014,19 +14153,19 @@ }, { "cell_type": "code", - "execution_count": 56, - "id": "408bcb4d", + "execution_count": 27, + "id": "1472ec1d", "metadata": {}, "outputs": [], "source": [ - "# wer_metric = load_metric(\"wer\")\n", - "cer_metric = load_metric(\"cer\")" + "wer_metric = load_metric(\"wer\")\n", + "# cer_metric = load_metric(\"cer\")" ] }, { "cell_type": "code", - "execution_count": 57, - "id": "e5573fd8", + "execution_count": 28, + "id": "585247d7", "metadata": {}, "outputs": [], "source": [ @@ -14034,48 +14173,30 @@ " pred_logits = pred.predictions\n", " pred_ids = np.argmax(pred_logits, axis=-1)\n", "\n", - " pred.label_ids[pred.label_ids == -100] = processor.tokenizer.pad_token_id\n", + " pred.label_ids[pred.label_ids == -100] = tokenizer.pad_token_id\n", "\n", - " pred_str = processor.batch_decode(pred_ids)\n", + " pred_str = tokenizer.batch_decode(pred_ids)\n", " # we do not want to group tokens when computing the metrics\n", - " label_str = processor.batch_decode(pred.label_ids, group_tokens=False)\n", + " label_str = tokenizer.batch_decode(pred.label_ids, group_tokens=False)\n", "\n", - " # wer = wer_metric.compute(predictions=pred_str, references=label_str)\n", - " cer = cer_metric.compute(predictions=pred_str, references=label_str)\n", + " wer = wer_metric.compute(predictions=pred_str, references=label_str)\n", + "# cer = cer_metric.compute(predictions=pred_str, references=label_str)\n", "\n", - " # return {\"wer\": wer}\n", - " return {\"cer\": cer}" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "da8c34ad", - "metadata": {}, - "outputs": [], - "source": [ - "\n" + " return {\"wer\": wer}\n", + "# return {\"cer\": cer}" ] }, { "cell_type": "code", - "execution_count": null, - "id": "229b8ebf", - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "code", - "execution_count": 58, - "id": "7b36eee5", + "execution_count": 29, + "id": "674f8f32", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "Some weights of the model checkpoint at facebook/wav2vec2-xls-r-300m were not used when initializing Wav2Vec2ForCTC: ['project_hid.bias', 'quantizer.weight_proj.weight', 'quantizer.weight_proj.bias', 'project_q.weight', 'project_hid.weight', 'quantizer.codevectors', 'project_q.bias']\n", + "Some weights of the model checkpoint at facebook/wav2vec2-xls-r-300m were not used when initializing Wav2Vec2ForCTC: ['quantizer.weight_proj.weight', 'project_q.bias', 'project_hid.bias', 'project_q.weight', 'quantizer.weight_proj.bias', 'quantizer.codevectors', 'project_hid.weight']\n", "- This IS expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n", "- This IS NOT expected if you are initializing Wav2Vec2ForCTC from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n", "Some weights of Wav2Vec2ForCTC were not initialized from the model checkpoint at facebook/wav2vec2-xls-r-300m and are newly initialized: ['lm_head.weight', 'lm_head.bias']\n", @@ -14094,45 +14215,27 @@ " mask_time_prob=0.05,\n", " layerdrop=0.0,\n", " ctc_loss_reduction=\"mean\", \n", - " pad_token_id=processor.tokenizer.pad_token_id,\n", + " pad_token_id=tokenizer.pad_token_id,\n", " vocab_size=len(processor.tokenizer),\n", ")" ] }, { "cell_type": "code", - "execution_count": 59, - "id": "7ec46eca", + "execution_count": 30, + "id": "79cab4ae", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/opt/conda/lib/python3.8/site-packages/transformers/models/wav2vec2/modeling_wav2vec2.py:1700: FutureWarning: The method `freeze_feature_extractor` is deprecated and will be removed in Transformers v5.Please use the equivalent `freeze_feature_encoder` method instead.\n", - " warnings.warn(\n" - ] - } - ], + "outputs": [], "source": [ - "model.freeze_feature_extractor()" + "model.freeze_feature_encoder()" ] }, { "cell_type": "code", - "execution_count": 65, - "id": "9db5b382", + "execution_count": 31, + "id": "d463ab8f", "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "PyTorch: setting up devices\n", - "The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).\n" - ] - } - ], + "outputs": [], "source": [ "from transformers import TrainingArguments\n", "\n", @@ -14144,28 +14247,26 @@ " evaluation_strategy=\"steps\",\n", " gradient_checkpointing=True,\n", " fp16=True,\n", - " num_train_epochs=30,\n", - " save_steps=1,\n", - " eval_steps=1,\n", + " num_train_epochs=25,\n", + " save_steps=500,\n", + " eval_steps=500,\n", " logging_steps=100,\n", - " learning_rate=3e-5,\n", - " warmup_steps=500,\n", - " save_total_limit=3,\n", - " push_to_hub=True,\n", + " learning_rate=5e-5,\n", + " warmup_steps=1000,\n", + " save_total_limit=3\n", ")" ] }, { "cell_type": "code", - "execution_count": 66, - "id": "96c9aeb9", + "execution_count": 32, + "id": "03fbc0fa", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "/workspace/xls-r-300m-km/. is already a clone of https://huggingface.co/vitouphy/xls-r-300m-km. Make sure you pull the latest changes with `repo.git_pull()`.\n", "Using amp half precision backend\n" ] } @@ -14186,8 +14287,8 @@ }, { "cell_type": "code", - "execution_count": null, - "id": "a3a38848", + "execution_count": 33, + "id": "ddc04b2e", "metadata": {}, "outputs": [ { @@ -14198,12 +14299,12 @@ "/opt/conda/lib/python3.8/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use thePyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n", " warnings.warn(\n", "***** Running training *****\n", - " Num examples = 2615\n", - " Num Epochs = 30\n", + " Num examples = 3478\n", + " Num Epochs = 25\n", " Instantaneous batch size per device = 8\n", " Total train batch size (w. parallel, distributed & accumulation) = 16\n", " Gradient Accumulation steps = 2\n", - " Total optimization steps = 4890\n" + " Total optimization steps = 5425\n" ] }, { @@ -14212,8 +14313,8 @@ "\n", "
\n", " \n", - " \n", - " [ 2/4890 : < :, Epoch 0.01/30]\n", + " \n", + " [5425/5425 1:31:08, Epoch 24/25]\n", "
\n", " \n", " \n", @@ -14221,15 +14322,69 @@ " \n", " \n", " \n", - " \n", + " \n", " \n", " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", "
StepTraining LossValidation LossCerWer
1No log13.3003260.9892655003.8859003.7607851.000000
10001.8193001.5307821.000613
15000.5986000.7295361.005616
20000.3992000.6185581.013377
25000.3199000.5972451.012254
30000.2388000.5555721.010109
35000.1882000.5172811.014092
40000.1604000.5170091.018278
45000.1443000.5267381.018380
50000.1404000.5366641.016747

" @@ -14247,14 +14402,107 @@ "text": [ "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", "***** Running Evaluation *****\n", - " Num examples = 291\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-500\n", + "Configuration saved in ./checkpoint-500/config.json\n", + "Model weights saved in ./checkpoint-500/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-500/preprocessor_config.json\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-1000\n", + "Configuration saved in ./checkpoint-1000/config.json\n", + "Model weights saved in ./checkpoint-1000/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-1000/preprocessor_config.json\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", " Batch size = 8\n", - "Saving model checkpoint to ./checkpoint-1\n", - "Configuration saved in ./checkpoint-1/config.json\n", - "Model weights saved in ./checkpoint-1/pytorch_model.bin\n", - "Configuration saved in ./checkpoint-1/preprocessor_config.json\n", - "Configuration saved in ./preprocessor_config.json\n" + "Saving model checkpoint to ./checkpoint-1500\n", + "Configuration saved in ./checkpoint-1500/config.json\n", + "Model weights saved in ./checkpoint-1500/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-1500/preprocessor_config.json\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-2000\n", + "Configuration saved in ./checkpoint-2000/config.json\n", + "Model weights saved in ./checkpoint-2000/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-2000/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-500] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-2500\n", + "Configuration saved in ./checkpoint-2500/config.json\n", + "Model weights saved in ./checkpoint-2500/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-2500/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-1000] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-3000\n", + "Configuration saved in ./checkpoint-3000/config.json\n", + "Model weights saved in ./checkpoint-3000/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-3000/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-1500] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-3500\n", + "Configuration saved in ./checkpoint-3500/config.json\n", + "Model weights saved in ./checkpoint-3500/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-3500/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-2000] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-4000\n", + "Configuration saved in ./checkpoint-4000/config.json\n", + "Model weights saved in ./checkpoint-4000/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-4000/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-2500] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-4500\n", + "Configuration saved in ./checkpoint-4500/config.json\n", + "Model weights saved in ./checkpoint-4500/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-4500/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-3000] due to args.save_total_limit\n", + "The following columns in the evaluation set don't have a corresponding argument in `Wav2Vec2ForCTC.forward` and have been ignored: input_length.\n", + "***** Running Evaluation *****\n", + " Num examples = 1647\n", + " Batch size = 8\n", + "Saving model checkpoint to ./checkpoint-5000\n", + "Configuration saved in ./checkpoint-5000/config.json\n", + "Model weights saved in ./checkpoint-5000/pytorch_model.bin\n", + "Configuration saved in ./checkpoint-5000/preprocessor_config.json\n", + "Deleting older checkpoint [checkpoint-3500] due to args.save_total_limit\n", + "\n", + "\n", + "Training completed. Do not forget to share your model on huggingface.co/models =)\n", + "\n", + "\n" ] + }, + { + "data": { + "text/plain": [ + "TrainOutput(global_step=5425, training_loss=1.241710463449153, metrics={'train_runtime': 5469.9405, 'train_samples_per_second': 15.896, 'train_steps_per_second': 0.992, 'total_flos': 1.0590512839529611e+19, 'train_loss': 1.241710463449153, 'epoch': 25.0})" + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" } ], "source": [ @@ -14264,7 +14512,7 @@ { "cell_type": "code", "execution_count": null, - "id": "e27620ac", + "id": "f0587cc3", "metadata": {}, "outputs": [], "source": []