{ "cells": [ { "cell_type": "markdown", "metadata": { "id": "5hESxSyaGNfH" }, "source": [ "Code Credit: https://huggingface.co/spaces/fffiloni/instant-TTS-Bark-cloning" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "_4Hsgkg-Emz8", "outputId": "de235292-cd72-4ccd-8b74-65f41f2ca03f" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Cloning into 'instant-TTS-Bark-cloning'...\n", "remote: Enumerating objects: 33, done.\u001b[K\n", "remote: Counting objects: 100% (6/6), done.\u001b[K\n", "remote: Compressing objects: 100% (6/6), done.\u001b[K\n", "remote: Total 33 (delta 1), reused 3 (delta 0), pack-reused 27\u001b[K\n", "Unpacking objects: 100% (33/33), 2.73 MiB | 12.95 MiB/s, done.\n" ] } ], "source": [ "!git clone https://huggingface.co/spaces/agonh/instant-TTS-Bark-cloning" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "5zYEm7MTFBMR", "outputId": "90a9a3e8-fc76-4806-f698-a43034a7e6bf" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "/content/instant-TTS-Bark-cloning\n" ] } ], "source": [ "%cd instant-TTS-Bark-cloning" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "id": "sCIYYF39FRJV", "outputId": "3202b177-391a-4619-daef-974695e9163f" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Collecting git+https://github.com/agonai/TTS.git (from -r requirements.txt (line 1))\n", " Cloning https://github.com/agonai/TTS.git to /tmp/pip-req-build-pdd4oew4\n", " Running command git clone --filter=blob:none --quiet https://github.com/agonai/TTS.git /tmp/pip-req-build-pdd4oew4\n", " Resolved https://github.com/agonai/TTS.git to commit 5327b800fdc060399910770461a69ecade231a9e\n", " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", " Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", "Collecting git+https://github.com/huggingface/transformers.git (from -r requirements.txt (line 2))\n", " Cloning https://github.com/huggingface/transformers.git to /tmp/pip-req-build-jdx032sc\n", " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers.git /tmp/pip-req-build-jdx032sc\n", " Resolved https://github.com/huggingface/transformers.git to commit 95b374952dc27d8511541d6f5a4e22c9ec11fb24\n", " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", " Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: torch in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 3)) (2.0.1+cu118)\n", "Requirement already satisfied: scipy in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 4)) (1.10.1)\n", "Collecting pydub (from -r requirements.txt (line 5))\n", " Downloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n", "Collecting cython==0.29.30 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Using cached Cython-0.29.30-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.manylinux_2_24_x86_64.whl (1.9 MB)\n", "Requirement already satisfied: torchaudio in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (2.0.2+cu118)\n", "Requirement already satisfied: soundfile in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (0.12.1)\n", "Collecting librosa==0.10.0.* (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading librosa-0.10.0.post2-py3-none-any.whl (253 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m253.0/253.0 kB\u001b[0m \u001b[31m6.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting inflect==5.6.0 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading inflect-5.6.0-py3-none-any.whl (33 kB)\n", "Requirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (4.66.1)\n", "Collecting anyascii (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading anyascii-0.3.2-py3-none-any.whl (289 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m289.9/289.9 kB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (6.0.1)\n", "Requirement already satisfied: fsspec>=2021.04.0 in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (2023.6.0)\n", "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (3.8.5)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (23.1)\n", "Requirement already satisfied: flask in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (2.2.5)\n", "Collecting pysbd (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading pysbd-0.3.4-py3-none-any.whl (71 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m71.1/71.1 kB\u001b[0m \u001b[31m8.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting umap-learn==0.5.1 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading umap-learn-0.5.1.tar.gz (80 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m80.9/80.9 kB\u001b[0m \u001b[31m9.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (1.5.3)\n", "Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (3.7.1)\n", "Collecting trainer (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading trainer-0.0.31-py3-none-any.whl (50 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m50.6/50.6 kB\u001b[0m \u001b[31m6.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting coqpit>=0.0.16 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading coqpit-0.0.17-py3-none-any.whl (13 kB)\n", "Requirement already satisfied: jieba in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (0.42.1)\n", "Collecting pypinyin (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading pypinyin-0.49.0-py2.py3-none-any.whl (1.4 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.4/1.4 MB\u001b[0m \u001b[31m13.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting gruut[de,es,fr]==2.2.3 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut-2.2.3.tar.gz (73 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m73.5/73.5 kB\u001b[0m \u001b[31m6.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting jamo (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading jamo-0.4.1-py3-none-any.whl (9.5 kB)\n", "Requirement already satisfied: nltk in /usr/local/lib/python3.10/dist-packages (from TTS==0.16.3->-r requirements.txt (line 1)) (3.8.1)\n", "Collecting g2pkk>=0.1.1 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading g2pkk-0.1.2-py3-none-any.whl (25 kB)\n", "Collecting bangla==0.0.2 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading bangla-0.0.2-py2.py3-none-any.whl (6.2 kB)\n", "Collecting bnnumerizer (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading bnnumerizer-0.0.2.tar.gz (4.7 kB)\n", " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting bnunicodenormalizer==0.1.1 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading bnunicodenormalizer-0.1.1.tar.gz (38 kB)\n", " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting k-diffusion (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading k_diffusion-0.0.16-py3-none-any.whl (25 kB)\n", "Collecting einops (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading einops-0.6.1-py3-none-any.whl (42 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m42.2/42.2 kB\u001b[0m \u001b[31m4.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting encodec (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading encodec-0.1.1.tar.gz (3.7 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.7/3.7 MB\u001b[0m \u001b[31m22.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting numpy==1.22.0 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Using cached numpy-1.22.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (16.8 MB)\n", "Collecting numba==0.57.0 (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading numba-0.57.0-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl (3.6 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.6/3.6 MB\u001b[0m \u001b[31m35.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: Babel<3.0.0,>=2.8.0 in /usr/local/lib/python3.10/dist-packages (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1)) (2.12.1)\n", "Collecting dateparser~=1.1.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading dateparser-1.1.8-py2.py3-none-any.whl (293 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m293.8/293.8 kB\u001b[0m \u001b[31m28.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting gruut-ipa<1.0,>=0.12.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut-ipa-0.13.0.tar.gz (101 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m101.6/101.6 kB\u001b[0m \u001b[31m12.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting gruut_lang_en~=2.0.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut_lang_en-2.0.0.tar.gz (15.2 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m15.2/15.2 MB\u001b[0m \u001b[31m40.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting jsonlines~=1.2.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading jsonlines-1.2.0-py2.py3-none-any.whl (7.6 kB)\n", "Collecting networkx<3.0.0,>=2.5.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading networkx-2.8.8-py3-none-any.whl (2.0 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.0/2.0 MB\u001b[0m \u001b[31m76.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting num2words<1.0.0,>=0.5.10 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading num2words-0.5.12-py3-none-any.whl (125 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m125.2/125.2 kB\u001b[0m \u001b[31m16.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting python-crfsuite~=0.9.7 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading python_crfsuite-0.9.9-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (993 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m993.5/993.5 kB\u001b[0m \u001b[31m67.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting gruut_lang_fr~=2.0.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut_lang_fr-2.0.2.tar.gz (10.9 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m10.9/10.9 MB\u001b[0m \u001b[31m63.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting gruut_lang_es~=2.0.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut_lang_es-2.0.0.tar.gz (31.4 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m31.4/31.4 MB\u001b[0m \u001b[31m14.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting gruut_lang_de~=2.0.0 (from gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gruut_lang_de-2.0.0.tar.gz (18.1 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m18.1/18.1 MB\u001b[0m \u001b[31m75.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (3.0.0)\n", "INFO: pip is looking at multiple versions of librosa to determine which version is compatible with other requirements. This could take a while.\n", "Collecting librosa==0.10.0.* (from TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading librosa-0.10.0.post1-py3-none-any.whl (252 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m253.0/253.0 kB\u001b[0m \u001b[31m22.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Downloading librosa-0.10.0-py3-none-any.whl (252 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m252.9/252.9 kB\u001b[0m \u001b[31m28.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: scikit-learn>=0.20.0 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (1.2.2)\n", "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (1.3.2)\n", "Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (4.4.2)\n", "Requirement already satisfied: pooch>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (1.7.0)\n", "Requirement already satisfied: soxr>=0.3.2 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (0.3.6)\n", "Requirement already satisfied: typing-extensions>=4.1.1 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (4.5.0)\n", "Requirement already satisfied: lazy-loader>=0.1 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (0.3)\n", "Requirement already satisfied: msgpack>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (1.0.5)\n", "Collecting llvmlite<0.41,>=0.40.0dev0 (from numba==0.57.0->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading llvmlite-0.40.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (42.1 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m42.1/42.1 MB\u001b[0m \u001b[31m13.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting pynndescent>=0.5 (from umap-learn==0.5.1->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading pynndescent-0.5.10.tar.gz (1.1 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.1/1.1 MB\u001b[0m \u001b[31m60.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.34.0.dev0->-r requirements.txt (line 2)) (3.12.2)\n", "Collecting huggingface-hub<1.0,>=0.15.1 (from transformers==4.34.0.dev0->-r requirements.txt (line 2))\n", " Downloading huggingface_hub-0.16.4-py3-none-any.whl (268 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m268.8/268.8 kB\u001b[0m \u001b[31m26.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.34.0.dev0->-r requirements.txt (line 2)) (2023.6.3)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.34.0.dev0->-r requirements.txt (line 2)) (2.31.0)\n", "Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers==4.34.0.dev0->-r requirements.txt (line 2))\n", " Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[31m82.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting safetensors>=0.3.1 (from transformers==4.34.0.dev0->-r requirements.txt (line 2))\n", " Downloading safetensors-0.3.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m66.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch->-r requirements.txt (line 3)) (1.12)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch->-r requirements.txt (line 3)) (3.1.2)\n", "Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch->-r requirements.txt (line 3)) (2.0.0)\n", "Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch->-r requirements.txt (line 3)) (3.27.4.1)\n", "Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch->-r requirements.txt (line 3)) (16.0.6)\n", "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from soundfile->TTS==0.16.3->-r requirements.txt (line 1)) (1.15.1)\n", "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (23.1.0)\n", "Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (3.2.0)\n", "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (6.0.4)\n", "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (4.0.3)\n", "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (1.9.2)\n", "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (1.4.0)\n", "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->TTS==0.16.3->-r requirements.txt (line 1)) (1.3.1)\n", "Requirement already satisfied: Werkzeug>=2.2.2 in /usr/local/lib/python3.10/dist-packages (from flask->TTS==0.16.3->-r requirements.txt (line 1)) (2.3.7)\n", "Requirement already satisfied: itsdangerous>=2.0 in /usr/local/lib/python3.10/dist-packages (from flask->TTS==0.16.3->-r requirements.txt (line 1)) (2.1.2)\n", "Requirement already satisfied: click>=8.0 in /usr/local/lib/python3.10/dist-packages (from flask->TTS==0.16.3->-r requirements.txt (line 1)) (8.1.7)\n", "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch->-r requirements.txt (line 3)) (2.1.3)\n", "Collecting accelerate (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading accelerate-0.22.0-py3-none-any.whl (251 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m251.2/251.2 kB\u001b[0m \u001b[31m23.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting clean-fid (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading clean_fid-0.1.35-py3-none-any.whl (26 kB)\n", "Collecting clip-anytorch (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading clip_anytorch-2.5.2-py3-none-any.whl (1.4 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.4/1.4 MB\u001b[0m \u001b[31m60.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting jsonmerge (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading jsonmerge-1.9.2-py3-none-any.whl (19 kB)\n", "Collecting kornia (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading kornia-0.7.0-py2.py3-none-any.whl (705 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m705.7/705.7 kB\u001b[0m \u001b[31m44.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: Pillow in /usr/local/lib/python3.10/dist-packages (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (9.4.0)\n", "Collecting resize-right (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading resize_right-0.0.2-py3-none-any.whl (8.9 kB)\n", "Requirement already satisfied: scikit-image in /usr/local/lib/python3.10/dist-packages (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (0.19.3)\n", "Collecting torchdiffeq (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading torchdiffeq-0.2.3-py3-none-any.whl (31 kB)\n", "Collecting torchsde (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading torchsde-0.2.5-py3-none-any.whl (59 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m59.2/59.2 kB\u001b[0m \u001b[31m6.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: torchvision in /usr/local/lib/python3.10/dist-packages (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (0.15.2+cu118)\n", "Collecting wandb (from k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading wandb-0.15.10-py3-none-any.whl (2.1 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.1/2.1 MB\u001b[0m \u001b[31m70.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (1.1.0)\n", "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (0.11.0)\n", "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (4.42.1)\n", "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (1.4.5)\n", "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (3.1.1)\n", "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib->TTS==0.16.3->-r requirements.txt (line 1)) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->TTS==0.16.3->-r requirements.txt (line 1)) (2023.3.post1)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.34.0.dev0->-r requirements.txt (line 2)) (3.4)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.34.0.dev0->-r requirements.txt (line 2)) (2.0.4)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.34.0.dev0->-r requirements.txt (line 2)) (2023.7.22)\n", "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch->-r requirements.txt (line 3)) (1.3.0)\n", "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from trainer->TTS==0.16.3->-r requirements.txt (line 1)) (5.9.5)\n", "Requirement already satisfied: tensorboard in /usr/local/lib/python3.10/dist-packages (from trainer->TTS==0.16.3->-r requirements.txt (line 1)) (2.13.0)\n", "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->soundfile->TTS==0.16.3->-r requirements.txt (line 1)) (2.21)\n", "Requirement already satisfied: tzlocal in /usr/local/lib/python3.10/dist-packages (from dateparser~=1.1.0->gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1)) (5.0.1)\n", "Requirement already satisfied: six in /usr/local/lib/python3.10/dist-packages (from jsonlines~=1.2.0->gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1)) (1.16.0)\n", "Collecting docopt>=0.6.2 (from num2words<1.0.0,>=0.5.10->gruut[de,es,fr]==2.2.3->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading docopt-0.6.2.tar.gz (25 kB)\n", " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: platformdirs>=2.5.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.0->librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (3.10.0)\n", "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.20.0->librosa==0.10.0.*->TTS==0.16.3->-r requirements.txt (line 1)) (3.2.0)\n", "Collecting ftfy (from clip-anytorch->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading ftfy-6.1.1-py3-none-any.whl (53 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m53.1/53.1 kB\u001b[0m \u001b[31m6.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: jsonschema>2.4.0 in /usr/local/lib/python3.10/dist-packages (from jsonmerge->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (4.19.0)\n", "Requirement already satisfied: imageio>=2.4.1 in /usr/local/lib/python3.10/dist-packages (from scikit-image->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (2.31.3)\n", "Requirement already satisfied: tifffile>=2019.7.26 in /usr/local/lib/python3.10/dist-packages (from scikit-image->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (2023.8.30)\n", "Requirement already satisfied: PyWavelets>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from scikit-image->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (1.4.1)\n", "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (1.4.0)\n", "Requirement already satisfied: grpcio>=1.48.2 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (1.57.0)\n", "Requirement already satisfied: google-auth<3,>=1.6.3 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (2.17.3)\n", "Requirement already satisfied: google-auth-oauthlib<1.1,>=0.5 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (1.0.0)\n", "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (3.4.4)\n", "Requirement already satisfied: protobuf>=3.19.6 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (3.20.3)\n", "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (67.7.2)\n", "Requirement already satisfied: tensorboard-data-server<0.8.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (0.7.1)\n", "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.10/dist-packages (from tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (0.41.2)\n", "Collecting boltons>=20.2.1 (from torchsde->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading boltons-23.0.0-py2.py3-none-any.whl (194 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.8/194.8 kB\u001b[0m \u001b[31m21.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting trampoline>=0.1.2 (from torchsde->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading trampoline-0.1.2-py3-none-any.whl (5.2 kB)\n", "Collecting GitPython!=3.1.29,>=1.0.0 (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading GitPython-3.1.35-py3-none-any.whl (188 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m188.8/188.8 kB\u001b[0m \u001b[31m20.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting sentry-sdk>=1.0.0 (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading sentry_sdk-1.30.0-py2.py3-none-any.whl (218 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m218.8/218.8 kB\u001b[0m \u001b[31m20.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hCollecting docker-pycreds>=0.4.0 (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading docker_pycreds-0.4.0-py2.py3-none-any.whl (9.0 kB)\n", "Collecting pathtools (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading pathtools-0.1.2.tar.gz (11 kB)\n", " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "Collecting setproctitle (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading setproctitle-1.3.2-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (30 kB)\n", "Requirement already satisfied: appdirs>=1.4.3 in /usr/local/lib/python3.10/dist-packages (from wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (1.4.4)\n", "Collecting gitdb<5,>=4.0.1 (from GitPython!=3.1.29,>=1.0.0->wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading gitdb-4.0.10-py3-none-any.whl (62 kB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.7/62.7 kB\u001b[0m \u001b[31m6.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hRequirement already satisfied: cachetools<6.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (5.3.1)\n", "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (0.3.0)\n", "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (4.9)\n", "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from google-auth-oauthlib<1.1,>=0.5->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (1.3.1)\n", "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema>2.4.0->jsonmerge->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (2023.7.1)\n", "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema>2.4.0->jsonmerge->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (0.30.2)\n", "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema>2.4.0->jsonmerge->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (0.10.2)\n", "Requirement already satisfied: wcwidth>=0.2.5 in /usr/local/lib/python3.10/dist-packages (from ftfy->clip-anytorch->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1)) (0.2.6)\n", "Collecting smmap<6,>=3.0.1 (from gitdb<5,>=4.0.1->GitPython!=3.1.29,>=1.0.0->wandb->k-diffusion->TTS==0.16.3->-r requirements.txt (line 1))\n", " Downloading smmap-5.0.0-py3-none-any.whl (24 kB)\n", "Requirement already satisfied: pyasn1<0.6.0,>=0.4.6 in /usr/local/lib/python3.10/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3,>=1.6.3->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (0.5.0)\n", "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<1.1,>=0.5->tensorboard->trainer->TTS==0.16.3->-r requirements.txt (line 1)) (3.2.2)\n", "Building wheels for collected packages: TTS, bnunicodenormalizer, umap-learn, transformers, bnnumerizer, encodec, gruut-ipa, gruut_lang_de, gruut_lang_en, gruut_lang_es, gruut_lang_fr, pynndescent, gruut, docopt, pathtools\n", " Building wheel for TTS (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for TTS: filename=TTS-0.16.3-cp310-cp310-linux_x86_64.whl size=809310 sha256=b9d3cb51d7e8b8bd2990ddff3e91cb03dbdf8b0d3ff946bec40c358f4b7be99f\n", " Stored in directory: /tmp/pip-ephem-wheel-cache-w7n769jv/wheels/5c/01/b4/af2f06d03a78af481d99ac6902c1b9c399fbfb922c1a7e1508\n", " Building wheel for bnunicodenormalizer (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for bnunicodenormalizer: filename=bnunicodenormalizer-0.1.1-py3-none-any.whl size=21895 sha256=024b3845ff58ec45bdb9aac7359863062184b6d415025e17f3b5889549826650\n", " Stored in directory: /root/.cache/pip/wheels/b4/f6/01/9e68ecec7c7ea85fc9431cfac42eba1c5a5f6debe5070de5c7\n", " Building wheel for umap-learn (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for umap-learn: filename=umap_learn-0.5.1-py3-none-any.whl size=76543 sha256=baaf147854ecbcf2abd0ae046c9994b751fc14c9f3cc22ea702f00aead97ea9d\n", " Stored in directory: /root/.cache/pip/wheels/69/21/8e/802cb9c4c606a67139f538cb17bf3bf1b98b739a7900469953\n", " Building wheel for transformers (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for transformers: filename=transformers-4.34.0.dev0-py3-none-any.whl size=7640036 sha256=bb74cf4a35266320411f623f5d5f460ea7a5165e8fcbf13f7990747da26b8f35\n", " Stored in directory: /tmp/pip-ephem-wheel-cache-w7n769jv/wheels/e7/9c/5b/e1a9c8007c343041e61cc484433d512ea9274272e3fcbe7c16\n", " Building wheel for bnnumerizer (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for bnnumerizer: filename=bnnumerizer-0.0.2-py3-none-any.whl size=5259 sha256=85b73938ba1c2fa9cb3b675af4714c3ab116f3a5bb64360f3f3a9d6b5e83ede6\n", " Stored in directory: /root/.cache/pip/wheels/59/6b/e8/223172e7d5c9f72df3ea1a0d9258f3a8ab5b28e827728edef5\n", " Building wheel for encodec (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for encodec: filename=encodec-0.1.1-py3-none-any.whl size=45760 sha256=a32ac6a2cad0598ada52925c7a72aa4185da4a350763e29a145311f0d06d4e60\n", " Stored in directory: /root/.cache/pip/wheels/fc/36/cb/81af8b985a5f5e0815312d5e52b41263237af07b977e6bcbf3\n", " Building wheel for gruut-ipa (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut-ipa: filename=gruut_ipa-0.13.0-py3-none-any.whl size=104871 sha256=9ca7ae6bf44d88f5f060b9316b838558dea165728fee1ac4abacf49eaa82faf1\n", " Stored in directory: /root/.cache/pip/wheels/7b/18/49/e4f500ecdf0babe757953f844e4d7cd1ea81c5503c09bfe984\n", " Building wheel for gruut_lang_de (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut_lang_de: filename=gruut_lang_de-2.0.0-py3-none-any.whl size=18498181 sha256=6e20f641bd2ff22dd43408e43d8cf1264267a21f60d9bdc7981b7b0684887754\n", " Stored in directory: /root/.cache/pip/wheels/95/9a/05/cfce98f0c41a1a540f15708c4a02df190b82d84cf91ef6bc7f\n", " Building wheel for gruut_lang_en (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut_lang_en: filename=gruut_lang_en-2.0.0-py3-none-any.whl size=15297179 sha256=47c014ec3f0dbf22fa7b2df009c585f5512c77bd35cddbb0e3e76a283aa6769b\n", " Stored in directory: /root/.cache/pip/wheels/10/9c/fb/77c655a9fbd78cdb9935d0ab65d80ddd0a3bcf7dbe18261650\n", " Building wheel for gruut_lang_es (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut_lang_es: filename=gruut_lang_es-2.0.0-py3-none-any.whl size=32173797 sha256=0cd6d94acf730afc2e5b7535919460e3ce82991bff766f22ea05afafa0d9d856\n", " Stored in directory: /root/.cache/pip/wheels/9b/0a/90/788d92c07744b329b9283e37b29b064f5db6b1bb0442a1a19b\n", " Building wheel for gruut_lang_fr (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut_lang_fr: filename=gruut_lang_fr-2.0.2-py3-none-any.whl size=10968767 sha256=ebf90e148a317f44db4a694657ac3107350cf19dedaaa4006e88221431103fe5\n", " Stored in directory: /root/.cache/pip/wheels/db/21/be/d0436e3f1cf9bf38b9bb9b4a476399c77a1ab19f7172b45e19\n", " Building wheel for pynndescent (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for pynndescent: filename=pynndescent-0.5.10-py3-none-any.whl size=55615 sha256=e3ce416bce4596459c357e6bd53b5fa1ed706b767d93e781f05a00ee46d597f2\n", " Stored in directory: /root/.cache/pip/wheels/4a/38/5d/f60a40a66a9512b7e5e83517ebc2d1b42d857be97d135f1096\n", " Building wheel for gruut (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for gruut: filename=gruut-2.2.3-py3-none-any.whl size=75793 sha256=c0a52ea3e1ad4171570e597aab43f2110dcbdc4e7b626a94256e97bd7c8530b2\n", " Stored in directory: /root/.cache/pip/wheels/fc/57/a8/f9de532daf5214f53644f20f3a9e6f69269453c87df9c0a817\n", " Building wheel for docopt (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for docopt: filename=docopt-0.6.2-py2.py3-none-any.whl size=13705 sha256=f96a6d78fb3be8ff2eb176127f702d14ac10933e8eaf0f98f007ff9b83af9811\n", " Stored in directory: /root/.cache/pip/wheels/fc/ab/d4/5da2067ac95b36618c629a5f93f809425700506f72c9732fac\n", " Building wheel for pathtools (setup.py) ... \u001b[?25l\u001b[?25hdone\n", " Created wheel for pathtools: filename=pathtools-0.1.2-py3-none-any.whl size=8791 sha256=2db1b4d593898aef1ce7d586a5673b14c36584da56696399450b2230182761de\n", " Stored in directory: /root/.cache/pip/wheels/e7/f3/22/152153d6eb222ee7a56ff8617d80ee5207207a8c00a7aab794\n", "Successfully built TTS bnunicodenormalizer umap-learn transformers bnnumerizer encodec gruut-ipa gruut_lang_de gruut_lang_en gruut_lang_es gruut_lang_fr pynndescent gruut docopt pathtools\n", "Installing collected packages: trampoline, tokenizers, safetensors, resize-right, python-crfsuite, pydub, pathtools, jamo, gruut_lang_fr, gruut_lang_es, gruut_lang_en, gruut_lang_de, docopt, boltons, bnunicodenormalizer, bnnumerizer, bangla, smmap, setproctitle, sentry-sdk, pysbd, pypinyin, numpy, num2words, networkx, llvmlite, jsonlines, inflect, gruut-ipa, ftfy, einops, docker-pycreds, cython, coqpit, anyascii, numba, huggingface-hub, gitdb, g2pkk, dateparser, transformers, gruut, GitPython, wandb, pynndescent, librosa, jsonmerge, umap-learn, torchsde, torchdiffeq, kornia, clip-anytorch, clean-fid, accelerate, trainer, k-diffusion, encodec, TTS\n", " Attempting uninstall: numpy\n", " Found existing installation: numpy 1.23.5\n", " Uninstalling numpy-1.23.5:\n", " Successfully uninstalled numpy-1.23.5\n", " Attempting uninstall: networkx\n", " Found existing installation: networkx 3.1\n", " Uninstalling networkx-3.1:\n", " Successfully uninstalled networkx-3.1\n", " Attempting uninstall: llvmlite\n", " Found existing installation: llvmlite 0.39.1\n", " Uninstalling llvmlite-0.39.1:\n", " Successfully uninstalled llvmlite-0.39.1\n", " Attempting uninstall: inflect\n", " Found existing installation: inflect 7.0.0\n", " Uninstalling inflect-7.0.0:\n", " Successfully uninstalled inflect-7.0.0\n", " Attempting uninstall: cython\n", " Found existing installation: Cython 0.29.36\n", " Uninstalling Cython-0.29.36:\n", " Successfully uninstalled Cython-0.29.36\n", " Attempting uninstall: numba\n", " Found existing installation: numba 0.56.4\n", " Uninstalling numba-0.56.4:\n", " Successfully uninstalled numba-0.56.4\n", " Attempting uninstall: librosa\n", " Found existing installation: librosa 0.10.1\n", " Uninstalling librosa-0.10.1:\n", " Successfully uninstalled librosa-0.10.1\n", "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n", "plotnine 0.12.3 requires numpy>=1.23.0, but you have numpy 1.22.0 which is incompatible.\u001b[0m\u001b[31m\n", "\u001b[0mSuccessfully installed GitPython-3.1.35 TTS-0.16.3 accelerate-0.22.0 anyascii-0.3.2 bangla-0.0.2 bnnumerizer-0.0.2 bnunicodenormalizer-0.1.1 boltons-23.0.0 clean-fid-0.1.35 clip-anytorch-2.5.2 coqpit-0.0.17 cython-0.29.30 dateparser-1.1.8 docker-pycreds-0.4.0 docopt-0.6.2 einops-0.6.1 encodec-0.1.1 ftfy-6.1.1 g2pkk-0.1.2 gitdb-4.0.10 gruut-2.2.3 gruut-ipa-0.13.0 gruut_lang_de-2.0.0 gruut_lang_en-2.0.0 gruut_lang_es-2.0.0 gruut_lang_fr-2.0.2 huggingface-hub-0.16.4 inflect-5.6.0 jamo-0.4.1 jsonlines-1.2.0 jsonmerge-1.9.2 k-diffusion-0.0.16 kornia-0.7.0 librosa-0.10.0 llvmlite-0.40.1 networkx-2.8.8 num2words-0.5.12 numba-0.57.0 numpy-1.22.0 pathtools-0.1.2 pydub-0.25.1 pynndescent-0.5.10 pypinyin-0.49.0 pysbd-0.3.4 python-crfsuite-0.9.9 resize-right-0.0.2 safetensors-0.3.3 sentry-sdk-1.30.0 setproctitle-1.3.2 smmap-5.0.0 tokenizers-0.13.3 torchdiffeq-0.2.3 torchsde-0.2.5 trainer-0.0.31 trampoline-0.1.2 transformers-4.34.0.dev0 umap-learn-0.5.1 wandb-0.15.10\n" ] }, { "output_type": "display_data", "data": { "application/vnd.colab-display-data+json": { "pip_warning": { "packages": [ "numpy" ] } } }, "metadata": {} } ], "source": [ "!pip install -r requirements.txt" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "t7wrm3ArG-h-", "outputId": "a33ffb21-bbbc-4089-bb89-6cb6eb0be938" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m20.1/20.1 MB\u001b[0m \u001b[31m23.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m66.2/66.2 kB\u001b[0m \u001b[31m8.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m298.2/298.2 kB\u001b[0m \u001b[31m30.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m75.4/75.4 kB\u001b[0m \u001b[31m8.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m138.7/138.7 kB\u001b[0m \u001b[31m15.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.7/45.7 kB\u001b[0m \u001b[31m4.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m59.5/59.5 kB\u001b[0m \u001b[31m7.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.9/129.9 kB\u001b[0m \u001b[31m16.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.3/58.3 kB\u001b[0m \u001b[31m6.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m67.0/67.0 kB\u001b[0m \u001b[31m8.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m74.5/74.5 kB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25h Building wheel for ffmpy (setup.py) ... \u001b[?25l\u001b[?25hdone\n" ] } ], "source": [ "!pip install -q gradio" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "DCmb9A8lFpSc", "outputId": "e8d0d44b-cdf4-48f9-e2c5-1afc7c949e15" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "/usr/local/lib/python3.10/dist-packages/TTS/api.py:77: UserWarning: `gpu` will be deprecated. Please use `tts.to(device)` instead.\n", " warnings.warn(\"`gpu` will be deprecated. Please use `tts.to(device)` instead.\")\n", " > Downloading model to /root/.local/share/tts/tts_models--multilingual--multi-dataset--bark\n", "100% 3.93G/3.93G [01:00<00:00, 54.0MiB/s]\n", "100% 3.93G/3.93G [01:00<00:00, 64.6MiB/s]\n", "\n", " 0% 4.66M/3.74G [00:00<01:20, 46.6MiB/s]\u001b[A\n", " 0% 13.2M/3.74G [00:00<00:53, 69.1MiB/s]\u001b[A\n", " 1% 22.0M/3.74G [00:00<00:47, 78.1MiB/s]\u001b[A\n", " 1% 30.8M/3.74G [00:00<00:45, 82.0MiB/s]\u001b[A\n", " 1% 39.0M/3.74G [00:00<00:53, 69.1MiB/s]\u001b[A\n", " 1% 46.9M/3.74G [00:00<00:51, 71.9MiB/s]\u001b[A\n", " 1% 55.2M/3.74G [00:00<00:48, 75.3MiB/s]\u001b[A\n", " 2% 64.3M/3.74G [00:00<00:45, 80.0MiB/s]\u001b[A\n", " 2% 73.1M/3.74G [00:00<00:44, 82.4MiB/s]\u001b[A\n", " 2% 82.0M/3.74G [00:01<00:43, 84.6MiB/s]\u001b[A\n", " 2% 90.6M/3.74G [00:01<00:43, 84.3MiB/s]\u001b[A\n", " 3% 99.1M/3.74G [00:01<00:45, 80.7MiB/s]\u001b[A\n", " 3% 108M/3.74G [00:01<00:43, 83.0MiB/s] \u001b[A\n", " 3% 117M/3.74G [00:01<00:43, 84.0MiB/s]\u001b[A\n", " 3% 126M/3.74G [00:01<00:42, 85.8MiB/s]\u001b[A\n", " 4% 134M/3.74G [00:01<00:43, 83.7MiB/s]\u001b[A\n", " 4% 144M/3.74G [00:01<00:41, 86.5MiB/s]\u001b[A\n", " 4% 152M/3.74G [00:01<00:41, 87.2MiB/s]\u001b[A\n", " 4% 161M/3.74G [00:01<00:40, 88.3MiB/s]\u001b[A\n", " 5% 171M/3.74G [00:02<00:39, 89.9MiB/s]\u001b[A\n", " 5% 180M/3.74G [00:02<00:39, 90.5MiB/s]\u001b[A\n", " 5% 189M/3.74G [00:02<00:39, 90.6MiB/s]\u001b[A\n", " 5% 199M/3.74G [00:02<00:38, 91.6MiB/s]\u001b[A\n", " 6% 208M/3.74G [00:02<00:37, 93.6MiB/s]\u001b[A\n", " 6% 218M/3.74G [00:02<00:40, 87.6MiB/s]\u001b[A\n", " 6% 227M/3.74G [00:02<00:46, 76.2MiB/s]\u001b[A\n", " 6% 236M/3.74G [00:02<00:43, 80.0MiB/s]\u001b[A\n", " 7% 244M/3.74G [00:02<00:43, 80.5MiB/s]\u001b[A\n", " 7% 252M/3.74G [00:04<03:29, 16.7MiB/s]\u001b[A\n", " 7% 260M/3.74G [00:04<02:45, 21.0MiB/s]\u001b[A\n", " 7% 268M/3.74G [00:04<02:05, 27.6MiB/s]\u001b[A\n", " 7% 276M/3.74G [00:04<01:41, 34.1MiB/s]\u001b[A\n", " 8% 286M/3.74G [00:04<01:20, 42.8MiB/s]\u001b[A\n", " 8% 295M/3.74G [00:04<01:06, 51.7MiB/s]\u001b[A\n", " 8% 304M/3.74G [00:05<00:57, 60.1MiB/s]\u001b[A\n", " 8% 314M/3.74G [00:05<00:51, 67.1MiB/s]\u001b[A\n", " 9% 323M/3.74G [00:05<00:46, 73.5MiB/s]\u001b[A\n", " 9% 332M/3.74G [00:05<00:45, 75.7MiB/s]\u001b[A\n", " 9% 341M/3.74G [00:05<00:42, 80.7MiB/s]\u001b[A\n", " 9% 351M/3.74G [00:05<00:40, 83.7MiB/s]\u001b[A\n", " 10% 360M/3.74G [00:05<00:39, 84.9MiB/s]\u001b[A\n", " 10% 368M/3.74G [00:05<00:45, 74.3MiB/s]\u001b[A\n", " 10% 376M/3.74G [00:05<00:45, 74.4MiB/s]\u001b[A\n", " 10% 386M/3.74G [00:06<00:42, 78.7MiB/s]\u001b[A\n", " 11% 395M/3.74G [00:06<00:40, 81.9MiB/s]\u001b[A\n", " 11% 403M/3.74G [00:06<00:39, 83.7MiB/s]\u001b[A\n", " 11% 412M/3.74G [00:06<00:40, 83.1MiB/s]\u001b[A\n", " 11% 421M/3.74G [00:06<00:39, 84.4MiB/s]\u001b[A\n", " 11% 429M/3.74G [00:06<00:39, 82.9MiB/s]\u001b[A\n", " 12% 438M/3.74G [00:06<00:39, 83.7MiB/s]\u001b[A\n", " 12% 446M/3.74G [00:06<00:39, 83.7MiB/s]\u001b[A\n", " 12% 455M/3.74G [00:06<00:39, 82.5MiB/s]\u001b[A\n", " 12% 463M/3.74G [00:06<00:39, 83.1MiB/s]\u001b[A\n", " 13% 473M/3.74G [00:07<00:37, 86.4MiB/s]\u001b[A\n", " 13% 482M/3.74G [00:07<00:36, 88.2MiB/s]\u001b[A\n", " 13% 491M/3.74G [00:07<00:36, 88.5MiB/s]\u001b[A\n", " 13% 500M/3.74G [00:07<00:36, 89.9MiB/s]\u001b[A\n", " 14% 509M/3.74G [00:07<00:36, 89.4MiB/s]\u001b[A\n", " 14% 519M/3.74G [00:07<00:34, 92.4MiB/s]\u001b[A\n", " 14% 529M/3.74G [00:07<00:34, 94.5MiB/s]\u001b[A\n", " 14% 538M/3.74G [00:07<00:34, 93.8MiB/s]\u001b[A\n", " 15% 548M/3.74G [00:07<00:33, 95.1MiB/s]\u001b[A\n", " 15% 558M/3.74G [00:08<00:42, 74.1MiB/s]\u001b[A\n", " 15% 567M/3.74G [00:08<00:40, 78.8MiB/s]\u001b[A\n", " 15% 576M/3.74G [00:08<00:38, 82.2MiB/s]\u001b[A\n", " 16% 585M/3.74G [00:08<00:38, 82.8MiB/s]\u001b[A\n", " 16% 594M/3.74G [00:08<00:37, 84.6MiB/s]\u001b[A\n", " 16% 603M/3.74G [00:08<00:36, 85.7MiB/s]\u001b[A\n", " 16% 612M/3.74G [00:08<00:36, 86.6MiB/s]\u001b[A\n", " 17% 620M/3.74G [00:08<00:35, 87.5MiB/s]\u001b[A\n", " 17% 630M/3.74G [00:08<00:34, 89.7MiB/s]\u001b[A\n", " 17% 639M/3.74G [00:08<00:35, 87.2MiB/s]\u001b[A\n", " 17% 648M/3.74G [00:09<00:35, 88.3MiB/s]\u001b[A\n", " 18% 657M/3.74G [00:09<00:35, 86.3MiB/s]\u001b[A\n", " 18% 666M/3.74G [00:09<00:36, 84.5MiB/s]\u001b[A\n", " 18% 674M/3.74G [00:09<00:36, 83.2MiB/s]\u001b[A\n", " 18% 683M/3.74G [00:10<02:59, 17.0MiB/s]\u001b[A\n", " 18% 689M/3.74G [00:10<02:31, 20.1MiB/s]\u001b[A\n", " 19% 694M/3.74G [00:11<02:09, 23.5MiB/s]\u001b[A\n", " 19% 700M/3.74G [00:11<01:50, 27.5MiB/s]\u001b[A\n", " 19% 705M/3.74G [00:11<01:35, 31.7MiB/s]\u001b[A\n", " 19% 711M/3.74G [00:11<01:25, 35.5MiB/s]\u001b[A\n", " 19% 716M/3.74G [00:11<01:17, 39.0MiB/s]\u001b[A\n", " 19% 722M/3.74G [00:11<01:10, 42.5MiB/s]\u001b[A\n", " 19% 727M/3.74G [00:11<01:06, 45.1MiB/s]\u001b[A\n", " 20% 733M/3.74G [00:11<01:03, 47.1MiB/s]\u001b[A\n", " 20% 738M/3.74G [00:11<01:00, 49.4MiB/s]\u001b[A\n", " 20% 744M/3.74G [00:11<01:00, 49.3MiB/s]\u001b[A\n", " 20% 749M/3.74G [00:12<01:01, 49.0MiB/s]\u001b[A\n", " 20% 755M/3.74G [00:12<00:58, 51.2MiB/s]\u001b[A\n", " 20% 760M/3.74G [00:12<00:56, 52.4MiB/s]\u001b[A\n", " 20% 766M/3.74G [00:12<00:55, 53.7MiB/s]\u001b[A\n", " 21% 772M/3.74G [00:12<00:53, 55.4MiB/s]\u001b[A\n", " 21% 778M/3.74G [00:12<00:52, 56.0MiB/s]\u001b[A\n", " 21% 783M/3.74G [00:12<00:53, 55.0MiB/s]\u001b[A\n", " 21% 789M/3.74G [00:12<00:53, 55.3MiB/s]\u001b[A\n", " 21% 795M/3.74G [00:12<00:54, 53.6MiB/s]\u001b[A\n", " 21% 800M/3.74G [00:13<01:02, 46.7MiB/s]\u001b[A\n", " 22% 805M/3.74G [00:13<01:03, 46.2MiB/s]\u001b[A\n", " 22% 810M/3.74G [00:13<01:00, 48.6MiB/s]\u001b[A\n", " 22% 816M/3.74G [00:13<00:58, 50.3MiB/s]\u001b[A\n", " 22% 821M/3.74G [00:13<00:56, 51.2MiB/s]\u001b[A\n", " 22% 827M/3.74G [00:13<00:54, 53.3MiB/s]\u001b[A\n", " 22% 833M/3.74G [00:13<00:53, 54.2MiB/s]\u001b[A\n", " 22% 838M/3.74G [00:13<00:54, 53.2MiB/s]\u001b[A\n", " 23% 843M/3.74G [00:13<00:54, 53.4MiB/s]\u001b[A\n", " 23% 849M/3.74G [00:13<00:54, 53.2MiB/s]\u001b[A\n", " 23% 854M/3.74G [00:14<00:55, 51.7MiB/s]\u001b[A\n", " 23% 859M/3.74G [00:14<00:58, 49.6MiB/s]\u001b[A\n", " 23% 865M/3.74G [00:14<00:56, 51.2MiB/s]\u001b[A\n", " 23% 870M/3.74G [00:14<00:55, 51.6MiB/s]\u001b[A\n", " 23% 875M/3.74G [00:14<00:55, 51.6MiB/s]\u001b[A\n", " 24% 880M/3.74G [00:14<00:56, 50.5MiB/s]\u001b[A\n", " 24% 886M/3.74G [00:14<00:55, 51.3MiB/s]\u001b[A\n", " 24% 891M/3.74G [00:14<00:54, 52.1MiB/s]\u001b[A\n", " 24% 896M/3.74G [00:14<00:55, 51.2MiB/s]\u001b[A\n", " 24% 902M/3.74G [00:15<00:55, 51.4MiB/s]\u001b[A\n", " 24% 907M/3.74G [00:15<00:54, 52.3MiB/s]\u001b[A\n", " 24% 912M/3.74G [00:15<00:55, 50.9MiB/s]\u001b[A\n", " 25% 917M/3.74G [00:15<00:55, 51.0MiB/s]\u001b[A\n", " 25% 923M/3.74G [00:15<00:54, 51.3MiB/s]\u001b[A\n", " 25% 928M/3.74G [00:15<00:54, 51.3MiB/s]\u001b[A\n", " 25% 933M/3.74G [00:15<00:53, 52.3MiB/s]\u001b[A\n", " 25% 939M/3.74G [00:15<00:52, 53.1MiB/s]\u001b[A\n", " 25% 945M/3.74G [00:15<00:50, 55.5MiB/s]\u001b[A\n", " 25% 951M/3.74G [00:15<00:49, 56.8MiB/s]\u001b[A\n", " 26% 957M/3.74G [00:16<00:48, 57.1MiB/s]\u001b[A\n", " 26% 962M/3.74G [00:16<00:48, 57.0MiB/s]\u001b[A\n", " 26% 968M/3.74G [00:16<00:48, 57.0MiB/s]\u001b[A\n", " 26% 974M/3.74G [00:16<00:50, 54.8MiB/s]\u001b[A\n", " 26% 979M/3.74G [00:16<00:51, 53.4MiB/s]\u001b[A\n", " 26% 985M/3.74G [00:16<00:51, 53.0MiB/s]\u001b[A\n", " 26% 990M/3.74G [00:16<00:51, 53.0MiB/s]\u001b[A\n", " 27% 995M/3.74G [00:16<00:53, 51.8MiB/s]\u001b[A\n", " 27% 1.00G/3.74G [00:16<00:52, 52.3MiB/s]\u001b[A\n", " 27% 1.01G/3.74G [00:16<00:51, 53.0MiB/s]\u001b[A\n", " 27% 1.01G/3.74G [00:17<00:49, 54.8MiB/s]\u001b[A\n", " 27% 1.02G/3.74G [00:17<00:56, 48.3MiB/s]\u001b[A\n", " 27% 1.02G/3.74G [00:17<00:56, 48.0MiB/s]\u001b[A\n", " 27% 1.03G/3.74G [00:17<00:54, 49.5MiB/s]\u001b[A\n", " 28% 1.03G/3.74G [00:17<00:53, 50.7MiB/s]\u001b[A\n", " 28% 1.04G/3.74G [00:17<00:52, 51.4MiB/s]\u001b[A\n", " 28% 1.04G/3.74G [00:17<00:52, 51.8MiB/s]\u001b[A\n", " 28% 1.05G/3.74G [00:17<00:50, 53.4MiB/s]\u001b[A\n", " 28% 1.06G/3.74G [00:17<00:51, 52.3MiB/s]\u001b[A\n", " 28% 1.06G/3.74G [00:18<00:50, 53.0MiB/s]\u001b[A\n", " 28% 1.07G/3.74G [00:18<00:49, 53.9MiB/s]\u001b[A\n", " 29% 1.07G/3.74G [00:18<00:49, 53.8MiB/s]\u001b[A\n", " 29% 1.08G/3.74G [00:18<00:49, 53.8MiB/s]\u001b[A\n", " 29% 1.08G/3.74G [00:18<00:48, 54.7MiB/s]\u001b[A\n", " 29% 1.09G/3.74G [00:18<00:48, 54.4MiB/s]\u001b[A\n", " 29% 1.09G/3.74G [00:18<00:48, 54.5MiB/s]\u001b[A\n", " 29% 1.10G/3.74G [00:18<00:48, 54.8MiB/s]\u001b[A\n", " 30% 1.10G/3.74G [00:18<01:07, 39.3MiB/s]\u001b[A\n", " 30% 1.11G/3.74G [00:19<01:01, 42.5MiB/s]\u001b[A\n", " 30% 1.12G/3.74G [00:19<00:54, 48.1MiB/s]\u001b[A\n", " 30% 1.13G/3.74G [00:19<00:43, 59.8MiB/s]\u001b[A\n", " 30% 1.13G/3.74G [00:19<00:38, 67.0MiB/s]\u001b[A\n", " 31% 1.14G/3.74G [00:19<00:36, 71.6MiB/s]\u001b[A\n", " 31% 1.15G/3.74G [00:19<00:34, 75.2MiB/s]\u001b[A\n", " 31% 1.16G/3.74G [00:19<00:32, 78.3MiB/s]\u001b[A\n", " 31% 1.17G/3.74G [00:19<00:31, 80.7MiB/s]\u001b[A\n", " 31% 1.18G/3.74G [00:19<00:30, 84.9MiB/s]\u001b[A\n", " 32% 1.19G/3.74G [00:19<00:29, 87.7MiB/s]\u001b[A\n", " 32% 1.20G/3.74G [00:20<00:30, 84.6MiB/s]\u001b[A\n", " 32% 1.20G/3.74G [00:20<00:33, 75.0MiB/s]\u001b[A\n", " 32% 1.21G/3.74G [00:20<00:32, 78.1MiB/s]\u001b[A\n", " 33% 1.22G/3.74G [00:20<00:33, 76.2MiB/s]\u001b[A\n", " 33% 1.23G/3.74G [00:20<00:31, 79.3MiB/s]\u001b[A\n", " 33% 1.24G/3.74G [00:20<00:30, 81.8MiB/s]\u001b[A\n", " 33% 1.25G/3.74G [00:20<00:30, 81.8MiB/s]\u001b[A\n", " 34% 1.26G/3.74G [00:20<00:30, 81.0MiB/s]\u001b[A\n", " 34% 1.26G/3.74G [00:20<00:30, 81.5MiB/s]\u001b[A\n", " 34% 1.27G/3.74G [00:21<00:30, 81.7MiB/s]\u001b[A\n", " 34% 1.28G/3.74G [00:21<00:29, 83.7MiB/s]\u001b[A\n", " 34% 1.29G/3.74G [00:21<00:29, 84.4MiB/s]\u001b[A\n", " 35% 1.30G/3.74G [00:21<00:29, 83.7MiB/s]\u001b[A\n", " 35% 1.31G/3.74G [00:21<00:29, 82.4MiB/s]\u001b[A\n", " 35% 1.32G/3.74G [00:21<00:28, 85.4MiB/s]\u001b[A\n", " 35% 1.32G/3.74G [00:21<00:28, 85.2MiB/s]\u001b[A\n", " 36% 1.33G/3.74G [00:21<00:27, 86.5MiB/s]\u001b[A\n", " 36% 1.34G/3.74G [00:21<00:27, 87.2MiB/s]\u001b[A\n", " 36% 1.35G/3.74G [00:21<00:27, 88.2MiB/s]\u001b[A\n", " 36% 1.36G/3.74G [00:22<00:26, 91.2MiB/s]\u001b[A\n", " 37% 1.37G/3.74G [00:22<00:25, 91.5MiB/s]\u001b[A\n", " 37% 1.38G/3.74G [00:22<00:26, 89.3MiB/s]\u001b[A\n", " 37% 1.39G/3.74G [00:22<00:31, 74.7MiB/s]\u001b[A\n", " 37% 1.40G/3.74G [00:22<00:32, 72.5MiB/s]\u001b[A\n", " 38% 1.40G/3.74G [00:22<00:30, 77.4MiB/s]\u001b[A\n", " 38% 1.41G/3.74G [00:22<00:29, 78.5MiB/s]\u001b[A\n", " 38% 1.42G/3.74G [00:22<00:28, 80.3MiB/s]\u001b[A\n", " 38% 1.43G/3.74G [00:22<00:28, 82.1MiB/s]\u001b[A\n", " 38% 1.44G/3.74G [00:23<00:27, 82.8MiB/s]\u001b[A\n", " 39% 1.45G/3.74G [00:23<00:26, 85.2MiB/s]\u001b[A\n", " 39% 1.46G/3.74G [00:23<00:26, 86.3MiB/s]\u001b[A\n", " 39% 1.47G/3.74G [00:23<00:26, 85.9MiB/s]\u001b[A\n", " 39% 1.47G/3.74G [00:23<00:26, 87.1MiB/s]\u001b[A\n", " 40% 1.48G/3.74G [00:23<00:26, 85.2MiB/s]\u001b[A\n", " 40% 1.49G/3.74G [00:24<01:04, 35.0MiB/s]\u001b[A\n", " 40% 1.50G/3.74G [00:24<00:52, 42.3MiB/s]\u001b[A\n", " 40% 1.51G/3.74G [00:24<00:45, 49.2MiB/s]\u001b[A\n", " 41% 1.52G/3.74G [00:24<00:40, 55.4MiB/s]\u001b[A\n", " 41% 1.52G/3.74G [00:24<00:36, 60.3MiB/s]\u001b[A\n", " 41% 1.53G/3.74G [00:24<00:33, 66.3MiB/s]\u001b[A\n", " 41% 1.54G/3.74G [00:24<00:31, 70.5MiB/s]\u001b[A\n", " 41% 1.55G/3.74G [00:24<00:29, 75.2MiB/s]\u001b[A\n", " 42% 1.56G/3.74G [00:24<00:27, 78.1MiB/s]\u001b[A\n", " 42% 1.57G/3.74G [00:25<00:27, 80.2MiB/s]\u001b[A\n", " 42% 1.58G/3.74G [00:25<00:26, 82.8MiB/s]\u001b[A\n", " 42% 1.58G/3.74G [00:25<00:25, 84.7MiB/s]\u001b[A\n", " 43% 1.59G/3.74G [00:25<00:24, 86.5MiB/s]\u001b[A\n", " 43% 1.60G/3.74G [00:25<00:24, 88.9MiB/s]\u001b[A\n", " 43% 1.61G/3.74G [00:25<00:24, 87.9MiB/s]\u001b[A\n", " 43% 1.62G/3.74G [00:25<00:23, 89.0MiB/s]\u001b[A\n", " 44% 1.63G/3.74G [00:25<00:23, 88.3MiB/s]\u001b[A\n", " 44% 1.64G/3.74G [00:25<00:24, 84.6MiB/s]\u001b[A\n", " 44% 1.65G/3.74G [00:25<00:27, 76.7MiB/s]\u001b[A\n", " 44% 1.66G/3.74G [00:26<00:25, 80.4MiB/s]\u001b[A\n", " 45% 1.67G/3.74G [00:26<00:25, 83.0MiB/s]\u001b[A\n", " 45% 1.67G/3.74G [00:26<00:25, 82.0MiB/s]\u001b[A\n", " 45% 1.68G/3.74G [00:26<00:24, 84.0MiB/s]\u001b[A\n", " 45% 1.69G/3.74G [00:26<00:23, 86.6MiB/s]\u001b[A\n", " 45% 1.70G/3.74G [00:26<00:24, 83.5MiB/s]\u001b[A\n", " 46% 1.71G/3.74G [00:26<00:24, 83.5MiB/s]\u001b[A\n", " 46% 1.72G/3.74G [00:26<00:23, 84.6MiB/s]\u001b[A\n", " 46% 1.73G/3.74G [00:26<00:23, 84.0MiB/s]\u001b[A\n", " 46% 1.74G/3.74G [00:27<00:23, 87.0MiB/s]\u001b[A\n", " 47% 1.75G/3.74G [00:27<00:22, 89.8MiB/s]\u001b[A\n", " 47% 1.76G/3.74G [00:27<00:21, 90.9MiB/s]\u001b[A\n", " 47% 1.76G/3.74G [00:27<00:21, 92.0MiB/s]\u001b[A\n", " 47% 1.77G/3.74G [00:27<00:21, 92.6MiB/s]\u001b[A\n", " 48% 1.78G/3.74G [00:27<00:21, 92.4MiB/s]\u001b[A\n", " 48% 1.79G/3.74G [00:27<00:21, 91.2MiB/s]\u001b[A\n", " 48% 1.80G/3.74G [00:27<00:21, 91.4MiB/s]\u001b[A\n", " 48% 1.81G/3.74G [00:27<00:20, 92.0MiB/s]\u001b[A\n", " 49% 1.82G/3.74G [00:27<00:21, 88.1MiB/s]\u001b[A\n", " 49% 1.83G/3.74G [00:28<00:24, 77.5MiB/s]\u001b[A\n", " 49% 1.84G/3.74G [00:28<00:24, 79.0MiB/s]\u001b[A\n", " 49% 1.85G/3.74G [00:28<00:22, 83.1MiB/s]\u001b[A\n", " 50% 1.86G/3.74G [00:28<00:22, 84.0MiB/s]\u001b[A\n", " 50% 1.86G/3.74G [00:28<00:21, 86.2MiB/s]\u001b[A\n", " 50% 1.87G/3.74G [00:28<00:21, 86.2MiB/s]\u001b[A\n", " 50% 1.88G/3.74G [00:28<00:22, 82.5MiB/s]\u001b[A\n", " 51% 1.89G/3.74G [00:28<00:21, 85.7MiB/s]\u001b[A\n", " 51% 1.90G/3.74G [00:28<00:21, 86.0MiB/s]\u001b[A\n", " 51% 1.91G/3.74G [00:28<00:21, 85.1MiB/s]\u001b[A\n", " 51% 1.92G/3.74G [00:29<00:21, 86.3MiB/s]\u001b[A\n", " 51% 1.93G/3.74G [00:29<00:24, 74.1MiB/s]\u001b[A\n", " 52% 1.93G/3.74G [00:29<00:27, 64.8MiB/s]\u001b[A\n", " 52% 1.94G/3.74G [00:29<00:30, 60.0MiB/s]\u001b[A\n", " 52% 1.95G/3.74G [00:29<00:31, 56.7MiB/s]\u001b[A\n", " 52% 1.95G/3.74G [00:29<00:32, 54.9MiB/s]\u001b[A\n", " 52% 1.96G/3.74G [00:29<00:32, 54.4MiB/s]\u001b[A\n", " 52% 1.96G/3.74G [00:30<00:32, 54.8MiB/s]\u001b[A\n", " 53% 1.97G/3.74G [00:30<00:31, 55.8MiB/s]\u001b[A\n", " 53% 1.98G/3.74G [00:30<00:31, 55.6MiB/s]\u001b[A\n", " 53% 1.98G/3.74G [00:30<00:32, 55.0MiB/s]\u001b[A\n", " 53% 1.99G/3.74G [00:30<00:33, 52.8MiB/s]\u001b[A\n", " 53% 1.99G/3.74G [00:30<00:33, 52.6MiB/s]\u001b[A\n", " 53% 2.00G/3.74G [00:30<00:32, 53.4MiB/s]\u001b[A\n", " 54% 2.00G/3.74G [00:30<00:32, 53.3MiB/s]\u001b[A\n", " 54% 2.01G/3.74G [00:30<00:32, 53.2MiB/s]\u001b[A\n", " 54% 2.01G/3.74G [00:30<00:32, 53.4MiB/s]\u001b[A\n", " 54% 2.02G/3.74G [00:31<00:31, 54.7MiB/s]\u001b[A\n", " 54% 2.03G/3.74G [00:31<00:31, 54.0MiB/s]\u001b[A\n", " 54% 2.03G/3.74G [00:31<00:31, 54.4MiB/s]\u001b[A\n", " 54% 2.04G/3.74G [00:31<00:30, 55.3MiB/s]\u001b[A\n", " 55% 2.04G/3.74G [00:31<00:31, 54.4MiB/s]\u001b[A\n", " 55% 2.05G/3.74G [00:31<00:31, 54.0MiB/s]\u001b[A\n", " 55% 2.05G/3.74G [00:31<00:42, 39.8MiB/s]\u001b[A\n", " 55% 2.06G/3.74G [00:31<00:39, 42.5MiB/s]\u001b[A\n", " 55% 2.06G/3.74G [00:31<00:37, 44.4MiB/s]\u001b[A\n", " 55% 2.07G/3.74G [00:32<00:36, 46.4MiB/s]\u001b[A\n", " 55% 2.07G/3.74G [00:32<00:33, 49.4MiB/s]\u001b[A\n", " 56% 2.08G/3.74G [00:32<00:32, 51.0MiB/s]\u001b[A\n", " 56% 2.08G/3.74G [00:32<00:33, 50.1MiB/s]\u001b[A\n", " 56% 2.09G/3.74G [00:32<00:33, 49.2MiB/s]\u001b[A\n", " 56% 2.09G/3.74G [00:32<00:33, 49.7MiB/s]\u001b[A\n", " 56% 2.10G/3.74G [00:32<00:33, 49.3MiB/s]\u001b[A\n", " 56% 2.11G/3.74G [00:32<00:32, 50.1MiB/s]\u001b[A\n", " 56% 2.11G/3.74G [00:32<00:31, 51.8MiB/s]\u001b[A\n", " 57% 2.12G/3.74G [00:33<00:32, 50.0MiB/s]\u001b[A\n", " 57% 2.12G/3.74G [00:33<00:32, 49.6MiB/s]\u001b[A\n", " 57% 2.13G/3.74G [00:33<00:34, 46.9MiB/s]\u001b[A\n", " 57% 2.13G/3.74G [00:33<00:34, 47.0MiB/s]\u001b[A\n", " 57% 2.14G/3.74G [00:33<00:32, 49.0MiB/s]\u001b[A\n", " 57% 2.14G/3.74G [00:33<00:31, 51.3MiB/s]\u001b[A\n", " 57% 2.15G/3.74G [00:33<00:30, 52.6MiB/s]\u001b[A\n", " 58% 2.15G/3.74G [00:33<00:29, 53.5MiB/s]\u001b[A\n", " 58% 2.16G/3.74G [00:33<00:29, 53.8MiB/s]\u001b[A\n", " 58% 2.16G/3.74G [00:33<00:29, 53.9MiB/s]\u001b[A\n", " 58% 2.17G/3.74G [00:34<00:28, 54.6MiB/s]\u001b[A\n", " 58% 2.17G/3.74G [00:34<00:28, 55.1MiB/s]\u001b[A\n", " 58% 2.18G/3.74G [00:34<00:28, 54.9MiB/s]\u001b[A\n", " 58% 2.19G/3.74G [00:34<00:28, 55.2MiB/s]\u001b[A\n", " 59% 2.19G/3.74G [00:34<00:28, 55.1MiB/s]\u001b[A\n", " 59% 2.20G/3.74G [00:34<00:27, 56.1MiB/s]\u001b[A\n", " 59% 2.20G/3.74G [00:34<00:38, 40.4MiB/s]\u001b[A\n", " 59% 2.21G/3.74G [00:34<00:35, 43.4MiB/s]\u001b[A\n", " 59% 2.21G/3.74G [00:34<00:32, 47.1MiB/s]\u001b[A\n", " 59% 2.22G/3.74G [00:35<00:30, 49.6MiB/s]\u001b[A\n", " 59% 2.23G/3.74G [00:35<00:29, 51.4MiB/s]\u001b[A\n", " 60% 2.23G/3.74G [00:35<00:32, 46.0MiB/s]\u001b[A\n", " 60% 2.24G/3.74G [00:35<00:36, 41.0MiB/s]\u001b[A\n", " 60% 2.24G/3.74G [00:35<00:34, 43.7MiB/s]\u001b[A\n", " 60% 2.25G/3.74G [00:35<00:32, 45.9MiB/s]\u001b[A\n", " 60% 2.25G/3.74G [00:35<00:31, 47.6MiB/s]\u001b[A\n", " 60% 2.26G/3.74G [00:35<00:30, 48.1MiB/s]\u001b[A\n", " 60% 2.26G/3.74G [00:35<00:30, 48.8MiB/s]\u001b[A\n", " 61% 2.27G/3.74G [00:36<00:29, 49.5MiB/s]\u001b[A\n", " 61% 2.27G/3.74G [00:36<00:29, 50.3MiB/s]\u001b[A\n", " 61% 2.28G/3.74G [00:36<00:28, 50.6MiB/s]\u001b[A\n", " 61% 2.28G/3.74G [00:36<00:29, 49.8MiB/s]\u001b[A\n", " 61% 2.29G/3.74G [00:36<00:28, 50.8MiB/s]\u001b[A\n", " 61% 2.29G/3.74G [00:36<00:29, 48.9MiB/s]\u001b[A\n", " 61% 2.30G/3.74G [00:36<00:29, 48.8MiB/s]\u001b[A\n", " 62% 2.30G/3.74G [00:36<00:29, 48.7MiB/s]\u001b[A\n", " 62% 2.31G/3.74G [00:36<00:29, 48.9MiB/s]\u001b[A\n", " 62% 2.31G/3.74G [00:36<00:29, 48.9MiB/s]\u001b[A\n", " 62% 2.32G/3.74G [00:37<00:28, 49.9MiB/s]\u001b[A\n", " 62% 2.32G/3.74G [00:37<00:27, 51.6MiB/s]\u001b[A\n", " 62% 2.33G/3.74G [00:37<00:26, 52.7MiB/s]\u001b[A\n", " 62% 2.33G/3.74G [00:37<00:26, 53.1MiB/s]\u001b[A\n", " 63% 2.34G/3.74G [00:37<00:26, 52.8MiB/s]\u001b[A\n", " 63% 2.34G/3.74G [00:37<00:26, 53.3MiB/s]\u001b[A\n", " 63% 2.35G/3.74G [00:37<00:25, 53.7MiB/s]\u001b[A\n", " 63% 2.36G/3.74G [00:37<00:25, 54.2MiB/s]\u001b[A\n", " 63% 2.36G/3.74G [00:37<00:25, 54.3MiB/s]\u001b[A\n", " 63% 2.37G/3.74G [00:37<00:25, 53.6MiB/s]\u001b[A\n", " 63% 2.37G/3.74G [00:38<00:25, 53.4MiB/s]\u001b[A\n", " 64% 2.38G/3.74G [00:38<00:25, 53.9MiB/s]\u001b[A\n", " 64% 2.38G/3.74G [00:38<00:23, 57.4MiB/s]\u001b[A\n", " 64% 2.39G/3.74G [00:38<00:19, 69.0MiB/s]\u001b[A\n", " 64% 2.40G/3.74G [00:38<00:17, 76.3MiB/s]\u001b[A\n", " 64% 2.41G/3.74G [00:38<00:17, 76.2MiB/s]\u001b[A\n", " 65% 2.42G/3.74G [00:38<00:18, 70.7MiB/s]\u001b[A\n", " 65% 2.43G/3.74G [00:38<00:17, 76.7MiB/s]\u001b[A\n", " 65% 2.44G/3.74G [00:38<00:16, 79.5MiB/s]\u001b[A\n", " 65% 2.44G/3.74G [00:39<00:16, 79.3MiB/s]\u001b[A\n", " 66% 2.45G/3.74G [00:39<00:16, 80.5MiB/s]\u001b[A\n", " 66% 2.46G/3.74G [00:39<00:15, 82.2MiB/s]\u001b[A\n", " 66% 2.47G/3.74G [00:39<00:15, 83.2MiB/s]\u001b[A\n", " 66% 2.48G/3.74G [00:39<00:14, 85.6MiB/s]\u001b[A\n", " 66% 2.49G/3.74G [00:39<00:14, 84.0MiB/s]\u001b[A\n", " 67% 2.50G/3.74G [00:39<00:14, 84.7MiB/s]\u001b[A\n", " 67% 2.51G/3.74G [00:39<00:14, 86.8MiB/s]\u001b[A\n", " 67% 2.51G/3.74G [00:39<00:13, 88.7MiB/s]\u001b[A\n", " 67% 2.52G/3.74G [00:39<00:13, 89.5MiB/s]\u001b[A\n", " 68% 2.53G/3.74G [00:40<00:13, 89.4MiB/s]\u001b[A\n", " 68% 2.54G/3.74G [00:40<00:13, 90.5MiB/s]\u001b[A\n", " 68% 2.55G/3.74G [00:40<00:13, 90.5MiB/s]\u001b[A\n", " 68% 2.56G/3.74G [00:40<00:12, 92.2MiB/s]\u001b[A\n", " 69% 2.57G/3.74G [00:40<00:12, 92.8MiB/s]\u001b[A\n", " 69% 2.58G/3.74G [00:40<00:14, 77.5MiB/s]\u001b[A\n", " 69% 2.59G/3.74G [00:40<00:14, 80.2MiB/s]\u001b[A\n", " 69% 2.60G/3.74G [00:40<00:14, 81.7MiB/s]\u001b[A\n", " 70% 2.61G/3.74G [00:40<00:13, 84.3MiB/s]\u001b[A\n", " 70% 2.61G/3.74G [00:41<00:13, 81.6MiB/s]\u001b[A\n", " 70% 2.62G/3.74G [00:41<00:13, 83.4MiB/s]\u001b[A\n", " 70% 2.63G/3.74G [00:41<00:13, 84.5MiB/s]\u001b[A\n", " 71% 2.64G/3.74G [00:41<00:12, 85.3MiB/s]\u001b[A\n", " 71% 2.65G/3.74G [00:41<00:13, 83.6MiB/s]\u001b[A\n", " 71% 2.66G/3.74G [00:41<00:12, 84.7MiB/s]\u001b[A\n", " 71% 2.67G/3.74G [00:41<00:12, 86.2MiB/s]\u001b[A\n", " 72% 2.68G/3.74G [00:41<00:12, 86.6MiB/s]\u001b[A\n", " 72% 2.68G/3.74G [00:41<00:12, 87.4MiB/s]\u001b[A\n", " 72% 2.69G/3.74G [00:41<00:11, 90.5MiB/s]\u001b[A\n", " 72% 2.70G/3.74G [00:42<00:11, 87.8MiB/s]\u001b[A\n", " 73% 2.71G/3.74G [00:42<00:11, 90.5MiB/s]\u001b[A\n", " 73% 2.72G/3.74G [00:42<00:10, 93.2MiB/s]\u001b[A\n", " 73% 2.73G/3.74G [00:42<00:10, 93.7MiB/s]\u001b[A\n", " 73% 2.74G/3.74G [00:42<00:10, 95.0MiB/s]\u001b[A\n", " 74% 2.75G/3.74G [00:42<00:10, 95.1MiB/s]\u001b[A\n", " 74% 2.76G/3.74G [00:42<00:11, 87.6MiB/s]\u001b[A\n", " 74% 2.77G/3.74G [00:42<00:12, 79.9MiB/s]\u001b[A\n", " 74% 2.78G/3.74G [00:42<00:11, 83.0MiB/s]\u001b[A\n", " 75% 2.79G/3.74G [00:42<00:11, 85.4MiB/s]\u001b[A\n", " 75% 2.80G/3.74G [00:43<00:11, 84.4MiB/s]\u001b[A\n", " 75% 2.81G/3.74G [00:43<00:10, 85.5MiB/s]\u001b[A\n", " 75% 2.82G/3.74G [00:43<00:10, 87.4MiB/s]\u001b[A\n", " 75% 2.82G/3.74G [00:43<00:10, 87.3MiB/s]\u001b[A\n", " 76% 2.83G/3.74G [00:43<00:10, 89.0MiB/s]\u001b[A\n", " 76% 2.84G/3.74G [00:43<00:09, 90.1MiB/s]\u001b[A\n", " 76% 2.85G/3.74G [00:43<00:10, 85.9MiB/s]\u001b[A\n", " 76% 2.86G/3.74G [00:43<00:09, 88.4MiB/s]\u001b[A\n", " 77% 2.87G/3.74G [00:44<00:15, 55.1MiB/s]\u001b[A\n", " 77% 2.88G/3.74G [00:44<00:14, 61.4MiB/s]\u001b[A\n", " 77% 2.89G/3.74G [00:44<00:12, 66.8MiB/s]\u001b[A\n", " 77% 2.89G/3.74G [00:44<00:12, 69.4MiB/s]\u001b[A\n", " 78% 2.90G/3.74G [00:44<00:11, 73.5MiB/s]\u001b[A\n", " 78% 2.91G/3.74G [00:44<00:10, 78.4MiB/s]\u001b[A\n", " 78% 2.92G/3.74G [00:44<00:10, 81.8MiB/s]\u001b[A\n", " 78% 2.93G/3.74G [00:44<00:09, 85.0MiB/s]\u001b[A\n", " 79% 2.94G/3.74G [00:44<00:09, 84.7MiB/s]\u001b[A\n", " 79% 2.95G/3.74G [00:45<00:09, 85.4MiB/s]\u001b[A\n", " 79% 2.96G/3.74G [00:45<00:09, 85.8MiB/s]\u001b[A\n", " 79% 2.97G/3.74G [00:45<00:08, 89.1MiB/s]\u001b[A\n", " 80% 2.98G/3.74G [00:45<00:08, 91.3MiB/s]\u001b[A\n", " 80% 2.99G/3.74G [00:45<00:08, 93.5MiB/s]\u001b[A\n", " 80% 3.00G/3.74G [00:45<00:07, 95.2MiB/s]\u001b[A\n", " 80% 3.01G/3.74G [00:45<00:07, 95.4MiB/s]\u001b[A\n", " 81% 3.02G/3.74G [00:45<00:07, 96.3MiB/s]\u001b[A\n", " 81% 3.03G/3.74G [00:45<00:08, 80.6MiB/s]\u001b[A\n", " 81% 3.03G/3.74G [00:45<00:08, 81.3MiB/s]\u001b[A\n", " 81% 3.04G/3.74G [00:46<00:08, 78.6MiB/s]\u001b[A\n", " 82% 3.05G/3.74G [00:46<00:08, 81.3MiB/s]\u001b[A\n", " 82% 3.06G/3.74G [00:46<00:08, 83.4MiB/s]\u001b[A\n", " 82% 3.07G/3.74G [00:46<00:07, 86.8MiB/s]\u001b[A\n", " 82% 3.08G/3.74G [00:46<00:07, 87.8MiB/s]\u001b[A\n", " 83% 3.09G/3.74G [00:46<00:07, 91.1MiB/s]\u001b[A\n", " 83% 3.10G/3.74G [00:46<00:07, 91.7MiB/s]\u001b[A\n", " 83% 3.11G/3.74G [00:46<00:06, 93.3MiB/s]\u001b[A\n", " 83% 3.12G/3.74G [00:46<00:06, 94.1MiB/s]\u001b[A\n", " 84% 3.13G/3.74G [00:47<00:06, 92.8MiB/s]\u001b[A\n", " 84% 3.14G/3.74G [00:47<00:06, 90.1MiB/s]\u001b[A\n", " 84% 3.15G/3.74G [00:47<00:06, 91.5MiB/s]\u001b[A\n", " 84% 3.15G/3.74G [00:47<00:06, 89.7MiB/s]\u001b[A\n", " 85% 3.16G/3.74G [00:47<00:07, 74.7MiB/s]\u001b[A\n", " 85% 3.17G/3.74G [00:47<00:07, 79.2MiB/s]\u001b[A\n", " 85% 3.18G/3.74G [00:47<00:06, 81.8MiB/s]\u001b[A\n", " 85% 3.19G/3.74G [00:47<00:06, 83.9MiB/s]\u001b[A\n", " 86% 3.20G/3.74G [00:47<00:06, 88.4MiB/s]\u001b[A\n", " 86% 3.21G/3.74G [00:48<00:05, 90.2MiB/s]\u001b[A\n", " 86% 3.22G/3.74G [00:48<00:05, 91.4MiB/s]\u001b[A\n", " 86% 3.23G/3.74G [00:48<00:05, 91.0MiB/s]\u001b[A\n", " 87% 3.24G/3.74G [00:48<00:05, 84.5MiB/s]\u001b[A\n", " 87% 3.25G/3.74G [00:48<00:06, 72.9MiB/s]\u001b[A\n", " 87% 3.25G/3.74G [00:48<00:07, 66.3MiB/s]\u001b[A\n", " 87% 3.26G/3.74G [00:48<00:07, 61.9MiB/s]\u001b[A\n", " 87% 3.27G/3.74G [00:48<00:07, 59.5MiB/s]\u001b[A\n", " 87% 3.27G/3.74G [00:48<00:07, 58.5MiB/s]\u001b[A\n", " 88% 3.28G/3.74G [00:49<00:08, 55.0MiB/s]\u001b[A\n", " 88% 3.29G/3.74G [00:49<00:09, 49.3MiB/s]\u001b[A\n", " 88% 3.29G/3.74G [00:49<00:09, 49.7MiB/s]\u001b[A\n", " 88% 3.30G/3.74G [00:49<00:08, 50.0MiB/s]\u001b[A\n", " 88% 3.30G/3.74G [00:49<00:08, 51.0MiB/s]\u001b[A\n", " 88% 3.31G/3.74G [00:49<00:08, 51.9MiB/s]\u001b[A\n", " 89% 3.31G/3.74G [00:49<00:08, 53.5MiB/s]\u001b[A\n", " 89% 3.32G/3.74G [00:49<00:07, 53.7MiB/s]\u001b[A\n", " 89% 3.32G/3.74G [00:49<00:07, 53.8MiB/s]\u001b[A\n", " 89% 3.33G/3.74G [00:50<00:07, 53.8MiB/s]\u001b[A\n", " 89% 3.33G/3.74G [00:50<00:07, 53.6MiB/s]\u001b[A\n", " 89% 3.34G/3.74G [00:50<00:07, 53.8MiB/s]\u001b[A\n", " 89% 3.34G/3.74G [00:50<00:07, 54.4MiB/s]\u001b[A\n", " 90% 3.35G/3.74G [00:50<00:07, 54.1MiB/s]\u001b[A\n", " 90% 3.36G/3.74G [00:50<00:07, 54.4MiB/s]\u001b[A\n", " 90% 3.36G/3.74G [00:50<00:07, 54.4MiB/s]\u001b[A\n", " 90% 3.37G/3.74G [00:50<00:06, 54.6MiB/s]\u001b[A\n", " 90% 3.37G/3.74G [00:50<00:06, 55.1MiB/s]\u001b[A\n", " 90% 3.38G/3.74G [00:50<00:06, 53.7MiB/s]\u001b[A\n", " 90% 3.38G/3.74G [00:51<00:07, 46.9MiB/s]\u001b[A\n", " 91% 3.39G/3.74G [00:51<00:07, 48.9MiB/s]\u001b[A\n", " 91% 3.39G/3.74G [00:51<00:07, 48.7MiB/s]\u001b[A\n", " 91% 3.40G/3.74G [00:51<00:06, 49.5MiB/s]\u001b[A\n", " 91% 3.40G/3.74G [00:51<00:06, 49.9MiB/s]\u001b[A\n", " 91% 3.41G/3.74G [00:51<00:06, 50.4MiB/s]\u001b[A\n", " 91% 3.41G/3.74G [00:51<00:06, 51.1MiB/s]\u001b[A\n", " 91% 3.42G/3.74G [00:51<00:06, 50.9MiB/s]\u001b[A\n", " 92% 3.42G/3.74G [00:51<00:06, 50.3MiB/s]\u001b[A\n", " 92% 3.43G/3.74G [00:52<00:06, 50.8MiB/s]\u001b[A\n", " 92% 3.43G/3.74G [00:52<00:06, 49.3MiB/s]\u001b[A\n", " 92% 3.44G/3.74G [00:52<00:06, 49.5MiB/s]\u001b[A\n", " 92% 3.44G/3.74G [00:52<00:06, 48.2MiB/s]\u001b[A\n", " 92% 3.45G/3.74G [00:52<00:06, 47.9MiB/s]\u001b[A\n", " 92% 3.45G/3.74G [00:52<00:05, 47.9MiB/s]\u001b[A\n", " 92% 3.46G/3.74G [00:52<00:05, 47.4MiB/s]\u001b[A\n", " 93% 3.46G/3.74G [00:52<00:05, 48.1MiB/s]\u001b[A\n", " 93% 3.47G/3.74G [00:52<00:05, 48.3MiB/s]\u001b[A\n", " 93% 3.47G/3.74G [00:52<00:05, 50.3MiB/s]\u001b[A\n", " 93% 3.48G/3.74G [00:53<00:05, 52.0MiB/s]\u001b[A\n", " 93% 3.49G/3.74G [00:53<00:04, 53.1MiB/s]\u001b[A\n", " 93% 3.49G/3.74G [00:53<00:04, 54.2MiB/s]\u001b[A\n", " 93% 3.50G/3.74G [00:53<00:04, 54.9MiB/s]\u001b[A\n", " 94% 3.50G/3.74G [00:53<00:04, 54.8MiB/s]\u001b[A\n", " 94% 3.51G/3.74G [00:53<00:04, 54.1MiB/s]\u001b[A\n", " 94% 3.51G/3.74G [00:53<00:04, 54.6MiB/s]\u001b[A\n", " 94% 3.52G/3.74G [00:53<00:04, 55.1MiB/s]\u001b[A\n", " 94% 3.52G/3.74G [00:53<00:03, 54.7MiB/s]\u001b[A\n", " 94% 3.53G/3.74G [00:53<00:03, 53.6MiB/s]\u001b[A\n", " 94% 3.54G/3.74G [00:54<00:03, 53.9MiB/s]\u001b[A\n", " 95% 3.54G/3.74G [00:54<00:03, 53.0MiB/s]\u001b[A\n", " 95% 3.55G/3.74G [00:54<00:03, 53.3MiB/s]\u001b[A\n", " 95% 3.55G/3.74G [00:54<00:03, 53.3MiB/s]\u001b[A\n", " 95% 3.56G/3.74G [00:54<00:03, 49.2MiB/s]\u001b[A\n", " 95% 3.56G/3.74G [00:54<00:04, 38.0MiB/s]\u001b[A\n", " 95% 3.57G/3.74G [00:54<00:04, 40.5MiB/s]\u001b[A\n", " 95% 3.57G/3.74G [00:54<00:03, 42.9MiB/s]\u001b[A\n", " 96% 3.58G/3.74G [00:55<00:03, 44.7MiB/s]\u001b[A\n", " 96% 3.58G/3.74G [00:55<00:03, 46.8MiB/s]\u001b[A\n", " 96% 3.59G/3.74G [00:55<00:03, 48.8MiB/s]\u001b[A\n", " 96% 3.59G/3.74G [00:55<00:03, 49.5MiB/s]\u001b[A\n", " 96% 3.60G/3.74G [00:55<00:02, 50.1MiB/s]\u001b[A\n", " 96% 3.60G/3.74G [00:55<00:02, 49.5MiB/s]\u001b[A\n", " 96% 3.61G/3.74G [00:55<00:02, 48.8MiB/s]\u001b[A\n", " 97% 3.61G/3.74G [00:55<00:02, 50.5MiB/s]\u001b[A\n", " 97% 3.62G/3.74G [00:55<00:02, 49.2MiB/s]\u001b[A\n", " 97% 3.62G/3.74G [00:55<00:02, 48.9MiB/s]\u001b[A\n", " 97% 3.63G/3.74G [00:56<00:02, 49.8MiB/s]\u001b[A\n", " 97% 3.63G/3.74G [00:56<00:02, 50.3MiB/s]\u001b[A\n", " 97% 3.64G/3.74G [00:56<00:02, 50.2MiB/s]\u001b[A\n", " 97% 3.64G/3.74G [00:56<00:01, 50.2MiB/s]\u001b[A\n", " 98% 3.65G/3.74G [00:56<00:01, 51.2MiB/s]\u001b[A\n", " 98% 3.65G/3.74G [00:56<00:01, 51.1MiB/s]\u001b[A\n", " 98% 3.66G/3.74G [00:56<00:01, 52.8MiB/s]\u001b[A\n", " 98% 3.67G/3.74G [00:56<00:01, 54.5MiB/s]\u001b[A\n", " 98% 3.67G/3.74G [00:56<00:01, 54.8MiB/s]\u001b[A\n", " 98% 3.68G/3.74G [00:56<00:01, 55.7MiB/s]\u001b[A\n", " 98% 3.68G/3.74G [00:57<00:01, 56.4MiB/s]\u001b[A\n", " 99% 3.69G/3.74G [00:57<00:00, 55.3MiB/s]\u001b[A\n", " 99% 3.69G/3.74G [00:57<00:00, 56.5MiB/s]\u001b[A\n", " 99% 3.70G/3.74G [00:57<00:00, 56.8MiB/s]\u001b[A\n", " 99% 3.71G/3.74G [00:57<00:00, 56.3MiB/s]\u001b[A\n", " 99% 3.71G/3.74G [00:57<00:00, 57.6MiB/s]\u001b[A\n", " 99% 3.72G/3.74G [00:57<00:00, 69.3MiB/s]\u001b[A\n", "100% 3.73G/3.74G [00:57<00:00, 75.1MiB/s]\u001b[A\n", "100% 3.74G/3.74G [00:58<00:00, 64.0MiB/s]\n", "100% 5.35G/5.35G [01:19<00:00, 87.0MiB/s]\n", "100% 5.35G/5.35G [01:20<00:00, 66.6MiB/s]\n", "100% 6.11k/6.11k [00:00<00:00, 18.2MiB/s]\n", " > Model's license - MIT\n", " > Check https://choosealicense.com/licenses/mit/ for more info.\n", "2023-09-10 17:14:57.111436: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n", "Downloading (…)solve/main/vocab.txt: 100% 996k/996k [00:00<00:00, 16.1MB/s]\n", "Downloading (…)okenizer_config.json: 100% 29.0/29.0 [00:00<00:00, 170kB/s]\n", "Downloading (…)lve/main/config.json: 100% 625/625 [00:00<00:00, 3.24MB/s]\n", " > Using model: bark\n", "Downloading: \"https://dl.fbaipublicfiles.com/encodec/v0/encodec_24khz-d7cc33bc.th\" to /root/.cache/torch/hub/checkpoints/encodec_24khz-d7cc33bc.th\n", "100% 88.9M/88.9M [00:00<00:00, 157MB/s]\n", "Running on local URL: http://127.0.0.1:7860\n", "Running on public URL: https://6820cc891ce9add0c3.gradio.live\n", "\n", "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n", "Traceback (most recent call last):\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/queueing.py\", line 388, in call_prediction\n", " output = await route_utils.call_process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/route_utils.py\", line 219, in call_process_api\n", " output = await app.get_blocks().process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1437, in process_api\n", " result = await self.call_function(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1109, in call_function\n", " prediction = await anyio.to_thread.run_sync(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/to_thread.py\", line 33, in run_sync\n", " return await get_asynclib().run_sync_in_worker_thread(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 877, in run_sync_in_worker_thread\n", " return await future\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 807, in run\n", " result = context.run(func, *args)\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/utils.py\", line 641, in wrapper\n", " response = f(*args, **kwargs)\n", " File \"/content/instant-TTS-Bark-cloning/app.py\", line 97, in infer\n", " tts.tts_to_file(text=prompt,\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 387, in tts_to_file\n", " wav = self.tts(text=text, speaker=speaker, language=language, speaker_wav=speaker_wav, **kwargs)\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 334, in tts\n", " wav = self.synthesizer.tts(\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/utils/synthesizer.py\", line 282, in tts\n", " raise ValueError(\n", "ValueError: You need to define either `text` (for sythesis) or a `reference_wav` (for voice conversion) to use the Coqui TTS API.\n", "Traceback (most recent call last):\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/queueing.py\", line 388, in call_prediction\n", " output = await route_utils.call_process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/route_utils.py\", line 219, in call_process_api\n", " output = await app.get_blocks().process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1437, in process_api\n", " result = await self.call_function(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1109, in call_function\n", " prediction = await anyio.to_thread.run_sync(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/to_thread.py\", line 33, in run_sync\n", " return await get_asynclib().run_sync_in_worker_thread(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 877, in run_sync_in_worker_thread\n", " return await future\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 807, in run\n", " result = context.run(func, *args)\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/utils.py\", line 641, in wrapper\n", " response = f(*args, **kwargs)\n", " File \"/content/instant-TTS-Bark-cloning/app.py\", line 97, in infer\n", " tts.tts_to_file(text=prompt,\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 387, in tts_to_file\n", " wav = self.tts(text=text, speaker=speaker, language=language, speaker_wav=speaker_wav, **kwargs)\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 334, in tts\n", " wav = self.synthesizer.tts(\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/utils/synthesizer.py\", line 282, in tts\n", " raise ValueError(\n", "ValueError: You need to define either `text` (for sythesis) or a `reference_wav` (for voice conversion) to use the Coqui TTS API.\n", "Traceback (most recent call last):\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/queueing.py\", line 388, in call_prediction\n", " output = await route_utils.call_process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/route_utils.py\", line 219, in call_process_api\n", " output = await app.get_blocks().process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1437, in process_api\n", " result = await self.call_function(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1109, in call_function\n", " prediction = await anyio.to_thread.run_sync(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/to_thread.py\", line 33, in run_sync\n", " return await get_asynclib().run_sync_in_worker_thread(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 877, in run_sync_in_worker_thread\n", " return await future\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 807, in run\n", " result = context.run(func, *args)\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/utils.py\", line 641, in wrapper\n", " response = f(*args, **kwargs)\n", " File \"/content/instant-TTS-Bark-cloning/app.py\", line 97, in infer\n", " tts.tts_to_file(text=prompt,\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 387, in tts_to_file\n", " wav = self.tts(text=text, speaker=speaker, language=language, speaker_wav=speaker_wav, **kwargs)\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 334, in tts\n", " wav = self.synthesizer.tts(\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/utils/synthesizer.py\", line 282, in tts\n", " raise ValueError(\n", "ValueError: You need to define either `text` (for sythesis) or a `reference_wav` (for voice conversion) to use the Coqui TTS API.\n", "Traceback (most recent call last):\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/queueing.py\", line 388, in call_prediction\n", " output = await route_utils.call_process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/route_utils.py\", line 219, in call_process_api\n", " output = await app.get_blocks().process_api(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1437, in process_api\n", " result = await self.call_function(\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/blocks.py\", line 1109, in call_function\n", " prediction = await anyio.to_thread.run_sync(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/to_thread.py\", line 33, in run_sync\n", " return await get_asynclib().run_sync_in_worker_thread(\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 877, in run_sync_in_worker_thread\n", " return await future\n", " File \"/usr/local/lib/python3.10/dist-packages/anyio/_backends/_asyncio.py\", line 807, in run\n", " result = context.run(func, *args)\n", " File \"/usr/local/lib/python3.10/dist-packages/gradio/utils.py\", line 641, in wrapper\n", " response = f(*args, **kwargs)\n", " File \"/content/instant-TTS-Bark-cloning/app.py\", line 97, in infer\n", " tts.tts_to_file(text=prompt,\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 387, in tts_to_file\n", " wav = self.tts(text=text, speaker=speaker, language=language, speaker_wav=speaker_wav, **kwargs)\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/api.py\", line 334, in tts\n", " wav = self.synthesizer.tts(\n", " File \"/usr/local/lib/python3.10/dist-packages/TTS/utils/synthesizer.py\", line 282, in tts\n", " raise ValueError(\n", "ValueError: You need to define either `text` (for sythesis) or a `reference_wav` (for voice conversion) to use the Coqui TTS API.\n", " > Text splitted to sentences.\n", "['Hi how are you']\n", "Downloading HuBERT custom tokenizer\n", "Downloading (…)rt_base_ls960_14.pth: 100% 104M/104M [00:02<00:00, 36.1MB/s]\n", "Downloaded tokenizer\n", "Downloading (…)lve/main/config.json: 100% 1.39k/1.39k [00:00<00:00, 7.82MB/s]\n", "Downloading pytorch_model.bin: 100% 378M/378M [00:05<00:00, 64.9MB/s]\n", "100% 100/100 [00:02<00:00, 45.28it/s]\n", "100% 8/8 [00:07<00:00, 1.00it/s]\n", " > Processing time: 30.34160089492798\n", " > Real-time factor: 8.158930484550755\n", "voice_preview_Joanne - pensive introspective soft and lovely 1 1-0-100.wav\n", "voice_preview_Joanne - pensive introspective soft and lovely 1 1-0-100.npz\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/patches.py:739: RuntimeWarning: overflow encountered in short_scalars\n", " y1 = self.convert_yunits(self._y0 + self._height)\n", "ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\n", " built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\n", " configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\n", " libavutil 56. 70.100 / 56. 70.100\n", " libavcodec 58.134.100 / 58.134.100\n", " libavformat 58. 76.100 / 58. 76.100\n", " libavdevice 58. 13.100 / 58. 13.100\n", " libavfilter 7.110.100 / 7.110.100\n", " libswscale 5. 9.100 / 5. 9.100\n", " libswresample 3. 9.100 / 3. 9.100\n", " libpostproc 55. 9.100 / 55. 9.100\n", "Input #0, png_pipe, from '/tmp/tmpd2ethk12.png':\n", " Duration: N/A, bitrate: N/A\n", " Stream #0:0: Video: png, rgba(pc), 1000x400, 25 fps, 25 tbr, 25 tbn, 25 tbc\n", "\u001b[0;33mGuessed Channel Layout for Input Stream #1.0 : mono\n", "\u001b[0mInput #1, wav, from 'output.wav':\n", " Duration: 00:00:03.42, bitrate: 384 kb/s\n", " Stream #1:0: Audio: pcm_s16le ([1][0][0][0] / 0x0001), 24000 Hz, mono, s16, 384 kb/s\n", "Stream mapping:\n", " Stream #0:0 -> #0:0 (png (native) -> h264 (libx264))\n", " Stream #1:0 -> #0:1 (pcm_s16le (native) -> aac (native))\n", "Press [q] to stop, [?] for help\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0musing cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mprofile High, level 3.0, 4:2:0, 8-bit\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0m264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=3 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", "Output #0, mp4, to '/tmp/tmpo304xhpg.mp4':\n", " Metadata:\n", " encoder : Lavf58.76.100\n", " Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 1000x400, q=2-31, 25 fps, 12800 tbn\n", " Metadata:\n", " encoder : Lavc58.134.100 libx264\n", " Side data:\n", " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\n", " Stream #0:1: Audio: aac (LC) (mp4a / 0x6134706D), 24000 Hz, mono, fltp, 69 kb/s\n", " Metadata:\n", " encoder : Lavc58.134.100 aac\n", "frame= 85 fps=0.0 q=-1.0 Lsize= 44kB time=00:00:03.41 bitrate= 105.2kbits/s speed=4.07x \n", "video:13kB audio:28kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 8.501535%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mframe I:1 Avg QP:10.99 size: 2753\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mframe P:30 Avg QP:20.00 size: 208\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mframe B:54 Avg QP:16.20 size: 61\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mconsecutive B-frames: 10.6% 14.1% 0.0% 75.3%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mmb I I16..4: 91.7% 4.1% 4.3%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mmb P I16..4: 1.7% 2.4% 0.1% P16..4: 2.3% 0.1% 0.0% 0.0% 0.0% skip:93.3%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mmb B I16..4: 0.3% 0.0% 0.0% B16..8: 2.6% 0.4% 0.0% direct: 0.0% skip:96.7% L0:34.1% L1:65.9% BI: 0.0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0m8x8 transform intra:31.0% inter:39.2%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mcoded y,uvDC,uvAC intra: 1.4% 4.1% 3.2% inter: 0.0% 0.1% 0.0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mi16 v,h,dc,p: 95% 0% 5% 0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mi8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 18% 2% 81% 0% 0% 0% 0% 0% 0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mi4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 54% 19% 23% 0% 1% 1% 1% 1% 1%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mi8c dc,h,v,p: 82% 1% 17% 0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mWeighted P-Frames: Y:0.0% UV:0.0%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mref P L0: 95.5% 0.4% 3.0% 1.1%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mref B L0: 88.7% 11.2% 0.1%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mref B L1: 99.9% 0.1%\n", "\u001b[1;36m[libx264 @ 0x5818b5c33b80] \u001b[0mkb/s:28.94\n", "\u001b[1;36m[aac @ 0x5818b5c34e80] \u001b[0mQavg: 9516.688\n", " > Text splitted to sentences.\n", "['Bob Harvey first met Annette Adkins during study hall in 1955—and was immediately smitten.', '\"I couldn’t take my eyes off her,\" Harvey told the New York Times.', '\"She had auburn hair and a stunningly beautiful face and her eyes were just, wow.\"', 'The two teens ended up going to prom together, but as many young relationships go, they lost touch after high school and married other people.', 'Harvey never forgot about Adkins, though.', 'In 2017, after his wife died, he searched for Adkins on Google and discovered she had also become widowed.', 'He sent her a card with his phone number and after chatting for a bit, Harvey drove 500 miles to visit her, stopping only for gas and a bouquet of carnations.', '\"I handed her the flowers, and then I cupped her face in my hand and said, \\'Whether you like it or not, I’m going to kiss you,\\'\" he recalled.', \"In October, the high school sweethearts married at a '50s-style diner and danced to Johnny Mathis—just like they did at prom 63 years earlier.\"]\n", "100% 100/100 [00:05<00:00, 17.63it/s]\n", "100% 19/19 [00:17<00:00, 1.10it/s]\n", "100% 100/100 [00:03<00:00, 32.03it/s] \n", "100% 15/15 [00:14<00:00, 1.04it/s]\n", "100% 100/100 [00:05<00:00, 16.74it/s]\n", "100% 29/29 [00:28<00:00, 1.03it/s]\n", "100% 100/100 [00:04<00:00, 24.08it/s]\n", "100% 21/21 [00:20<00:00, 1.04it/s]\n", "100% 100/100 [00:03<00:00, 25.54it/s] \n", "100% 14/14 [00:13<00:00, 1.02it/s]\n", "100% 100/100 [00:05<00:00, 18.30it/s]\n", "100% 18/18 [00:17<00:00, 1.05it/s]\n", "100% 100/100 [00:07<00:00, 13.35it/s]\n", "100% 34/34 [00:34<00:00, 1.01s/it]\n", "100% 100/100 [00:08<00:00, 11.90it/s]\n", "100% 31/31 [00:30<00:00, 1.01it/s]\n", "100% 100/100 [00:08<00:00, 11.34it/s]\n", "100% 34/34 [00:34<00:00, 1.02s/it]\n", " > Processing time: 287.33636355400085\n", " > Real-time factor: 2.9880054783841343\n", "voice_preview_Joanne - pensive introspective soft and lovely 1 1-0-100.wav\n", "voice_preview_Joanne - pensive introspective soft and lovely 1 1-0-100.npz\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/axes/_axes.py:2229: RuntimeWarning: overflow encountered in short_scalars\n", " dx = [convert(x0 + ddx) - x for ddx in dx]\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/patches.py:739: RuntimeWarning: overflow encountered in short_scalars\n", " y1 = self.convert_yunits(self._y0 + self._height)\n", "ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\n", " built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\n", " configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\n", " libavutil 56. 70.100 / 56. 70.100\n", " libavcodec 58.134.100 / 58.134.100\n", " libavformat 58. 76.100 / 58. 76.100\n", " libavdevice 58. 13.100 / 58. 13.100\n", " libavfilter 7.110.100 / 7.110.100\n", " libswscale 5. 9.100 / 5. 9.100\n", " libswresample 3. 9.100 / 3. 9.100\n", " libpostproc 55. 9.100 / 55. 9.100\n", "Input #0, png_pipe, from '/tmp/tmpg8wlxynu.png':\n", " Duration: N/A, bitrate: N/A\n", " Stream #0:0: Video: png, rgba(pc), 1000x400, 25 fps, 25 tbr, 25 tbn, 25 tbc\n", "\u001b[0;33mGuessed Channel Layout for Input Stream #1.0 : mono\n", "\u001b[0mInput #1, wav, from 'output.wav':\n", " Duration: 00:01:28.35, bitrate: 384 kb/s\n", " Stream #1:0: Audio: pcm_s16le ([1][0][0][0] / 0x0001), 24000 Hz, mono, s16, 384 kb/s\n", "Stream mapping:\n", " Stream #0:0 -> #0:0 (png (native) -> h264 (libx264))\n", " Stream #1:0 -> #0:1 (pcm_s16le (native) -> aac (native))\n", "Press [q] to stop, [?] for help\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0musing cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mprofile High, level 3.0, 4:2:0, 8-bit\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0m264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=3 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", "Output #0, mp4, to '/tmp/tmpg6nv7891.mp4':\n", " Metadata:\n", " encoder : Lavf58.76.100\n", " Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 1000x400, q=2-31, 25 fps, 12800 tbn\n", " Metadata:\n", " encoder : Lavc58.134.100 libx264\n", " Side data:\n", " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\n", " Stream #0:1: Audio: aac (LC) (mp4a / 0x6134706D), 24000 Hz, mono, fltp, 69 kb/s\n", " Metadata:\n", " encoder : Lavc58.134.100 aac\n", "frame= 2209 fps= 84 q=-1.0 Lsize= 980kB time=00:01:28.32 bitrate= 90.9kbits/s speed=3.34x \n", "video:195kB audio:731kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 5.916169%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mframe I:9 Avg QP:11.25 size: 7294\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mframe P:556 Avg QP:20.17 size: 126\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mframe B:1644 Avg QP:15.89 size: 38\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mconsecutive B-frames: 0.8% 0.0% 0.0% 99.2%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mmb I I16..4: 87.0% 1.8% 11.1%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mmb P I16..4: 0.7% 0.2% 0.0% P16..4: 3.0% 0.1% 0.0% 0.0% 0.0% skip:95.9%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mmb B I16..4: 0.0% 0.0% 0.0% B16..8: 1.1% 0.0% 0.0% direct: 0.0% skip:98.8% L0:55.2% L1:44.7% BI: 0.1%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0m8x8 transform intra:8.5% inter:49.2%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mcoded y,uvDC,uvAC intra: 3.3% 9.3% 7.9% inter: 0.0% 0.0% 0.0%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mi16 v,h,dc,p: 96% 1% 3% 0%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mi8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 11% 2% 86% 1% 0% 0% 0% 0% 0%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mi4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 59% 19% 18% 0% 1% 1% 1% 1% 1%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mi8c dc,h,v,p: 26% 4% 69% 0%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mWeighted P-Frames: Y:0.0% UV:0.0%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mref P L0: 97.3% 0.1% 2.3% 0.3%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mref B L0: 70.9% 28.4% 0.7%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mref B L1: 99.4% 0.6%\n", "\u001b[1;36m[libx264 @ 0x5c76b5eba740] \u001b[0mkb/s:17.98\n", "\u001b[1;36m[aac @ 0x5c76b5ebbf80] \u001b[0mQavg: 7958.416\n" ] } ], "source": [ "!python app.py" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "background_save": true, "base_uri": "https://localhost:8080/" }, "id": "IcJRXDCwG61R", "outputId": "4dfb8211-121d-49a6-cb9e-75ffe8e1daf1" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "/usr/local/lib/python3.10/dist-packages/TTS/api.py:77: UserWarning: `gpu` will be deprecated. Please use `tts.to(device)` instead.\n", " warnings.warn(\"`gpu` will be deprecated. Please use `tts.to(device)` instead.\")\n", " > tts_models/multilingual/multi-dataset/bark is already downloaded.\n", "2023-09-05 07:11:17.023349: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n", " > Using model: bark\n", "Running on local URL: http://127.0.0.1:7860\n", "Running on public URL: https://037501a79514617442.gradio.live\n", "\n", "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n", " > Text splitted to sentences.\n", "['Hi Raja, Llama Llama Red pajama.', \"Today was a very tiring day and I can't believe it how it went.\", \"I'm happy that it was not very bad.\"]\n", "100% 100/100 [00:07<00:00, 13.70it/s]\n", "100% 31/31 [00:31<00:00, 1.02s/it]\n", "100% 100/100 [00:02<00:00, 34.29it/s] \n", "100% 15/15 [00:15<00:00, 1.02s/it]\n", "100% 100/100 [00:02<00:00, 41.95it/s] \n", "100% 12/12 [00:12<00:00, 1.06s/it]\n", " > Processing time: 90.9921088218689\n", " > Real-time factor: 3.493480985377854\n", "jordan20sec-0-100.wav\n", "jordan20sec-0-100.npz\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/axes/_axes.py:2229: RuntimeWarning: overflow encountered in short_scalars\n", " dx = [convert(x0 + ddx) - x for ddx in dx]\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/patches.py:739: RuntimeWarning: overflow encountered in short_scalars\n", " y1 = self.convert_yunits(self._y0 + self._height)\n", "ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\n", " built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\n", " configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\n", " libavutil 56. 70.100 / 56. 70.100\n", " libavcodec 58.134.100 / 58.134.100\n", " libavformat 58. 76.100 / 58. 76.100\n", " libavdevice 58. 13.100 / 58. 13.100\n", " libavfilter 7.110.100 / 7.110.100\n", " libswscale 5. 9.100 / 5. 9.100\n", " libswresample 3. 9.100 / 3. 9.100\n", " libpostproc 55. 9.100 / 55. 9.100\n", "Input #0, png_pipe, from '/tmp/tmpvv7uiwnb.png':\n", " Duration: N/A, bitrate: N/A\n", " Stream #0:0: Video: png, rgba(pc), 1000x400, 25 fps, 25 tbr, 25 tbn, 25 tbc\n", "\u001b[0;33mGuessed Channel Layout for Input Stream #1.0 : mono\n", "\u001b[0mInput #1, wav, from 'output.wav':\n", " Duration: 00:00:23.93, bitrate: 384 kb/s\n", " Stream #1:0: Audio: pcm_s16le ([1][0][0][0] / 0x0001), 24000 Hz, mono, s16, 384 kb/s\n", "Stream mapping:\n", " Stream #0:0 -> #0:0 (png (native) -> h264 (libx264))\n", " Stream #1:0 -> #0:1 (pcm_s16le (native) -> aac (native))\n", "Press [q] to stop, [?] for help\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0musing cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mprofile High, level 3.0, 4:2:0, 8-bit\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0m264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=3 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", "Output #0, mp4, to '/tmp/tmp3p2nj6fv.mp4':\n", " Metadata:\n", " encoder : Lavf58.76.100\n", " Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 1000x400, q=2-31, 25 fps, 12800 tbn\n", " Metadata:\n", " encoder : Lavc58.134.100 libx264\n", " Side data:\n", " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\n", " Stream #0:1: Audio: aac (LC) (mp4a / 0x6134706D), 24000 Hz, mono, fltp, 69 kb/s\n", " Metadata:\n", " encoder : Lavc58.134.100 aac\n", "frame= 598 fps= 85 q=-1.0 Lsize= 298kB time=00:00:23.89 bitrate= 102.3kbits/s speed= 3.4x \n", "video:82kB audio:201kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 5.440982%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mframe I:3 Avg QP:13.41 size: 6596\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mframe P:250 Avg QP:19.70 size: 176\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mframe B:345 Avg QP:17.07 size: 56\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mconsecutive B-frames: 15.9% 19.1% 7.5% 57.5%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mmb I I16..4: 75.2% 13.8% 11.0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mmb P I16..4: 1.1% 0.4% 0.0% P16..4: 4.5% 0.2% 0.0% 0.0% 0.0% skip:93.7%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mmb B I16..4: 0.1% 0.0% 0.0% B16..8: 1.6% 0.1% 0.0% direct: 0.0% skip:98.1% L0:43.1% L1:56.4% BI: 0.5%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0m8x8 transform intra:20.1% inter:47.8%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mcoded y,uvDC,uvAC intra: 2.4% 7.2% 6.1% inter: 0.0% 0.1% 0.0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mi16 v,h,dc,p: 98% 0% 2% 0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mi8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 19% 5% 76% 1% 0% 0% 0% 0% 0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mi4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 63% 18% 16% 0% 1% 1% 1% 0% 1%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mi8c dc,h,v,p: 42% 2% 56% 0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mWeighted P-Frames: Y:0.0% UV:0.0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mref P L0: 96.7% 0.1% 2.2% 0.9%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mref B L0: 78.1% 19.9% 2.0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mref B L1: 99.0% 1.0%\n", "\u001b[1;36m[libx264 @ 0x5a8aeeef0a40] \u001b[0mkb/s:27.80\n", "\u001b[1;36m[aac @ 0x5a8aeeef2280] \u001b[0mQavg: 5041.738\n", "/usr/local/lib/python3.10/dist-packages/gradio/processing_utils.py:188: UserWarning: Trying to convert audio automatically from int32 to 16-bit int format.\n", " warnings.warn(warning.format(data.dtype))\n", " > Text splitted to sentences.\n", "['Hi Raja, Llama Llama Red pajama.', \"Today was a very tiring day and I can't believe it how it went.\", \"I'm happy that it was not very bad.\"]\n", "100% 100/100 [00:07<00:00, 12.94it/s]\n", "100% 35/35 [00:35<00:00, 1.02s/it]\n", "100% 100/100 [00:05<00:00, 18.15it/s]\n", "100% 20/20 [00:19<00:00, 1.01it/s]\n", "100% 100/100 [00:06<00:00, 16.30it/s]\n", "100% 26/26 [00:26<00:00, 1.02s/it]\n", " > Processing time: 113.43854403495789\n", " > Real-time factor: 3.1395219097936806\n", "audio-0-100.wav\n", "audio-0-100.npz\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/axes/_axes.py:2229: RuntimeWarning: overflow encountered in short_scalars\n", " dx = [convert(x0 + ddx) - x for ddx in dx]\n", "/usr/local/lib/python3.10/dist-packages/matplotlib/patches.py:739: RuntimeWarning: overflow encountered in short_scalars\n", " y1 = self.convert_yunits(self._y0 + self._height)\n", "ffmpeg version 4.4.2-0ubuntu0.22.04.1 Copyright (c) 2000-2021 the FFmpeg developers\n", " built with gcc 11 (Ubuntu 11.2.0-19ubuntu1)\n", " configuration: --prefix=/usr --extra-version=0ubuntu0.22.04.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libdav1d --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librabbitmq --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libsrt --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzimg --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-pocketsphinx --enable-librsvg --enable-libmfx --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared\n", " libavutil 56. 70.100 / 56. 70.100\n", " libavcodec 58.134.100 / 58.134.100\n", " libavformat 58. 76.100 / 58. 76.100\n", " libavdevice 58. 13.100 / 58. 13.100\n", " libavfilter 7.110.100 / 7.110.100\n", " libswscale 5. 9.100 / 5. 9.100\n", " libswresample 3. 9.100 / 3. 9.100\n", " libpostproc 55. 9.100 / 55. 9.100\n", "Input #0, png_pipe, from '/tmp/tmpujyofy0d.png':\n", " Duration: N/A, bitrate: N/A\n", " Stream #0:0: Video: png, rgba(pc), 1000x400, 25 fps, 25 tbr, 25 tbn, 25 tbc\n", "\u001b[0;33mGuessed Channel Layout for Input Stream #1.0 : mono\n", "\u001b[0mInput #1, wav, from 'output.wav':\n", " Duration: 00:00:33.20, bitrate: 384 kb/s\n", " Stream #1:0: Audio: pcm_s16le ([1][0][0][0] / 0x0001), 24000 Hz, mono, s16, 384 kb/s\n", "Stream mapping:\n", " Stream #0:0 -> #0:0 (png (native) -> h264 (libx264))\n", " Stream #1:0 -> #0:1 (pcm_s16le (native) -> aac (native))\n", "Press [q] to stop, [?] for help\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0musing cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mprofile High, level 3.0, 4:2:0, 8-bit\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0m264 - core 163 r3060 5db6aa6 - H.264/MPEG-4 AVC codec - Copyleft 2003-2021 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=3 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", "Output #0, mp4, to '/tmp/tmp5pmtmaeh.mp4':\n", " Metadata:\n", " encoder : Lavf58.76.100\n", " Stream #0:0: Video: h264 (avc1 / 0x31637661), yuv420p(tv, progressive), 1000x400, q=2-31, 25 fps, 12800 tbn\n", " Metadata:\n", " encoder : Lavc58.134.100 libx264\n", " Side data:\n", " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: N/A\n", " Stream #0:1: Audio: aac (LC) (mp4a / 0x6134706D), 24000 Hz, mono, fltp, 69 kb/s\n", " Metadata:\n", " encoder : Lavc58.134.100 aac\n", "frame= 830 fps= 81 q=-1.0 Lsize= 391kB time=00:00:33.19 bitrate= 96.4kbits/s speed=3.25x \n", "video:93kB audio:276kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 5.758711%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mframe I:4 Avg QP:12.94 size: 6450\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mframe P:278 Avg QP:20.63 size: 155\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mframe B:548 Avg QP:16.81 size: 47\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mconsecutive B-frames: 4.5% 19.5% 9.0% 67.0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mmb I I16..4: 85.1% 5.3% 9.6%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mmb P I16..4: 1.0% 0.4% 0.0% P16..4: 3.6% 0.1% 0.0% 0.0% 0.0% skip:94.8%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mmb B I16..4: 0.1% 0.0% 0.0% B16..8: 1.5% 0.1% 0.0% direct: 0.0% skip:98.3% L0:41.6% L1:58.2% BI: 0.2%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0m8x8 transform intra:16.4% inter:41.9%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mcoded y,uvDC,uvAC intra: 2.4% 7.1% 5.9% inter: 0.0% 0.0% 0.0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mi16 v,h,dc,p: 97% 0% 2% 0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mi8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 12% 1% 86% 1% 0% 0% 0% 0% 0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mi4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 62% 20% 14% 0% 1% 1% 1% 1% 1%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mi8c dc,h,v,p: 44% 2% 54% 0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mWeighted P-Frames: Y:0.0% UV:0.0%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mref P L0: 96.7% 0.2% 2.4% 0.7%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mref B L0: 82.8% 15.5% 1.7%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mref B L1: 99.7% 0.3%\n", "\u001b[1;36m[libx264 @ 0x55ec971bef80] \u001b[0mkb/s:22.85\n", "\u001b[1;36m[aac @ 0x55ec971c09c0] \u001b[0mQavg: 2766.381\n" ] } ], "source": [ "!python app.py" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "7ARlmJE2KxSl" }, "outputs": [], "source": [] } ], "metadata": { "accelerator": "GPU", "colab": { "provenance": [] }, "kernelspec": { "display_name": "Python 3", "name": "python3" }, "language_info": { "name": "python" } }, "nbformat": 4, "nbformat_minor": 0 }