LearnItAnyway commited on
Commit
c62d0e0
1 Parent(s): bd25455

Upload tester.ipynb

Browse files
Files changed (1) hide show
  1. tester.ipynb +455 -219
tester.ipynb CHANGED
@@ -2,47 +2,323 @@
2
  "cells": [
3
  {
4
  "cell_type": "code",
5
- "execution_count": null,
6
  "id": "cb5d0890-3f2d-4020-8270-f3a9bb9f63c6",
7
- "metadata": {},
8
- "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9
  "source": [
10
- "%%bash # install the vall-e and required libraries\n",
 
11
  "# PyTorch\n",
12
  "pip install torch==1.13.1 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116\n",
13
  "pip install torchmetrics==0.11.1\n",
14
  "# fbank\n",
15
- "pip install librosa==0.8.1\n",
16
  "\n",
17
  "# phonemizer pypinyin\n",
18
- "apt-get install espeak-ng\n",
19
  "## OSX: brew install espeak\n",
20
  "pip install phonemizer==3.2.1 pypinyin==0.48.0\n",
21
  "\n",
22
- "# lhotse update to newest version\n",
23
- "# https://github.com/lhotse-speech/lhotse/pull/956\n",
24
- "# https://github.com/lhotse-speech/lhotse/pull/960\n",
25
- "pip uninstall lhotse\n",
26
  "pip install lhotse\n",
27
  "\n",
28
  "# k2\n",
29
  "# find the right version in https://huggingface.co/csukuangfj/k2\n",
30
- "pip install https://huggingface.co/csukuangfj/k2/resolve/main/cuda/k2-1.23.4.dev20230224+cuda11.6.torch1.13.1-cp310-cp310-linux_x86_64.whl\n",
 
31
  "\n",
32
- "# icefall\n",
33
  "git clone https://github.com/k2-fsa/icefall\n",
34
- "cd icefall\n",
 
35
  "pip install -r requirements.txt\n",
 
36
  "export PYTHONPATH=`pwd`/../icefall:$PYTHONPATH\n",
37
  "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.zshrc\n",
38
  "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.bashrc\n",
39
- "cd -\n",
40
  "source ~/.zshrc\n",
 
41
  "\n",
42
- "# valle\n",
43
- "git clone https://github.com/lifeiteng/valle.git\n",
44
- "cd valle\n",
45
- "pip install -e ."
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  ]
47
  },
48
  {
@@ -52,20 +328,60 @@
52
  "metadata": {},
53
  "outputs": [
54
  {
55
- "name": "stderr",
56
  "output_type": "stream",
57
  "text": [
58
- "/home/dongsun/.local/lib/python3.10/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: '/home/dongsun/.local/lib/python3.10/site-packages/torchvision/image.so: undefined symbol: _ZN3c104cuda20CUDACachingAllocator9allocatorE'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source?\n",
59
- " warn(\n"
60
  ]
61
  },
62
  {
63
- "name": "stdout",
64
  "output_type": "stream",
65
  "text": [
66
- "[2023-09-21 14:36:33,978] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\n",
67
- "Use 8 cpu cores for computing\n"
68
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  }
70
  ],
71
  "source": [
@@ -87,7 +403,7 @@
87
  " AudioTokenizer,\n",
88
  " TextTokenizer,\n",
89
  " tokenize_audio,\n",
90
- " tokenize_text,\n",
91
  ")\n",
92
  "from icefall.utils import AttributeDict\n",
93
  "from valle.data.collation import get_text_token_collater\n",
@@ -175,104 +491,10 @@
175
  },
176
  {
177
  "cell_type": "code",
178
- "execution_count": 2,
179
  "id": "41e40fe5-595e-4f9a-8dd7-dfda52944529",
180
  "metadata": {},
181
- "outputs": [
182
- {
183
- "data": {
184
- "text/html": [
185
- "<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\"><span style=\"color: #800000; text-decoration-color: #800000\">╭─────────────────────────────── </span><span style=\"color: #800000; text-decoration-color: #800000; font-weight: bold\">Traceback </span><span style=\"color: #bf7f7f; text-decoration-color: #bf7f7f; font-weight: bold\">(most recent call last)</span><span style=\"color: #800000; text-decoration-color: #800000\"> ────────────────────────────────╮</span>\n",
186
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> in <span style=\"color: #00ff00; text-decoration-color: #00ff00\">&lt;module&gt;</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
187
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
188
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">1 </span>text_prompt = <span style=\"color: #808000; text-decoration-color: #808000\">''</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"># text of the audio </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
189
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">2 </span>audio_prompt = <span style=\"color: #808000; text-decoration-color: #808000\">''</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"># path to the audio file</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
190
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">3 </span>text = <span style=\"color: #808000; text-decoration-color: #808000\">''</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"># </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
191
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">❱ </span>4 message, (sr, data) = infer_from_prompt(text_prompt, audio_prompt, text) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
192
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">5 </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
193
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
194
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #bfbf7f; text-decoration-color: #bfbf7f\">/home/dongsun/.local/lib/python3.10/site-packages/torch/autograd/</span><span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">grad_mode.py</span>:<span style=\"color: #0000ff; text-decoration-color: #0000ff\">27</span> in <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
195
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #00ff00; text-decoration-color: #00ff00\">decorate_context</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
196
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
197
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 24 │ │ </span><span style=\"color: #ff00ff; text-decoration-color: #ff00ff; font-weight: bold\">@functools</span>.wraps(func) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
198
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 25 │ │ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">def</span> <span style=\"color: #00ff00; text-decoration-color: #00ff00\">decorate_context</span>(*args, **kwargs): <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
199
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 26 │ │ │ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">with</span> <span style=\"color: #00ffff; text-decoration-color: #00ffff\">self</span>.clone(): <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
200
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">❱ </span> 27 <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">│ │ │ │ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">return</span> func(*args, **kwargs) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
201
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 28 │ │ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">return</span> cast(F, decorate_context) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
202
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 29 │ </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
203
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"> 30 │ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">def</span> <span style=\"color: #00ff00; text-decoration-color: #00ff00\">_wrap_generator</span>(<span style=\"color: #00ffff; text-decoration-color: #00ffff\">self</span>, func): <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
204
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
205
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> in <span style=\"color: #00ff00; text-decoration-color: #00ff00\">infer_from_prompt</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
206
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
207
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">64 │ ## text to token</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
208
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">65 │ </span>text_tokens, text_tokens_lens = text_collater( <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
209
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">66 │ │ </span>[ <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
210
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">❱ </span>67 <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">│ │ │ </span>tokenize_text( <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
211
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">68 │ │ │ │ </span>text_tokenizer, text=<span style=\"color: #808000; text-decoration-color: #808000\">f\"{</span>text_prompt<span style=\"color: #808000; text-decoration-color: #808000\">} {</span>text<span style=\"color: #808000; text-decoration-color: #808000\">}\"</span>.strip() <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
212
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">69 │ │ │ </span>) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
213
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">70 │ │ </span>] <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
214
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
215
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #bfbf7f; text-decoration-color: #bfbf7f\">/home/dongsun/vall-e/valle/data/</span><span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">tokenizer.py</span>:<span style=\"color: #0000ff; text-decoration-color: #0000ff\">178</span> in <span style=\"color: #00ff00; text-decoration-color: #00ff00\">tokenize_text</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
216
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
217
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">175 </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
218
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">176 </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">def</span> <span style=\"color: #00ff00; text-decoration-color: #00ff00\">tokenize_text</span>(tokenizer: TextTokenizer, text: <span style=\"color: #00ffff; text-decoration-color: #00ffff\">str</span>) -&gt; List[<span style=\"color: #00ffff; text-decoration-color: #00ffff\">str</span>]: <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
219
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">177 │ </span>phonemes = tokenizer([text.strip()]) <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
220
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #800000; text-decoration-color: #800000\">❱ </span>178 <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">│ </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">return</span> phonemes[<span style=\"color: #0000ff; text-decoration-color: #0000ff\">0</span>] <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\"># k2symbols</span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
221
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">179 </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
222
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">180 </span> <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
223
- "<span style=\"color: #800000; text-decoration-color: #800000\">│</span> <span style=\"color: #7f7f7f; text-decoration-color: #7f7f7f\">181 </span><span style=\"color: #0000ff; text-decoration-color: #0000ff\">def</span> <span style=\"color: #00ff00; text-decoration-color: #00ff00\">remove_encodec_weight_norm</span>(model): <span style=\"color: #800000; text-decoration-color: #800000\">│</span>\n",
224
- "<span style=\"color: #800000; text-decoration-color: #800000\">╰──────────────────────────────────────────────────────────────────────────────────────────────────╯</span>\n",
225
- "<span style=\"color: #ff0000; text-decoration-color: #ff0000; font-weight: bold\">IndexError: </span>list index out of range\n",
226
- "</pre>\n"
227
- ],
228
- "text/plain": [
229
- "\u001b[31m╭─\u001b[0m\u001b[31m──────────────────────────────\u001b[0m\u001b[31m \u001b[0m\u001b[1;31mTraceback \u001b[0m\u001b[1;2;31m(most recent call last)\u001b[0m\u001b[31m \u001b[0m\u001b[31m───────────────────────────────\u001b[0m\u001b[31m─╮\u001b[0m\n",
230
- "\u001b[31m│\u001b[0m in \u001b[92m<module>\u001b[0m \u001b[31m│\u001b[0m\n",
231
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
232
- "\u001b[31m│\u001b[0m \u001b[2m1 \u001b[0mtext_prompt = \u001b[33m'\u001b[0m\u001b[33m'\u001b[0m \u001b[2m# text of the audio \u001b[0m \u001b[31m│\u001b[0m\n",
233
- "\u001b[31m│\u001b[0m \u001b[2m2 \u001b[0maudio_prompt = \u001b[33m'\u001b[0m\u001b[33m'\u001b[0m \u001b[2m# path to the audio file\u001b[0m \u001b[31m│\u001b[0m\n",
234
- "\u001b[31m│\u001b[0m \u001b[2m3 \u001b[0mtext = \u001b[33m'\u001b[0m\u001b[33m'\u001b[0m \u001b[2m# \u001b[0m \u001b[31m│\u001b[0m\n",
235
- "\u001b[31m│\u001b[0m \u001b[31m❱ \u001b[0m4 message, (sr, data) = infer_from_prompt(text_prompt, audio_prompt, text) \u001b[31m│\u001b[0m\n",
236
- "\u001b[31m│\u001b[0m \u001b[2m5 \u001b[0m \u001b[31m│\u001b[0m\n",
237
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
238
- "\u001b[31m│\u001b[0m \u001b[2;33m/home/dongsun/.local/lib/python3.10/site-packages/torch/autograd/\u001b[0m\u001b[1;33mgrad_mode.py\u001b[0m:\u001b[94m27\u001b[0m in \u001b[31m│\u001b[0m\n",
239
- "\u001b[31m│\u001b[0m \u001b[92mdecorate_context\u001b[0m \u001b[31m│\u001b[0m\n",
240
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
241
- "\u001b[31m│\u001b[0m \u001b[2m 24 \u001b[0m\u001b[2m│ │ \u001b[0m\u001b[1;95m@functools\u001b[0m.wraps(func) \u001b[31m│\u001b[0m\n",
242
- "\u001b[31m│\u001b[0m \u001b[2m 25 \u001b[0m\u001b[2m│ │ \u001b[0m\u001b[94mdef\u001b[0m \u001b[92mdecorate_context\u001b[0m(*args, **kwargs): \u001b[31m│\u001b[0m\n",
243
- "\u001b[31m│\u001b[0m \u001b[2m 26 \u001b[0m\u001b[2m│ │ │ \u001b[0m\u001b[94mwith\u001b[0m \u001b[96mself\u001b[0m.clone(): \u001b[31m│\u001b[0m\n",
244
- "\u001b[31m│\u001b[0m \u001b[31m❱ \u001b[0m 27 \u001b[2m│ │ │ │ \u001b[0m\u001b[94mreturn\u001b[0m func(*args, **kwargs) \u001b[31m│\u001b[0m\n",
245
- "\u001b[31m│\u001b[0m \u001b[2m 28 \u001b[0m\u001b[2m│ │ \u001b[0m\u001b[94mreturn\u001b[0m cast(F, decorate_context) \u001b[31m│\u001b[0m\n",
246
- "\u001b[31m│\u001b[0m \u001b[2m 29 \u001b[0m\u001b[2m│ \u001b[0m \u001b[31m│\u001b[0m\n",
247
- "\u001b[31m│\u001b[0m \u001b[2m 30 \u001b[0m\u001b[2m│ \u001b[0m\u001b[94mdef\u001b[0m \u001b[92m_wrap_generator\u001b[0m(\u001b[96mself\u001b[0m, func): \u001b[31m│\u001b[0m\n",
248
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
249
- "\u001b[31m│\u001b[0m in \u001b[92minfer_from_prompt\u001b[0m \u001b[31m│\u001b[0m\n",
250
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
251
- "\u001b[31m│\u001b[0m \u001b[2m64 \u001b[0m\u001b[2m│ \u001b[0m\u001b[2m## text to token\u001b[0m \u001b[31m│\u001b[0m\n",
252
- "\u001b[31m│\u001b[0m \u001b[2m65 \u001b[0m\u001b[2m│ \u001b[0mtext_tokens, text_tokens_lens = text_collater( \u001b[31m│\u001b[0m\n",
253
- "\u001b[31m│\u001b[0m \u001b[2m66 \u001b[0m\u001b[2m│ │ \u001b[0m[ \u001b[31m│\u001b[0m\n",
254
- "\u001b[31m│\u001b[0m \u001b[31m❱ \u001b[0m67 \u001b[2m│ │ │ \u001b[0mtokenize_text( \u001b[31m│\u001b[0m\n",
255
- "\u001b[31m│\u001b[0m \u001b[2m68 \u001b[0m\u001b[2m│ │ │ │ \u001b[0mtext_tokenizer, text=\u001b[33mf\u001b[0m\u001b[33m\"\u001b[0m\u001b[33m{\u001b[0mtext_prompt\u001b[33m}\u001b[0m\u001b[33m \u001b[0m\u001b[33m{\u001b[0mtext\u001b[33m}\u001b[0m\u001b[33m\"\u001b[0m.strip() \u001b[31m│\u001b[0m\n",
256
- "\u001b[31m│\u001b[0m \u001b[2m69 \u001b[0m\u001b[2m│ │ │ \u001b[0m) \u001b[31m│\u001b[0m\n",
257
- "\u001b[31m│\u001b[0m \u001b[2m70 \u001b[0m\u001b[2m│ │ \u001b[0m] \u001b[31m│\u001b[0m\n",
258
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
259
- "\u001b[31m│\u001b[0m \u001b[2;33m/home/dongsun/vall-e/valle/data/\u001b[0m\u001b[1;33mtokenizer.py\u001b[0m:\u001b[94m178\u001b[0m in \u001b[92mtokenize_text\u001b[0m \u001b[31m│\u001b[0m\n",
260
- "\u001b[31m│\u001b[0m \u001b[31m│\u001b[0m\n",
261
- "\u001b[31m│\u001b[0m \u001b[2m175 \u001b[0m \u001b[31m│\u001b[0m\n",
262
- "\u001b[31m│\u001b[0m \u001b[2m176 \u001b[0m\u001b[94mdef\u001b[0m \u001b[92mtokenize_text\u001b[0m(tokenizer: TextTokenizer, text: \u001b[96mstr\u001b[0m) -> List[\u001b[96mstr\u001b[0m]: \u001b[31m│\u001b[0m\n",
263
- "\u001b[31m│\u001b[0m \u001b[2m177 \u001b[0m\u001b[2m│ \u001b[0mphonemes = tokenizer([text.strip()]) \u001b[31m│\u001b[0m\n",
264
- "\u001b[31m│\u001b[0m \u001b[31m❱ \u001b[0m178 \u001b[2m│ \u001b[0m\u001b[94mreturn\u001b[0m phonemes[\u001b[94m0\u001b[0m] \u001b[2m# k2symbols\u001b[0m \u001b[31m│\u001b[0m\n",
265
- "\u001b[31m│\u001b[0m \u001b[2m179 \u001b[0m \u001b[31m│\u001b[0m\n",
266
- "\u001b[31m│\u001b[0m \u001b[2m180 \u001b[0m \u001b[31m│\u001b[0m\n",
267
- "\u001b[31m│\u001b[0m \u001b[2m181 \u001b[0m\u001b[94mdef\u001b[0m \u001b[92mremove_encodec_weight_norm\u001b[0m(model): \u001b[31m│\u001b[0m\n",
268
- "\u001b[31m╰──────────────────────────────────────────────────────────────────────────────────────────────────╯\u001b[0m\n",
269
- "\u001b[1;91mIndexError: \u001b[0mlist index out of range\n"
270
- ]
271
- },
272
- "metadata": {},
273
- "output_type": "display_data"
274
- }
275
- ],
276
  "source": [
277
  "text_prompt = '' # text of the audio \n",
278
  "audio_prompt = '' # path to the audio file\n",
@@ -305,10 +527,7 @@
305
  "execution_count": 3,
306
  "id": "723c13c7-36f5-4af6-bc0b-bbf6d65c2e3a",
307
  "metadata": {
308
- "collapsed": true,
309
- "jupyter": {
310
- "outputs_hidden": true
311
- },
312
  "tags": []
313
  },
314
  "outputs": [
@@ -316,80 +535,114 @@
316
  "name": "stdout",
317
  "output_type": "stream",
318
  "text": [
319
- "Defaulting to user installation because normal site-packages is not writeable\n",
320
- "\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
321
- "\u001b[0m\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
322
- "\u001b[0mRequirement already satisfied: gradio in /home/dongsun/.local/lib/python3.10/site-packages (3.32.0)\n",
323
- "Requirement already satisfied: markdown-it-py[linkify]>=2.0.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.1.0)\n",
324
- "Requirement already satisfied: semantic-version in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.10.0)\n",
325
- "Requirement already satisfied: pandas in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.0.3)\n",
326
- "Requirement already satisfied: uvicorn>=0.14.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.19.0)\n",
327
- "Requirement already satisfied: mdit-py-plugins<=0.3.3 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.3.1)\n",
328
- "Requirement already satisfied: httpx in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.23.0)\n",
329
- "Requirement already satisfied: orjson in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (3.8.0)\n",
330
- "Requirement already satisfied: ffmpy in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.3.0)\n",
331
- "Requirement already satisfied: pygments>=2.12.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.14.0)\n",
332
- "Requirement already satisfied: pillow in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (9.5.0)\n",
333
- "Requirement already satisfied: numpy in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (1.23.0)\n",
334
- "Requirement already satisfied: python-multipart in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.0.5)\n",
335
- "Requirement already satisfied: markupsafe in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.1.0)\n",
336
- "Requirement already satisfied: pydantic in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (1.8.2)\n",
337
- "Requirement already satisfied: aiohttp in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (3.8.1)\n",
338
- "Requirement already satisfied: websockets>=10.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (10.3)\n",
339
- "Requirement already satisfied: typing-extensions in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (4.5.0)\n",
340
- "Requirement already satisfied: gradio-client>=0.2.4 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.2.5)\n",
341
- "Requirement already satisfied: matplotlib in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (3.7.0)\n",
342
- "Requirement already satisfied: huggingface-hub>=0.13.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.15.1)\n",
343
- "Requirement already satisfied: pydub in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.25.1)\n",
344
- "Requirement already satisfied: fastapi in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (0.94.0)\n",
345
- "Requirement already satisfied: requests in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (2.31.0)\n",
346
- "Requirement already satisfied: jinja2 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (3.0.3)\n",
347
- "Requirement already satisfied: pyyaml in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (6.0)\n",
348
- "Requirement already satisfied: aiofiles in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (23.1.0)\n",
349
- "Requirement already satisfied: altair>=4.2.0 in /home/dongsun/.local/lib/python3.10/site-packages (from gradio) (4.2.2)\n",
350
- "Requirement already satisfied: jsonschema>=3.0 in /home/dongsun/.local/lib/python3.10/site-packages (from altair>=4.2.0->gradio) (4.4.0)\n",
351
- "Requirement already satisfied: entrypoints in /home/dongsun/.local/lib/python3.10/site-packages (from altair>=4.2.0->gradio) (0.4)\n",
352
- "Requirement already satisfied: toolz in /home/dongsun/.local/lib/python3.10/site-packages (from altair>=4.2.0->gradio) (0.11.2)\n",
353
- "Requirement already satisfied: fsspec in /home/dongsun/.local/lib/python3.10/site-packages (from gradio-client>=0.2.4->gradio) (2022.3.0)\n",
354
- "Requirement already satisfied: packaging in /home/dongsun/.local/lib/python3.10/site-packages (from gradio-client>=0.2.4->gradio) (23.1)\n",
355
- "Requirement already satisfied: filelock in /home/dongsun/.local/lib/python3.10/site-packages (from huggingface-hub>=0.13.0->gradio) (3.11.0)\n",
356
- "Requirement already satisfied: tqdm>=4.42.1 in /home/dongsun/.local/lib/python3.10/site-packages (from huggingface-hub>=0.13.0->gradio) (4.65.0)\n",
357
- "Requirement already satisfied: mdurl~=0.1 in /home/dongsun/.local/lib/python3.10/site-packages (from markdown-it-py[linkify]>=2.0.0->gradio) (0.1.2)\n",
358
- "Requirement already satisfied: linkify-it-py~=1.0 in /home/dongsun/.local/lib/python3.10/site-packages (from markdown-it-py[linkify]>=2.0.0->gradio) (1.0.3)\n",
359
- "Requirement already satisfied: pytz>=2020.1 in /usr/lib/python3.10/site-packages (from pandas->gradio) (2022.7)\n",
360
- "Requirement already satisfied: tzdata>=2022.1 in /home/dongsun/.local/lib/python3.10/site-packages (from pandas->gradio) (2022.7)\n",
361
- "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/lib/python3.10/site-packages (from pandas->gradio) (2.8.2)\n",
362
- "Requirement already satisfied: h11>=0.8 in /home/dongsun/.local/lib/python3.10/site-packages (from uvicorn>=0.14.0->gradio) (0.12.0)\n",
363
- "Requirement already satisfied: click>=7.0 in /usr/lib/python3.10/site-packages (from uvicorn>=0.14.0->gradio) (8.1.3)\n",
364
- "Requirement already satisfied: frozenlist>=1.1.1 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (1.3.0)\n",
365
- "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (4.0.2)\n",
366
- "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (2.1.1)\n",
367
- "Requirement already satisfied: attrs>=17.3.0 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (21.4.0)\n",
368
- "Requirement already satisfied: yarl<2.0,>=1.0 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (1.7.2)\n",
369
- "Requirement already satisfied: multidict<7.0,>=4.5 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (6.0.2)\n",
370
- "Requirement already satisfied: aiosignal>=1.1.2 in /home/dongsun/.local/lib/python3.10/site-packages (from aiohttp->gradio) (1.2.0)\n",
371
- "Requirement already satisfied: starlette<0.27.0,>=0.26.0 in /home/dongsun/.local/lib/python3.10/site-packages (from fastapi->gradio) (0.26.1)\n",
372
- "Requirement already satisfied: certifi in /home/dongsun/.local/lib/python3.10/site-packages (from httpx->gradio) (2022.12.7)\n",
373
- "Requirement already satisfied: sniffio in /home/dongsun/.local/lib/python3.10/site-packages (from httpx->gradio) (1.2.0)\n",
374
- "Requirement already satisfied: rfc3986[idna2008]<2,>=1.3 in /home/dongsun/.local/lib/python3.10/site-packages (from httpx->gradio) (1.5.0)\n",
375
- "Requirement already satisfied: httpcore<0.16.0,>=0.15.0 in /home/dongsun/.local/lib/python3.10/site-packages (from httpx->gradio) (0.15.0)\n",
376
- "Requirement already satisfied: kiwisolver>=1.0.1 in /home/dongsun/.local/lib/python3.10/site-packages (from matplotlib->gradio) (1.3.2)\n",
377
- "Requirement already satisfied: fonttools>=4.22.0 in /home/dongsun/.local/lib/python3.10/site-packages (from matplotlib->gradio) (4.29.1)\n",
378
- "Requirement already satisfied: contourpy>=1.0.1 in /home/dongsun/.local/lib/python3.10/site-packages (from matplotlib->gradio) (1.0.7)\n",
379
- "Requirement already satisfied: pyparsing>=2.3.1 in /usr/lib/python3.10/site-packages (from matplotlib->gradio) (3.0.9)\n",
380
- "Requirement already satisfied: cycler>=0.10 in /home/dongsun/.local/lib/python3.10/site-packages (from matplotlib->gradio) (0.11.0)\n",
381
- "Requirement already satisfied: six>=1.4.0 in /usr/lib/python3.10/site-packages (from python-multipart->gradio) (1.16.0)\n",
382
- "Requirement already satisfied: idna<4,>=2.5 in /home/dongsun/.local/lib/python3.10/site-packages (from requests->gradio) (2.10)\n",
383
- "Requirement already satisfied: urllib3<3,>=1.21.1 in /home/dongsun/.local/lib/python3.10/site-packages (from requests->gradio) (1.26.15)\n",
384
- "Requirement already satisfied: anyio==3.* in /home/dongsun/.local/lib/python3.10/site-packages (from httpcore<0.16.0,>=0.15.0->httpx->gradio) (3.5.0)\n",
385
- "Requirement already satisfied: pyrsistent!=0.17.0,!=0.17.1,!=0.17.2,>=0.14.0 in /home/dongsun/.local/lib/python3.10/site-packages (from jsonschema>=3.0->altair>=4.2.0->gradio) (0.18.1)\n",
386
- "Requirement already satisfied: uc-micro-py in /home/dongsun/.local/lib/python3.10/site-packages (from linkify-it-py~=1.0->markdown-it-py[linkify]>=2.0.0->gradio) (1.0.1)\n",
387
- "\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
388
- "\u001b[0m\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
389
- "\u001b[0m\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
390
- "\u001b[0m\u001b[33mWARNING: Ignoring invalid distribution -orch (/home/dongsun/.local/lib/python3.10/site-packages)\u001b[0m\u001b[33m\n",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
391
  "\u001b[0m\n",
392
- "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.0.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m23.2.1\u001b[0m\n",
393
  "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpython -m pip install --upgrade pip\u001b[0m\n"
394
  ]
395
  }
@@ -409,15 +662,15 @@
409
  "output_type": "stream",
410
  "text": [
411
  "Running on local URL: http://127.0.0.1:7860\n",
412
- "Running on public URL: https://b3512daf295a0b63b1.gradio.live\n",
413
  "\n",
414
- "This share link expires in 72 hours. For free permanent hosting and GPU upgrades (NEW!), check out Spaces: https://huggingface.co/spaces\n"
415
  ]
416
  },
417
  {
418
  "data": {
419
  "text/html": [
420
- "<div><iframe src=\"https://b3512daf295a0b63b1.gradio.live\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
421
  ],
422
  "text/plain": [
423
  "<IPython.core.display.HTML object>"
@@ -433,23 +686,6 @@
433
  "execution_count": 4,
434
  "metadata": {},
435
  "output_type": "execute_result"
436
- },
437
- {
438
- "name": "stdout",
439
- "output_type": "stream",
440
- "text": [
441
- "text_loaded\n",
442
- "Audio encoded\n",
443
- "VALL-E EOS [356 -> 899]\n"
444
- ]
445
- },
446
- {
447
- "name": "stderr",
448
- "output_type": "stream",
449
- "text": [
450
- "/home/dongsun/.local/lib/python3.10/site-packages/gradio/processing_utils.py:171: UserWarning: Trying to convert audio automatically from float32 to 16-bit int format.\n",
451
- " warnings.warn(warning.format(data.dtype))\n"
452
- ]
453
  }
454
  ],
455
  "source": [
@@ -502,7 +738,7 @@
502
  "name": "python",
503
  "nbconvert_exporter": "python",
504
  "pygments_lexer": "ipython3",
505
- "version": "3.10.9"
506
  }
507
  },
508
  "nbformat": 4,
 
2
  "cells": [
3
  {
4
  "cell_type": "code",
5
+ "execution_count": 2,
6
  "id": "cb5d0890-3f2d-4020-8270-f3a9bb9f63c6",
7
+ "metadata": {
8
+ "scrolled": true
9
+ },
10
+ "outputs": [
11
+ {
12
+ "name": "stdout",
13
+ "output_type": "stream",
14
+ "text": [
15
+ "Looking in indexes: https://pypi.org/simple, https://download.pytorch.org/whl/cu116\n",
16
+ "Requirement already satisfied: torch==1.13.1 in /usr/local/lib/python3.10/dist-packages (1.13.1+cu117)\n",
17
+ "Requirement already satisfied: torchaudio==0.13.1 in /usr/local/lib/python3.10/dist-packages (0.13.1+cu117)\n",
18
+ "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch==1.13.1) (4.7.1)\n"
19
+ ]
20
+ },
21
+ {
22
+ "name": "stderr",
23
+ "output_type": "stream",
24
+ "text": [
25
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
26
+ "\n",
27
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
28
+ "[notice] To update, run: python -m pip install --upgrade pip\n"
29
+ ]
30
+ },
31
+ {
32
+ "name": "stdout",
33
+ "output_type": "stream",
34
+ "text": [
35
+ "Requirement already satisfied: torchmetrics==0.11.1 in /usr/local/lib/python3.10/dist-packages (0.11.1)\n",
36
+ "Requirement already satisfied: numpy>=1.17.2 in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (1.24.4)\n",
37
+ "Requirement already satisfied: torch>=1.8.1 in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (1.13.1+cu117)\n",
38
+ "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (23.1)\n",
39
+ "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch>=1.8.1->torchmetrics==0.11.1) (4.7.1)\n"
40
+ ]
41
+ },
42
+ {
43
+ "name": "stderr",
44
+ "output_type": "stream",
45
+ "text": [
46
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
47
+ "\n",
48
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
49
+ "[notice] To update, run: python -m pip install --upgrade pip\n"
50
+ ]
51
+ },
52
+ {
53
+ "name": "stdout",
54
+ "output_type": "stream",
55
+ "text": [
56
+ "Requirement already satisfied: librosa in /usr/local/lib/python3.10/dist-packages (0.10.1)\n",
57
+ "Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (3.8.0)\n",
58
+ "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from librosa) (3.0.0)\n",
59
+ "Requirement already satisfied: numpy!=1.22.0,!=1.22.1,!=1.22.2,>=1.20.3 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.24.4)\n",
60
+ "Requirement already satisfied: scipy>=1.2.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.11.2)\n",
61
+ "Requirement already satisfied: scikit-learn>=0.20.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.3.0)\n",
62
+ "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.3.2)\n",
63
+ "Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (5.1.1)\n",
64
+ "Requirement already satisfied: numba>=0.51.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.57.1)\n",
65
+ "Requirement already satisfied: soundfile>=0.12.1 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.12.1)\n",
66
+ "Requirement already satisfied: pooch>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.7.0)\n",
67
+ "Requirement already satisfied: soxr>=0.3.2 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.3.6)\n",
68
+ "Requirement already satisfied: typing-extensions>=4.1.1 in /usr/local/lib/python3.10/dist-packages (from librosa) (4.7.1)\n",
69
+ "Requirement already satisfied: lazy-loader>=0.1 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.3)\n",
70
+ "Requirement already satisfied: msgpack>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.0.5)\n",
71
+ "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (1.1.1)\n",
72
+ "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (0.11.0)\n",
73
+ "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (4.42.1)\n",
74
+ "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (1.4.5)\n",
75
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (23.1)\n",
76
+ "Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (10.0.0)\n",
77
+ "Requirement already satisfied: pyparsing>=2.3.1 in /usr/lib/python3/dist-packages (from matplotlib) (2.4.7)\n",
78
+ "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (2.8.2)\n",
79
+ "Requirement already satisfied: llvmlite<0.41,>=0.40.0dev0 in /usr/local/lib/python3.10/dist-packages (from numba>=0.51.0->librosa) (0.40.1)\n",
80
+ "Requirement already satisfied: platformdirs>=2.5.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.0->librosa) (3.8.1)\n",
81
+ "Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.0->librosa) (2.31.0)\n",
82
+ "Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.7->matplotlib) (1.16.0)\n",
83
+ "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.20.0->librosa) (3.2.0)\n",
84
+ "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from soundfile>=0.12.1->librosa) (1.15.1)\n",
85
+ "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->soundfile>=0.12.1->librosa) (2.21)\n",
86
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.2.0)\n",
87
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.4)\n",
88
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (1.26.16)\n",
89
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2023.5.7)\n"
90
+ ]
91
+ },
92
+ {
93
+ "name": "stderr",
94
+ "output_type": "stream",
95
+ "text": [
96
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
97
+ "\n",
98
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
99
+ "[notice] To update, run: python -m pip install --upgrade pip\n"
100
+ ]
101
+ },
102
+ {
103
+ "name": "stdout",
104
+ "output_type": "stream",
105
+ "text": [
106
+ "Reading package lists...\n",
107
+ "Building dependency tree...\n",
108
+ "Reading state information...\n"
109
+ ]
110
+ },
111
+ {
112
+ "name": "stderr",
113
+ "output_type": "stream",
114
+ "text": [
115
+ "E: Unable to locate package espeak-ng\n"
116
+ ]
117
+ },
118
+ {
119
+ "name": "stdout",
120
+ "output_type": "stream",
121
+ "text": [
122
+ "Requirement already satisfied: phonemizer==3.2.1 in /usr/local/lib/python3.10/dist-packages (3.2.1)\n",
123
+ "Requirement already satisfied: pypinyin==0.48.0 in /usr/local/lib/python3.10/dist-packages (0.48.0)\n",
124
+ "Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (1.3.2)\n",
125
+ "Requirement already satisfied: segments in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (2.2.1)\n",
126
+ "Requirement already satisfied: attrs>=18.1 in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (23.1.0)\n",
127
+ "Requirement already satisfied: dlinfo in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (1.2.1)\n",
128
+ "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (4.7.1)\n",
129
+ "Requirement already satisfied: clldutils>=1.7.3 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (3.20.0)\n",
130
+ "Requirement already satisfied: csvw>=1.5.6 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (3.1.3)\n",
131
+ "Requirement already satisfied: regex in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (2023.8.8)\n",
132
+ "Requirement already satisfied: python-dateutil in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.8.2)\n",
133
+ "Requirement already satisfied: tabulate>=0.7.7 in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (0.9.0)\n",
134
+ "Requirement already satisfied: colorlog in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (6.7.0)\n",
135
+ "Requirement already satisfied: pylatexenc in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.10)\n",
136
+ "Requirement already satisfied: markdown in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (3.4.4)\n",
137
+ "Requirement already satisfied: lxml in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (4.9.3)\n",
138
+ "Requirement already satisfied: markupsafe in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.1.3)\n",
139
+ "Requirement already satisfied: babel in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (2.12.1)\n",
140
+ "Requirement already satisfied: colorama in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (0.4.6)\n",
141
+ "Requirement already satisfied: isodate in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (0.6.1)\n",
142
+ "Requirement already satisfied: jsonschema in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (4.18.0)\n",
143
+ "Requirement already satisfied: language-tags in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (1.2.0)\n",
144
+ "Requirement already satisfied: rdflib in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (7.0.0)\n",
145
+ "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (2.31.0)\n",
146
+ "Requirement already satisfied: rfc3986<2 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (1.5.0)\n",
147
+ "Requirement already satisfied: uritemplate>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (4.1.1)\n",
148
+ "Requirement already satisfied: six in /usr/lib/python3/dist-packages (from isodate->csvw>=1.5.6->segments->phonemizer==3.2.1) (1.16.0)\n",
149
+ "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (2023.6.1)\n",
150
+ "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (0.29.1)\n",
151
+ "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (0.8.10)\n",
152
+ "Requirement already satisfied: pyparsing<4,>=2.1.0 in /usr/lib/python3/dist-packages (from rdflib->csvw>=1.5.6->segments->phonemizer==3.2.1) (2.4.7)\n",
153
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (3.2.0)\n",
154
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (3.4)\n",
155
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (1.26.16)\n",
156
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (2023.5.7)\n"
157
+ ]
158
+ },
159
+ {
160
+ "name": "stderr",
161
+ "output_type": "stream",
162
+ "text": [
163
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
164
+ "\n",
165
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
166
+ "[notice] To update, run: python -m pip install --upgrade pip\n"
167
+ ]
168
+ },
169
+ {
170
+ "name": "stdout",
171
+ "output_type": "stream",
172
+ "text": [
173
+ "Requirement already satisfied: lhotse in /usr/local/lib/python3.10/dist-packages (1.16.0)\n",
174
+ "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from lhotse) (3.0.0)\n",
175
+ "Requirement already satisfied: SoundFile>=0.10 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.12.1)\n",
176
+ "Requirement already satisfied: click>=7.1.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (8.1.7)\n",
177
+ "Requirement already satisfied: cytoolz>=0.10.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.12.2)\n",
178
+ "Requirement already satisfied: dataclasses in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.6)\n",
179
+ "Requirement already satisfied: intervaltree>=3.1.0 in /usr/local/lib/python3.10/dist-packages (from lhotse) (3.1.0)\n",
180
+ "Requirement already satisfied: numpy>=1.18.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (1.24.4)\n",
181
+ "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from lhotse) (23.1)\n",
182
+ "Requirement already satisfied: pyyaml>=5.3.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (6.0)\n",
183
+ "Requirement already satisfied: tabulate>=0.8.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.9.0)\n",
184
+ "Requirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from lhotse) (4.66.1)\n",
185
+ "Requirement already satisfied: lilcom>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from lhotse) (1.7)\n",
186
+ "Requirement already satisfied: toolz>=0.8.0 in /usr/local/lib/python3.10/dist-packages (from cytoolz>=0.10.1->lhotse) (0.12.0)\n",
187
+ "Requirement already satisfied: sortedcontainers<3.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from intervaltree>=3.1.0->lhotse) (2.4.0)\n",
188
+ "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from SoundFile>=0.10->lhotse) (1.15.1)\n",
189
+ "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->SoundFile>=0.10->lhotse) (2.21)\n"
190
+ ]
191
+ },
192
+ {
193
+ "name": "stderr",
194
+ "output_type": "stream",
195
+ "text": [
196
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
197
+ "\n",
198
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
199
+ "[notice] To update, run: python -m pip install --upgrade pip\n"
200
+ ]
201
+ },
202
+ {
203
+ "name": "stdout",
204
+ "output_type": "stream",
205
+ "text": [
206
+ "Collecting k2==1.23.4.dev20230224+cuda11.7.torch1.13.1\n",
207
+ " Downloading https://huggingface.co/csukuangfj/k2/resolve/main/cuda/k2-1.23.4.dev20230224+cuda11.7.torch1.13.1-cp310-cp310-linux_x86_64.whl (103.1 MB)\n",
208
+ "\u001b[2K ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 103.1/103.1 MB 29.2 MB/s eta 0:00:00\n",
209
+ "\u001b[?25hRequirement already satisfied: torch==1.13.1 in /usr/local/lib/python3.10/dist-packages (from k2==1.23.4.dev20230224+cuda11.7.torch1.13.1) (1.13.1+cu117)\n",
210
+ "Requirement already satisfied: graphviz in /usr/local/lib/python3.10/dist-packages (from k2==1.23.4.dev20230224+cuda11.7.torch1.13.1) (0.20.1)\n",
211
+ "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch==1.13.1->k2==1.23.4.dev20230224+cuda11.7.torch1.13.1) (4.7.1)\n"
212
+ ]
213
+ },
214
+ {
215
+ "name": "stderr",
216
+ "output_type": "stream",
217
+ "text": [
218
+ "WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\n",
219
+ "\n",
220
+ "[notice] A new release of pip is available: 23.1.2 -> 23.2.1\n",
221
+ "[notice] To update, run: python -m pip install --upgrade pip\n",
222
+ "mkdir: cannot create directory ‘tmp’: File exists\n",
223
+ "Cloning into 'icefall'...\n",
224
+ "fetch-pack: unexpected disconnect while reading sideband packet\n"
225
+ ]
226
+ },
227
+ {
228
+ "name": "stdout",
229
+ "output_type": "stream",
230
+ "text": [
231
+ "Process is interrupted.\n"
232
+ ]
233
+ }
234
+ ],
235
  "source": [
236
+ "%%bash\n",
237
+ "# install the vall-e and required libraries\n",
238
  "# PyTorch\n",
239
  "pip install torch==1.13.1 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116\n",
240
  "pip install torchmetrics==0.11.1\n",
241
  "# fbank\n",
242
+ "pip install librosa matplotlib\n",
243
  "\n",
244
  "# phonemizer pypinyin\n",
245
+ "# refresh the package lists first; on a fresh container apt cannot locate espeak-ng otherwise\n",
+ "apt-get update && apt-get install -y espeak-ng\n",
246
  "## OSX: brew install espeak\n",
247
  "pip install phonemizer==3.2.1 pypinyin==0.48.0\n",
248
  "\n",
 
 
 
 
249
  "pip install lhotse\n",
250
  "\n",
251
  "# k2\n",
252
  "# find the right version in https://huggingface.co/csukuangfj/k2\n",
253
+ "pip install https://huggingface.co/csukuangfj/k2/resolve/main/cuda/k2-1.23.4.dev20230224+cuda11.7.torch1.13.1-cp310-cp310-linux_x86_64.whl\n",
254
+ "# -p: do not fail when tmp/ is left over from a previous run of this cell\n",
+ "mkdir -p tmp\n",
255
  "\n",
 
256
  "git clone https://github.com/k2-fsa/icefall\n",
257
+ "mv icefall tmp\n",
258
+ "cd tmp/icefall\n",
259
  "pip install -r requirements.txt\n",
260
+ "pip install -e .\n",
261
  "export PYTHONPATH=`pwd`/../icefall:$PYTHONPATH\n",
262
  "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.zshrc\n",
263
  "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.bashrc\n",
264
+ "cd ../..\n",
265
  "source ~/.zshrc\n",
266
+ "source ~/.bashrc\n",
267
  "\n",
268
+ "\n",
269
+ "git clone https://github.com/lifeiteng/vall-e\n",
270
+ "mv vall-e tmp\n",
271
+ "cd tmp/vall-e\n",
272
+ "pip install -e .\n",
273
+ "\n",
274
+ "pip install vocos"
275
+ ]
276
+ },
277
+ {
278
+ "cell_type": "code",
279
+ "execution_count": 2,
280
+ "id": "fc4f7f9d-235b-4dd5-9384-42c3f6c65428",
281
+ "metadata": {
282
+ "scrolled": true
283
+ },
284
+ "outputs": [
285
+ {
286
+ "name": "stdout",
287
+ "output_type": "stream",
288
+ "text": [
289
+ "--2023-09-21 06:28:48-- https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/vall-e_ko_v0.pt\n",
290
+ "Resolving huggingface.co (huggingface.co)... 13.32.110.77, 13.32.110.109, 13.32.110.28, ...\n",
291
+ "Connecting to huggingface.co (huggingface.co)|13.32.110.77|:443... connected.\n",
292
+ "HTTP request sent, awaiting response... 302 Found\n",
293
+ "Location: https://cdn-lfs.huggingface.co/repos/f8/b9/f8b90061950052a23944dd83f71a6f031a5d39c73dbb799693620ca8a4186a97/e2894775b160c24132f8f6d6d7df6cc8bf59a9b465778d08989e200859610560?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27vall-e_ko_v0.pt%3B+filename%3D%22vall-e_ko_v0.pt%22%3B&Expires=1695536928&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NTUzNjkyOH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9mOC9iOS9mOGI5MDA2MTk1MDA1MmEyMzk0NGRkODNmNzFhNmYwMzFhNWQzOWM3M2RiYjc5OTY5MzYyMGNhOGE0MTg2YTk3L2UyODk0Nzc1YjE2MGMyNDEzMmY4ZjZkNmQ3ZGY2Y2M4YmY1OWE5YjQ2NTc3OGQwODk4OWUyMDA4NTk2MTA1NjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=EjVtvNUk%7E2tZyrflILNnAD6w-KTF1ymHSkMz%7EicG8YD05s8KvFGPJfmidMFLduH2RIPlzyucFCL7Nu3ncreEiQcyPaIcVVLW7dCzOktXKevQ9dRTeSTSOtyWe17lHT0SwQ8JTYH2DNydvYQXtf%7E6iaInP%7EINwzdlmYkxBW6pgKycakZliLgw0UmyfOY2IX424uNozaqKWhCfAB7EqBLsmfxXnRZtGrtrch78YK3FkowE5iQj0Gt87AwAEg30aOrSqLv7wmplMBiu8GegaUa40wWqH9AjuB1eeYvdkoMtt3eBEmzYXXMkd3xtY5E6aRGgwQepf4%7EeEsxuyNHvA%7EZpTA__&Key-Pair-Id=KVTP0A1DKRTAX [following]\n",
294
+ "--2023-09-21 06:28:48-- https://cdn-lfs.huggingface.co/repos/f8/b9/f8b90061950052a23944dd83f71a6f031a5d39c73dbb799693620ca8a4186a97/e2894775b160c24132f8f6d6d7df6cc8bf59a9b465778d08989e200859610560?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27vall-e_ko_v0.pt%3B+filename%3D%22vall-e_ko_v0.pt%22%3B&Expires=1695536928&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NTUzNjkyOH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9mOC9iOS9mOGI5MDA2MTk1MDA1MmEyMzk0NGRkODNmNzFhNmYwMzFhNWQzOWM3M2RiYjc5OTY5MzYyMGNhOGE0MTg2YTk3L2UyODk0Nzc1YjE2MGMyNDEzMmY4ZjZkNmQ3ZGY2Y2M4YmY1OWE5YjQ2NTc3OGQwODk4OWUyMDA4NTk2MTA1NjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=EjVtvNUk%7E2tZyrflILNnAD6w-KTF1ymHSkMz%7EicG8YD05s8KvFGPJfmidMFLduH2RIPlzyucFCL7Nu3ncreEiQcyPaIcVVLW7dCzOktXKevQ9dRTeSTSOtyWe17lHT0SwQ8JTYH2DNydvYQXtf%7E6iaInP%7EINwzdlmYkxBW6pgKycakZliLgw0UmyfOY2IX424uNozaqKWhCfAB7EqBLsmfxXnRZtGrtrch78YK3FkowE5iQj0Gt87AwAEg30aOrSqLv7wmplMBiu8GegaUa40wWqH9AjuB1eeYvdkoMtt3eBEmzYXXMkd3xtY5E6aRGgwQepf4%7EeEsxuyNHvA%7EZpTA__&Key-Pair-Id=KVTP0A1DKRTAX\n",
295
+ "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 18.66.122.69, 18.66.122.21, 18.66.122.62, ...\n",
296
+ "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|18.66.122.69|:443... connected.\n",
297
+ "HTTP request sent, awaiting response... 200 OK\n",
298
+ "Length: 2699959616 (2.5G) [binary/octet-stream]\n",
299
+ "Saving to: ‘vall-e_ko_v0.pt’\n",
300
+ "\n",
301
+ "vall-e_ko_v0.pt 100%[===================>] 2.51G 55.9MB/s in 48s \n",
302
+ "\n",
303
+ "2023-09-21 06:29:36 (53.4 MB/s) - ‘vall-e_ko_v0.pt’ saved [2699959616/2699959616]\n",
304
+ "\n",
305
+ "--2023-09-21 06:29:36-- https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/unique_text_tokens.k2symbols\n",
306
+ "Resolving huggingface.co (huggingface.co)... 13.32.110.77, 13.32.110.109, 13.32.110.28, ...\n",
307
+ "Connecting to huggingface.co (huggingface.co)|13.32.110.77|:443... connected.\n",
308
+ "HTTP request sent, awaiting response... 200 OK\n",
309
+ "Length: 3238 (3.2K) [text/plain]\n",
310
+ "Saving to: ‘unique_text_tokens.k2symbols’\n",
311
+ "\n",
312
+ "unique_text_tokens. 100%[===================>] 3.16K --.-KB/s in 0s \n",
313
+ "\n",
314
+ "2023-09-21 06:29:37 (2.02 GB/s) - ‘unique_text_tokens.k2symbols’ saved [3238/3238]\n",
315
+ "\n"
316
+ ]
317
+ }
318
+ ],
319
+ "source": [
320
+ "# -c resumes a partial download and skips a complete one, so re-running does not fetch 2.5 GB again or leave a '.1' duplicate\n",
+ "!wget -c https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/vall-e_ko_v0.pt\n",
321
+ "!wget -nc https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/unique_text_tokens.k2symbols"
322
  ]
323
  },
324
  {
 
328
  "metadata": {},
329
  "outputs": [
330
  {
331
+ "name": "stdout",
332
  "output_type": "stream",
333
  "text": [
334
+ "Use 32 cpu cores for computing\n"
 
335
  ]
336
  },
337
  {
338
+ "name": "stderr",
339
  "output_type": "stream",
340
  "text": [
341
+ "Downloading: \"https://dl.fbaipublicfiles.com/encodec/v0/encodec_24khz-d7cc33bc.th\" to /root/.cache/torch/hub/checkpoints/encodec_24khz-d7cc33bc.th\n"
 
342
  ]
343
+ },
344
+ {
345
+ "data": {
346
+ "application/vnd.jupyter.widget-view+json": {
347
+ "model_id": "57d28016d2664410925e41c812bddbca",
348
+ "version_major": 2,
349
+ "version_minor": 0
350
+ },
351
+ "text/plain": [
352
+ " 0%| | 0.00/88.9M [00:00<?, ?B/s]"
353
+ ]
354
+ },
355
+ "metadata": {},
356
+ "output_type": "display_data"
357
+ },
358
+ {
359
+ "data": {
360
+ "application/vnd.jupyter.widget-view+json": {
361
+ "model_id": "c0cc48c2c58b45db90b76ed142bec40d",
362
+ "version_major": 2,
363
+ "version_minor": 0
364
+ },
365
+ "text/plain": [
366
+ "Downloading (…)lve/main/config.yaml: 0%| | 0.00/503 [00:00<?, ?B/s]"
367
+ ]
368
+ },
369
+ "metadata": {},
370
+ "output_type": "display_data"
371
+ },
372
+ {
373
+ "data": {
374
+ "application/vnd.jupyter.widget-view+json": {
375
+ "model_id": "e777aaf1ff994a1aab7befed6600df09",
376
+ "version_major": 2,
377
+ "version_minor": 0
378
+ },
379
+ "text/plain": [
380
+ "Downloading pytorch_model.bin: 0%| | 0.00/40.4M [00:00<?, ?B/s]"
381
+ ]
382
+ },
383
+ "metadata": {},
384
+ "output_type": "display_data"
385
  }
386
  ],
387
  "source": [
 
403
  " AudioTokenizer,\n",
404
  " TextTokenizer,\n",
405
  " tokenize_audio,\n",
406
+ " tokenize_text\n",
407
  ")\n",
408
  "from icefall.utils import AttributeDict\n",
409
  "from valle.data.collation import get_text_token_collater\n",
 
491
  },
492
  {
493
  "cell_type": "code",
494
+ "execution_count": null,
495
  "id": "41e40fe5-595e-4f9a-8dd7-dfda52944529",
496
  "metadata": {},
497
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
498
  "source": [
499
  "text_prompt = '' # text of the audio \n",
500
  "audio_prompt = '' # path to the audio file\n",
 
527
  "execution_count": 3,
528
  "id": "723c13c7-36f5-4af6-bc0b-bbf6d65c2e3a",
529
  "metadata": {
530
+ "scrolled": true,
 
 
 
531
  "tags": []
532
  },
533
  "outputs": [
 
535
  "name": "stdout",
536
  "output_type": "stream",
537
  "text": [
538
+ "Collecting gradio\n",
539
+ " Downloading gradio-3.44.4-py3-none-any.whl (20.2 MB)\n",
540
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m20.2/20.2 MB\u001b[0m \u001b[31m12.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
541
+ "\u001b[?25hCollecting aiofiles<24.0,>=22.0 (from gradio)\n",
542
+ " Downloading aiofiles-23.2.1-py3-none-any.whl (15 kB)\n",
543
+ "Collecting altair<6.0,>=4.2.0 (from gradio)\n",
544
+ " Downloading altair-5.1.1-py3-none-any.whl (520 kB)\n",
545
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m520.6/520.6 kB\u001b[0m \u001b[31m16.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
546
+ "\u001b[?25hCollecting fastapi (from gradio)\n",
547
+ " Downloading fastapi-0.103.1-py3-none-any.whl (66 kB)\n",
548
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m66.2/66.2 kB\u001b[0m \u001b[31m19.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
549
+ "\u001b[?25hCollecting ffmpy (from gradio)\n",
550
+ " Downloading ffmpy-0.3.1.tar.gz (5.5 kB)\n",
551
+ " Preparing metadata (setup.py) ... \u001b[?25ldone\n",
552
+ "\u001b[?25hCollecting gradio-client==0.5.1 (from gradio)\n",
553
+ " Downloading gradio_client-0.5.1-py3-none-any.whl (298 kB)\n",
554
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m298.2/298.2 kB\u001b[0m \u001b[31m22.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
555
+ "\u001b[?25hCollecting httpx (from gradio)\n",
556
+ " Downloading httpx-0.25.0-py3-none-any.whl (75 kB)\n",
557
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m75.7/75.7 kB\u001b[0m \u001b[31m23.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
558
+ "\u001b[?25hRequirement already satisfied: huggingface-hub>=0.14.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (0.17.2)\n",
559
+ "Collecting importlib-resources<7.0,>=1.3 (from gradio)\n",
560
+ " Downloading importlib_resources-6.1.0-py3-none-any.whl (33 kB)\n",
561
+ "Requirement already satisfied: jinja2<4.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (3.1.2)\n",
562
+ "Requirement already satisfied: markupsafe~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (2.1.3)\n",
563
+ "Requirement already satisfied: matplotlib~=3.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (3.8.0)\n",
564
+ "Requirement already satisfied: numpy~=1.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (1.24.4)\n",
565
+ "Collecting orjson~=3.0 (from gradio)\n",
566
+ " Downloading orjson-3.9.7-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (138 kB)\n",
567
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m138.7/138.7 kB\u001b[0m \u001b[31m35.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
568
+ "\u001b[?25hRequirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from gradio) (23.1)\n",
569
+ "Collecting pandas<3.0,>=1.0 (from gradio)\n",
570
+ " Downloading pandas-2.1.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (12.3 MB)\n",
571
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m12.3/12.3 MB\u001b[0m \u001b[31m16.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
572
+ "\u001b[?25hRequirement already satisfied: pillow<11.0,>=8.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (10.0.0)\n",
573
+ "Collecting pydantic!=1.8,!=1.8.1,!=2.0.0,!=2.0.1,<3.0.0,>=1.7.4 (from gradio)\n",
574
+ " Downloading pydantic-2.3.0-py3-none-any.whl (374 kB)\n",
575
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m374.5/374.5 kB\u001b[0m \u001b[31m26.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
576
+ "\u001b[?25hCollecting pydub (from gradio)\n",
577
+ " Downloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n",
578
+ "Collecting python-multipart (from gradio)\n",
579
+ " Downloading python_multipart-0.0.6-py3-none-any.whl (45 kB)\n",
580
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.7/45.7 kB\u001b[0m \u001b[31m17.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
581
+ "\u001b[?25hRequirement already satisfied: pyyaml<7.0,>=5.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (6.0)\n",
582
+ "Requirement already satisfied: requests~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (2.31.0)\n",
583
+ "Collecting semantic-version~=2.0 (from gradio)\n",
584
+ " Downloading semantic_version-2.10.0-py2.py3-none-any.whl (15 kB)\n",
585
+ "Requirement already satisfied: typing-extensions~=4.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (4.7.1)\n",
586
+ "Collecting uvicorn>=0.14.0 (from gradio)\n",
587
+ " Downloading uvicorn-0.23.2-py3-none-any.whl (59 kB)\n",
588
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m59.5/59.5 kB\u001b[0m \u001b[31m22.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
589
+ "\u001b[?25hCollecting websockets<12.0,>=10.0 (from gradio)\n",
590
+ " Downloading websockets-11.0.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (129 kB)\n",
591
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.9/129.9 kB\u001b[0m \u001b[31m45.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
592
+ "\u001b[?25hRequirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from gradio-client==0.5.1->gradio) (2023.9.1)\n",
593
+ "Requirement already satisfied: jsonschema>=3.0 in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio) (4.18.0)\n",
594
+ "Requirement already satisfied: toolz in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio) (0.12.0)\n",
595
+ "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.14.0->gradio) (3.12.4)\n",
596
+ "Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.14.0->gradio) (4.66.1)\n",
597
+ "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (1.1.1)\n",
598
+ "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (0.11.0)\n",
599
+ "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (4.42.1)\n",
600
+ "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (1.4.5)\n",
601
+ "Requirement already satisfied: pyparsing>=2.3.1 in /usr/lib/python3/dist-packages (from matplotlib~=3.0->gradio) (2.4.7)\n",
602
+ "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (2.8.2)\n",
603
+ "Collecting pytz>=2020.1 (from pandas<3.0,>=1.0->gradio)\n",
604
+ " Downloading pytz-2023.3.post1-py2.py3-none-any.whl (502 kB)\n",
605
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m502.5/502.5 kB\u001b[0m \u001b[31m23.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
606
+ "\u001b[?25hCollecting tzdata>=2022.1 (from pandas<3.0,>=1.0->gradio)\n",
607
+ " Downloading tzdata-2023.3-py2.py3-none-any.whl (341 kB)\n",
608
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━��━━━━━━━━━━━━━━━\u001b[0m \u001b[32m341.8/341.8 kB\u001b[0m \u001b[31m20.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
609
+ "\u001b[?25hCollecting annotated-types>=0.4.0 (from pydantic!=1.8,!=1.8.1,!=2.0.0,!=2.0.1,<3.0.0,>=1.7.4->gradio)\n",
610
+ " Downloading annotated_types-0.5.0-py3-none-any.whl (11 kB)\n",
611
+ "Collecting pydantic-core==2.6.3 (from pydantic!=1.8,!=1.8.1,!=2.0.0,!=2.0.1,<3.0.0,>=1.7.4->gradio)\n",
612
+ " Downloading pydantic_core-2.6.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.9 MB)\n",
613
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.9/1.9 MB\u001b[0m \u001b[31m10.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m00:01\u001b[0m00:01\u001b[0m\n",
614
+ "\u001b[?25hRequirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (3.2.0)\n",
615
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (3.4)\n",
616
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (1.26.16)\n",
617
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (2023.5.7)\n",
618
+ "Requirement already satisfied: click>=7.0 in /usr/local/lib/python3.10/dist-packages (from uvicorn>=0.14.0->gradio) (8.1.7)\n",
619
+ "Collecting h11>=0.8 (from uvicorn>=0.14.0->gradio)\n",
620
+ " Downloading h11-0.14.0-py3-none-any.whl (58 kB)\n",
621
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.3/58.3 kB\u001b[0m \u001b[31m18.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
622
+ "\u001b[?25hRequirement already satisfied: anyio<4.0.0,>=3.7.1 in /usr/local/lib/python3.10/dist-packages (from fastapi->gradio) (3.7.1)\n",
623
+ "Collecting starlette<0.28.0,>=0.27.0 (from fastapi->gradio)\n",
624
+ " Downloading starlette-0.27.0-py3-none-any.whl (66 kB)\n",
625
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m67.0/67.0 kB\u001b[0m \u001b[31m24.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
626
+ "\u001b[?25hCollecting httpcore<0.19.0,>=0.18.0 (from httpx->gradio)\n",
627
+ " Downloading httpcore-0.18.0-py3-none-any.whl (76 kB)\n",
628
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m76.0/76.0 kB\u001b[0m \u001b[31m23.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
629
+ "\u001b[?25hRequirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from httpx->gradio) (1.3.0)\n",
630
+ "Requirement already satisfied: exceptiongroup in /usr/local/lib/python3.10/dist-packages (from anyio<4.0.0,>=3.7.1->fastapi->gradio) (1.1.2)\n",
631
+ "Requirement already satisfied: attrs>=22.2.0 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (23.1.0)\n",
632
+ "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (2023.6.1)\n",
633
+ "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (0.29.1)\n",
634
+ "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (0.8.10)\n",
635
+ "Requirement already satisfied: six>=1.5 in /usr/lib/python3/dist-packages (from python-dateutil>=2.7->matplotlib~=3.0->gradio) (1.16.0)\n",
636
+ "Building wheels for collected packages: ffmpy\n",
637
+ " Building wheel for ffmpy (setup.py) ... \u001b[?25ldone\n",
638
+ "\u001b[?25h Created wheel for ffmpy: filename=ffmpy-0.3.1-py3-none-any.whl size=5579 sha256=97b9a5fbfa40c640a1a096fb921cf42f65fb02d09b80a4e8195a50d27270698e\n",
639
+ " Stored in directory: /root/.cache/pip/wheels/01/a6/d1/1c0828c304a4283b2c1639a09ad86f83d7c487ef34c6b4a1bf\n",
640
+ "Successfully built ffmpy\n",
641
+ "Installing collected packages: pytz, pydub, ffmpy, websockets, tzdata, semantic-version, python-multipart, pydantic-core, orjson, importlib-resources, h11, annotated-types, aiofiles, uvicorn, starlette, pydantic, pandas, httpcore, httpx, fastapi, gradio-client, altair, gradio\n",
642
+ "Successfully installed aiofiles-23.2.1 altair-5.1.1 annotated-types-0.5.0 fastapi-0.103.1 ffmpy-0.3.1 gradio-3.44.4 gradio-client-0.5.1 h11-0.14.0 httpcore-0.18.0 httpx-0.25.0 importlib-resources-6.1.0 orjson-3.9.7 pandas-2.1.1 pydantic-2.3.0 pydantic-core-2.6.3 pydub-0.25.1 python-multipart-0.0.6 pytz-2023.3.post1 semantic-version-2.10.0 starlette-0.27.0 tzdata-2023.3 uvicorn-0.23.2 websockets-11.0.3\n",
643
+ "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\n",
644
  "\u001b[0m\n",
645
+ "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.1.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m23.2.1\u001b[0m\n",
646
  "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpython -m pip install --upgrade pip\u001b[0m\n"
647
  ]
648
  }
 
662
  "output_type": "stream",
663
  "text": [
664
  "Running on local URL: http://127.0.0.1:7860\n",
665
+ "Running on public URL: https://e3c6ff480c5537ff44.gradio.live\n",
666
  "\n",
667
+ "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n"
668
  ]
669
  },
670
  {
671
  "data": {
672
  "text/html": [
673
+ "<div><iframe src=\"https://e3c6ff480c5537ff44.gradio.live\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
674
  ],
675
  "text/plain": [
676
  "<IPython.core.display.HTML object>"
 
686
  "execution_count": 4,
687
  "metadata": {},
688
  "output_type": "execute_result"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
689
  }
690
  ],
691
  "source": [
 
738
  "name": "python",
739
  "nbconvert_exporter": "python",
740
  "pygments_lexer": "ipython3",
741
+ "version": "3.10.6"
742
  }
743
  },
744
  "nbformat": 4,