update
Browse files
- app.py +10 -10
- bigvgan.py +5 -4
app.py
CHANGED
@@ -275,7 +275,7 @@ with iface:
|
|
275 |
</h1>
|
276 |
</div>
|
277 |
<p style="margin-bottom: 10px; font-size: 125%">
|
278 |
-
<a href="https://arxiv.org/abs/2206.04658">[Paper]</a> <a href="https://github.com/NVIDIA/BigVGAN">[Code]</a> <a href="https://bigvgan-demo.github.io/">[Demo]</a> <a href="https://research.nvidia.com/labs/adlr/projects/bigvgan/">[Project page]</a>
|
279 |
</p>
|
280 |
</div>
|
281 |
"""
|
@@ -362,7 +362,7 @@ with iface:
|
|
362 |
</thead>
|
363 |
<tbody>
|
364 |
<tr>
|
365 |
-
<td>bigvgan_v2_44khz_128band_512x</td>
|
366 |
<td>44 kHz</td>
|
367 |
<td>128</td>
|
368 |
<td>22050</td>
|
@@ -372,7 +372,7 @@ with iface:
|
|
372 |
<td>No</td>
|
373 |
</tr>
|
374 |
<tr>
|
375 |
-
<td>bigvgan_v2_44khz_128band_256x</td>
|
376 |
<td>44 kHz</td>
|
377 |
<td>128</td>
|
378 |
<td>22050</td>
|
@@ -382,7 +382,7 @@ with iface:
|
|
382 |
<td>No</td>
|
383 |
</tr>
|
384 |
<tr>
|
385 |
-
<td>bigvgan_v2_24khz_100band_256x</td>
|
386 |
<td>24 kHz</td>
|
387 |
<td>100</td>
|
388 |
<td>12000</td>
|
@@ -392,7 +392,7 @@ with iface:
|
|
392 |
<td>No</td>
|
393 |
</tr>
|
394 |
<tr>
|
395 |
-
<td>bigvgan_v2_22khz_80band_256x</td>
|
396 |
<td>22 kHz</td>
|
397 |
<td>80</td>
|
398 |
<td>11025</td>
|
@@ -402,7 +402,7 @@ with iface:
|
|
402 |
<td>No</td>
|
403 |
</tr>
|
404 |
<tr>
|
405 |
-
<td>bigvgan_v2_22khz_80band_fmax8k_256x</td>
|
406 |
<td>22 kHz</td>
|
407 |
<td>80</td>
|
408 |
<td>8000</td>
|
@@ -412,7 +412,7 @@ with iface:
|
|
412 |
<td>No</td>
|
413 |
</tr>
|
414 |
<tr>
|
415 |
-
<td>bigvgan_24khz_100band</td>
|
416 |
<td>24 kHz</td>
|
417 |
<td>100</td>
|
418 |
<td>12000</td>
|
@@ -422,7 +422,7 @@ with iface:
|
|
422 |
<td>No</td>
|
423 |
</tr>
|
424 |
<tr>
|
425 |
-
<td>bigvgan_base_24khz_100band</td>
|
426 |
<td>24 kHz</td>
|
427 |
<td>100</td>
|
428 |
<td>12000</td>
|
@@ -432,7 +432,7 @@ with iface:
|
|
432 |
<td>No</td>
|
433 |
</tr>
|
434 |
<tr>
|
435 |
-
<td>bigvgan_22khz_80band</td>
|
436 |
<td>22 kHz</td>
|
437 |
<td>80</td>
|
438 |
<td>8000</td>
|
@@ -442,7 +442,7 @@ with iface:
|
|
442 |
<td>No</td>
|
443 |
</tr>
|
444 |
<tr>
|
445 |
-
<td>bigvgan_base_22khz_80band</td>
|
446 |
<td>22 kHz</td>
|
447 |
<td>80</td>
|
448 |
<td>8000</td>
|
|
|
275 |
</h1>
|
276 |
</div>
|
277 |
<p style="margin-bottom: 10px; font-size: 125%">
|
278 |
+
<a href="https://arxiv.org/abs/2206.04658">[Paper]</a> <a href="https://github.com/NVIDIA/BigVGAN">[Code]</a> <a href="https://bigvgan-demo.github.io/">[Demo]</a> <a href="https://research.nvidia.com/labs/adlr/projects/bigvgan/">[Project page]</a>
|
279 |
</p>
|
280 |
</div>
|
281 |
"""
|
|
|
362 |
</thead>
|
363 |
<tbody>
|
364 |
<tr>
|
365 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_v2_44khz_128band_512x">bigvgan_v2_44khz_128band_512x</a></td>
|
366 |
<td>44 kHz</td>
|
367 |
<td>128</td>
|
368 |
<td>22050</td>
|
|
|
372 |
<td>No</td>
|
373 |
</tr>
|
374 |
<tr>
|
375 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_v2_44khz_128band_256x">bigvgan_v2_44khz_128band_256x</a></td>
|
376 |
<td>44 kHz</td>
|
377 |
<td>128</td>
|
378 |
<td>22050</td>
|
|
|
382 |
<td>No</td>
|
383 |
</tr>
|
384 |
<tr>
|
385 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_v2_24khz_100band_256x">bigvgan_v2_24khz_100band_256x</a></td>
|
386 |
<td>24 kHz</td>
|
387 |
<td>100</td>
|
388 |
<td>12000</td>
|
|
|
392 |
<td>No</td>
|
393 |
</tr>
|
394 |
<tr>
|
395 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_v2_22khz_80band_256x">bigvgan_v2_22khz_80band_256x</a></td>
|
396 |
<td>22 kHz</td>
|
397 |
<td>80</td>
|
398 |
<td>11025</td>
|
|
|
402 |
<td>No</td>
|
403 |
</tr>
|
404 |
<tr>
|
405 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_v2_22khz_80band_fmax8k_256x">bigvgan_v2_22khz_80band_fmax8k_256x</a></td>
|
406 |
<td>22 kHz</td>
|
407 |
<td>80</td>
|
408 |
<td>8000</td>
|
|
|
412 |
<td>No</td>
|
413 |
</tr>
|
414 |
<tr>
|
415 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_24khz_100band">bigvgan_24khz_100band</a></td>
|
416 |
<td>24 kHz</td>
|
417 |
<td>100</td>
|
418 |
<td>12000</td>
|
|
|
422 |
<td>No</td>
|
423 |
</tr>
|
424 |
<tr>
|
425 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_base_24khz_100band">bigvgan_base_24khz_100band</a></td>
|
426 |
<td>24 kHz</td>
|
427 |
<td>100</td>
|
428 |
<td>12000</td>
|
|
|
432 |
<td>No</td>
|
433 |
</tr>
|
434 |
<tr>
|
435 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_22khz_80band">bigvgan_22khz_80band</a></td>
|
436 |
<td>22 kHz</td>
|
437 |
<td>80</td>
|
438 |
<td>8000</td>
|
|
|
442 |
<td>No</td>
|
443 |
</tr>
|
444 |
<tr>
|
445 |
+
<td><a href="https://huggingface.co/nvidia/bigvgan_base_22khz_80band">bigvgan_base_22khz_80band</a></td>
|
446 |
<td>22 kHz</td>
|
447 |
<td>80</td>
|
448 |
<td>8000</td>
|
bigvgan.py
CHANGED
@@ -321,9 +321,10 @@ class BigVGAN(
|
|
321 |
# instantiate BigVGAN using h
|
322 |
##################################################################
|
323 |
if use_cuda_kernel:
|
324 |
-
print(f"[
|
325 |
-
print(f"[
|
326 |
-
|
|
|
327 |
|
328 |
##################################################################
|
329 |
# download and load pretrained generator weight
|
@@ -332,7 +333,7 @@ class BigVGAN(
|
|
332 |
print("Loading weights from local directory")
|
333 |
model_file = os.path.join(model_id, 'bigvgan_generator.pt')
|
334 |
else:
|
335 |
-
print(f"
|
336 |
model_file = hf_hub_download(
|
337 |
repo_id=model_id,
|
338 |
filename='bigvgan_generator.pt',
|
|
|
321 |
# instantiate BigVGAN using h
|
322 |
##################################################################
|
323 |
if use_cuda_kernel:
|
324 |
+
print(f"[WARNING] You have specified use_cuda_kernel=True during BigVGAN.from_pretrained(). Only inference is supported (training is not implemented)!")
|
325 |
+
print(f"[WARNING] You need nvcc and ninja installed in your system that matches your PyTorch build is using to build the kernel. If not, the model will fail to initialize or generate incorrect waveform!")
|
326 |
+
print(f"[WARNING] For detail, see the official GitHub repository: https://github.com/NVIDIA/BigVGAN?tab=readme-ov-file#using-custom-cuda-kernel-for-synthesis")
|
327 |
+
model = cls(h, use_cuda_kernel=use_cuda_kernel)
|
328 |
|
329 |
##################################################################
|
330 |
# download and load pretrained generator weight
|
|
|
333 |
print("Loading weights from local directory")
|
334 |
model_file = os.path.join(model_id, 'bigvgan_generator.pt')
|
335 |
else:
|
336 |
+
print(f"Loading weights from {model_id}")
|
337 |
model_file = hf_hub_download(
|
338 |
repo_id=model_id,
|
339 |
filename='bigvgan_generator.pt',
|