Omnibus committed on
Commit
d10d42c
1 Parent(s): 3f1c26e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -4
app.py CHANGED
@@ -2,6 +2,7 @@ import gradio as gr
2
  import torch
3
  from transformers import AutoProcessor, BarkModel
4
  import scipy
 
5
 
6
 
7
  # device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -34,15 +35,23 @@ def run_bark(text, n, lang):
34
  scipy.io.wavfile.write("bark_out.wav", rate=sampling_rate, data=speech_values.cpu().numpy().squeeze())
35
  return ("bark_out.wav")
36
 
 
 
 
 
 
 
37
  with gr.Blocks() as app:
38
  with gr.Column():
39
  in_text = gr.Textbox()
40
  with gr.Tab("Default"):
41
- speaker_num = gr.Dropdown(label="Speaker Voice", choices=num_list,value="1")
42
- speaker_lang = gr.Dropdown(label="Speaker Language", choices=lang_list,value="en")
 
43
  with gr.Tab("Upload"):
44
- in_aud_mic = gr.Audio(source='microphone')
45
- in_aud_file = gr.Audio(source='upload')
 
46
  in_aud_yout = gr.Textbox(label="YouTube URL")
47
  yout_vid = gr.Video()
48
  #speaker_num = gr.Number(value=0)
 
2
  import torch
3
  from transformers import AutoProcessor, BarkModel
4
  import scipy
5
+ from pytube import YouTube
6
 
7
 
8
  # device = "cuda" if torch.cuda.is_available() else "cpu"
 
35
  scipy.io.wavfile.write("bark_out.wav", rate=sampling_rate, data=speech_values.cpu().numpy().squeeze())
36
  return ("bark_out.wav")
37
 
38
+ def load_video_yt(vid):
39
+ yt = YouTube(vid)
40
+ vid = yt.streams.filter(progressive=True, file_extension='mp4').order_by('resolution').desc().first().download(filename="tmp.mp4")
41
+ vid_aud = yt.streams.filter(only_audio=True)[0].download(filename="tmp_aud.mp3")
42
+ return vid, vid_aud
43
+
44
  with gr.Blocks() as app:
45
  with gr.Column():
46
  in_text = gr.Textbox()
47
  with gr.Tab("Default"):
48
+ with gr.Row():
49
+ speaker_num = gr.Dropdown(label="Speaker Voice", choices=num_list,value="1")
50
+ speaker_lang = gr.Dropdown(label="Speaker Language", choices=lang_list,value="en")
51
  with gr.Tab("Upload"):
52
+ with gr.Row():
53
+ in_aud_mic = gr.Audio(source='microphone')
54
+ in_aud_file = gr.Audio(source='upload')
55
  in_aud_yout = gr.Textbox(label="YouTube URL")
56
  yout_vid = gr.Video()
57
  #speaker_num = gr.Number(value=0)