Commit
·
4b5e5e7
1
Parent(s):
cd4126a
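Fix global vars: initialize voicecraft_model, voicecraft_config, and phn2num at module level and declare them global in load_voicecraft() and run()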
Browse files
app.py
CHANGED
@@ -234,6 +234,9 @@ config = Config()
|
|
234 |
logging.getLogger("numba").setLevel(logging.WARNING)
|
235 |
|
236 |
hubert_model = None
|
|
|
|
|
|
|
237 |
|
238 |
def load_hubert():
|
239 |
global hubert_model
|
@@ -256,9 +259,7 @@ def load_hubert():
|
|
256 |
# hubert_model = models[0]
|
257 |
|
258 |
def load_voicecraft():
|
259 |
-
global voicecraft_model
|
260 |
-
global phn2num
|
261 |
-
global voicecraft_config
|
262 |
|
263 |
from lib.voicecraft.models import voicecraft
|
264 |
voicecraft_name = "giga330M.pth"
|
@@ -1493,6 +1494,8 @@ def transcribe_btn_click(audio_choice):
|
|
1493 |
|
1494 |
def run(seed, stop_repetition, sample_batch_size, left_margin, right_margin, codec_audio_sr, codec_sr, top_k, top_p,
|
1495 |
temperature, kvcache, cutoff_value, target_transcript, silence_tokens, transcribed_text):
|
|
|
|
|
1496 |
os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
|
1497 |
os.environ["CUDA_VISIBLE_DEVICES"] = "0"
|
1498 |
# take a look at demo/temp/mfa_alignment, decide which part of the audio to use as prompt
|
|
|
234 |
logging.getLogger("numba").setLevel(logging.WARNING)
|
235 |
|
236 |
hubert_model = None
|
237 |
+
voicecraft_model = None
|
238 |
+
voicecraft_config = None
|
239 |
+
phn2num = None
|
240 |
|
241 |
def load_hubert():
|
242 |
global hubert_model
|
|
|
259 |
# hubert_model = models[0]
|
260 |
|
261 |
def load_voicecraft():
|
262 |
+
global voicecraft_model, phn2num, voicecraft_config
|
|
|
|
|
263 |
|
264 |
from lib.voicecraft.models import voicecraft
|
265 |
voicecraft_name = "giga330M.pth"
|
|
|
1494 |
|
1495 |
def run(seed, stop_repetition, sample_batch_size, left_margin, right_margin, codec_audio_sr, codec_sr, top_k, top_p,
|
1496 |
temperature, kvcache, cutoff_value, target_transcript, silence_tokens, transcribed_text):
|
1497 |
+
global voicecraft_model, voicecraft_config, phn2num
|
1498 |
+
|
1499 |
os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
|
1500 |
os.environ["CUDA_VISIBLE_DEVICES"] = "0"
|
1501 |
# take a look at demo/temp/mfa_alignment, decide which part of the audio to use as prompt
|