Spaces:
Running
on
A10G
Running
on
A10G
File size: 1,122 Bytes
96ea36d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
import os
import argparse
from VoiceParser.model import VoiceParser
def main():
parser = argparse.ArgumentParser()
parser.add_argument('--wav-path', type=str, help="Path of a wav file")
parser.add_argument('--wav-dir', type=str, help="Directory of wav files")
parser.add_argument('--out-dir', type=str, help="Directory of output npz files")
args = parser.parse_args()
if (args.wav_path is None and args.wav_dir is None) or (args.wav_path is not None and args.wav_dir is not None):
parser.error("Please provide either '--wav-path' or '--wav-dir', but not both.")
out_dir = args.out_dir
model = VoiceParser(device='cpu')
if args.wav_path is not None:
model.extract_acoustic_embed(args.wav_path, out_dir)
print(f'Sucessfully parsed {args.wav_path}')
else:
wav_name_list = os.listdir(args.wav_dir)
for wav_name in wav_name_list:
wav_path = os.path.join(args.wav_dir, wav_name)
model.extract_acoustic_embed(wav_path, out_dir)
print(f'Sucessfully parsed {wav_path}')
if __name__ == '__main__':
main()
|