|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
import json |
|
import torchaudio |
|
|
|
|
|
def read_lists(list_file):
    """Return the lines of ``list_file`` with surrounding whitespace removed.

    The file is opened as UTF-8 text. Entries keep their file order, and a
    blank line yields an empty string rather than being dropped.
    """
    with open(list_file, 'r', encoding='utf8') as handle:
        return [entry.strip() for entry in handle]
|
|
|
def read_json_lists(list_file):
    """Merge the JSON content of every file named in ``list_file``.

    ``list_file`` is read with ``read_lists``; each resulting entry is opened
    as a UTF-8 file and parsed with ``json.load``. The parsed contents are
    folded into one dict with ``dict.update``, so when the same key appears
    in several files the file listed later wins.
    """
    merged = {}
    for json_path in read_lists(list_file):
        with open(json_path, 'r', encoding='utf8') as handle:
            content = json.load(handle)
        merged.update(content)
    return merged
|
|
|
def load_wav(wav, target_sr):
    """Load an audio file as a single averaged channel at ``target_sr``.

    Args:
        wav: Audio source, passed unchanged to ``torchaudio.load``.
        target_sr: Sample rate the returned waveform should have.

    Returns:
        The loaded waveform averaged over dimension 0 (kept as a size-1
        dimension), resampled to ``target_sr`` when the file's own sample
        rate differs from it.

    Raises:
        AssertionError: If the file's sample rate is lower than
            ``target_sr``; only downsampling is permitted.
    """
    speech, sample_rate = torchaudio.load(wav)
    # Average over dimension 0 (presumably the channel axis, as in
    # torchaudio's default channels-first layout) while keeping that axis.
    speech = speech.mean(dim=0, keepdim=True)
    if sample_rate == target_sr:
        return speech
    if not sample_rate > target_sr:
        # Raised explicitly instead of via ``assert`` so the check is not
        # stripped under ``python -O``; exception type and message are the
        # same as before, so existing callers are unaffected.
        raise AssertionError(
            'wav sample rate {} must be greater than {}'.format(sample_rate, target_sr)
        )
    resampler = torchaudio.transforms.Resample(orig_freq=sample_rate, new_freq=target_sr)
    return resampler(speech)
|
|