|
import ffmpeg |
|
import numpy as np |
|
import re |
|
import unicodedata |
|
|
|
|
|
def load_audio(file: str, sampling_rate: int) -> np.ndarray:
    """Decode an audio file into a mono float32 waveform via the ffmpeg CLI.

    Args:
        file: Path to the audio file. Surrounding spaces, double quotes and
            newlines are stripped before the path is handed to ffmpeg.
        sampling_rate: Output sample rate, passed to ffmpeg as ``ar``.

    Returns:
        A one-dimensional ``float32`` array of the decoded samples.

    Raises:
        RuntimeError: If the path cannot be cleaned or decoding fails. The
            original exception is chained as ``__cause__``.
    """
    try:
        # Strip order is kept exactly as-is: it peels quotes that sit inside
        # or outside stray spaces/newlines on a pasted path.
        file = file.strip(" ").strip('"').strip("\n").strip('"').strip(" ")
        # Raw little-endian float32 PCM, downmixed to one channel, is written
        # to stdout ("-") so it can be read straight into a NumPy buffer.
        out, _ = (
            ffmpeg.input(file, threads=0)
            .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sampling_rate)
            .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True)
        )
    except Exception as error:
        detail = str(error)
        # The exception text alone may not say what went wrong; when the
        # exception carries captured stderr, append it to the message.
        stderr = getattr(error, "stderr", None)
        if isinstance(stderr, bytes):
            stderr = stderr.decode("utf-8", errors="replace")
        if isinstance(stderr, str) and stderr.strip():
            detail = f"{detail}\n{stderr.strip()}"
        raise RuntimeError(f"Failed to load audio: {detail}") from error

    return np.frombuffer(out, np.float32).flatten()
|
|
|
|
|
def format_title(title: str) -> str:
    """Return an ASCII-only, whitespace-free version of ``title``.

    The title is NFKD-normalized so accented and compatibility characters
    decompose to their base forms, then every non-ASCII code point is dropped.
    Of what remains, only word characters, whitespace, ``.`` and ``-`` are
    kept, and each run of whitespace becomes a single underscore.

    Args:
        title: Arbitrary text to sanitize.

    Returns:
        The sanitized title. It may be empty, and leading or trailing
        whitespace in the input becomes a leading or trailing underscore.
    """
    # Dropping non-ASCII here also removes box-drawing characters
    # (U+2500-U+257F), so no separate pass for them is needed afterwards.
    ascii_title = (
        unicodedata.normalize("NFKD", title).encode("ascii", "ignore").decode("ascii")
    )
    cleaned = re.sub(r"[^\w\s.-]", "", ascii_title)
    return re.sub(r"\s+", "_", cleaned)
|
|