| import ffmpeg | |
| import numpy as np | |
| import re | |
| import unicodedata | |
| def load_audio(file, sampling_rate): | |
| try: | |
| file = file.strip(" ").strip('"').strip("\n").strip('"').strip(" ") | |
| out, _ = ( | |
| ffmpeg.input(file, threads=0) | |
| .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sampling_rate) | |
| .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True) | |
| ) | |
| except Exception as error: | |
| raise RuntimeError(f"Failed to load audio: {error}") | |
| return np.frombuffer(out, np.float32).flatten() | |
| def format_title(title): | |
| formatted_title = ( | |
| unicodedata.normalize("NFKD", title).encode("ascii", "ignore").decode("utf-8") | |
| ) | |
| formatted_title = re.sub(r"[\u2500-\u257F]+", "", formatted_title) | |
| formatted_title = re.sub(r"[^\w\s.-]", "", formatted_title) | |
| formatted_title = re.sub(r"\s+", "_", formatted_title) | |
| return formatted_title | |