|
import numpy as np |
|
import pydub |
|
import yt_dlp |
|
import yt_dlp.options |
|
|
|
|
|
def mp3_write(f: str, sr: int, x: np.ndarray, normalized: bool = False) -> None:
    """Encode an array of audio samples as a 256 kbit/s MP3 using pydub.

    Args:
        f: Output target, passed unchanged to ``AudioSegment.export``.
        sr: Frame rate of ``x`` (passed to pydub as ``frame_rate``).
        x: Audio samples. A 2-D array whose second dimension is 2 is written
            as two channels; any other shape is written as one channel.
        normalized: When true, ``x`` is multiplied by ``2**15`` before the
            conversion to 16-bit samples (i.e. +/-1.0 is treated as full
            scale). When false, the values of ``x`` are used as they are.

    Samples that fall outside the signed 16-bit range are saturated to the
    nearest representable value rather than wrapping around.
    """
    channels = 2 if (x.ndim == 2 and x.shape[1] == 2) else 1

    # Scale in float64 so neither the multiplication nor the clipping can
    # overflow the input dtype.
    samples = np.asarray(x, dtype=np.float64)
    if normalized:
        samples = samples * 2**15

    # A normalized sample of exactly +1.0 maps to 32768, which does not fit in
    # int16 and would otherwise wrap to a full-scale negative click.
    pcm_range = np.iinfo(np.int16)
    y = np.clip(samples, pcm_range.min, pcm_range.max).astype(np.int16)

    # tobytes() emits C order, so a (frames, 2) array becomes interleaved
    # 16-bit samples (sample_width=2 bytes).
    song = pydub.AudioSegment(
        y.tobytes(), frame_rate=sr, sample_width=2, channels=channels
    )
    song.export(f, format="mp3", bitrate="256k")
|
|
|
|
|
def normalize(
    audio: np.ndarray, min_y: float = -1.0, max_y: float = 1.0, eps: float = 1e-8
) -> np.ndarray:
    """Linearly rescale ``audio`` so its extremes land just inside a range.

    The smallest input value is mapped to ``min_y + eps`` and the largest to
    ``max_y - eps``; everything in between is scaled linearly. The input array
    is not modified.

    Args:
        audio: Samples to rescale. Integer (or other non-floating) input is
            converted to float64 first.
        min_y: Lower bound of the target range.
        max_y: Upper bound of the target range.
        eps: Margin by which the target range is shrunk at both ends.

    Returns:
        A new array with the same shape as ``audio``. An empty input yields an
        empty array; a constant input (max == min) yields an array filled with
        the midpoint of the shrunken target range.
    """
    audio = np.asarray(audio)
    # In a narrow integer dtype `audio - amin` can wrap around
    # (e.g. int16: 32767 - (-32768)), so promote before doing arithmetic.
    if not np.issubdtype(audio.dtype, np.inexact):
        audio = audio.astype(np.float64)

    # max()/min() have no identity for zero-size arrays; nothing to rescale.
    if audio.size == 0:
        return audio.copy()

    max_y -= eps
    min_y += eps
    amax = audio.max()
    amin = audio.min()

    # A flat signal has zero dynamic range; dividing by it would give NaNs.
    if amax == amin:
        return np.full_like(audio, (max_y + min_y) / 2)

    return (max_y - min_y) * (audio - amin) / (amax - amin) + min_y
|
|
|
|
|
|
|
# Keep a reference to the original parser factory: parse_patched_options()
# replaces yt_dlp.options.create_parser temporarily and restores it from here.
create_parser = yt_dlp.options.create_parser


def parse_patched_options(opts):
    """Run ``yt_dlp.parse_options(opts)`` against a parser with altered defaults.

    A parser is built with the original factory and five of its defaults are
    overridden. While ``yt_dlp.parse_options`` runs,
    ``yt_dlp.options.create_parser`` is swapped for a factory returning that
    parser (presumably so ``parse_options`` picks it up -- confirm against
    yt-dlp). The original factory is reinstated afterwards, including when
    parsing raises.

    NOTE: the swap mutates a module-level attribute of ``yt_dlp.options`` for
    the duration of the call.

    Returns:
        Whatever ``yt_dlp.parse_options`` returns; other code in this file
        reads its ``ydl_opts`` attribute.
    """
    default_overrides = {
        "ignoreerrors": False,
        "retries": 0,
        "fragment_retries": 0,
        "extract_flat": False,
        "concat_playlist": "never",
    }
    parser = create_parser()
    parser.defaults.update(default_overrides)

    def _patched_factory():
        return parser

    yt_dlp.options.create_parser = _patched_factory
    try:
        parsed = yt_dlp.parse_options(opts)
    finally:
        # Always undo the monkeypatch, even if option parsing failed.
        yt_dlp.options.create_parser = create_parser
    return parsed
|
|
|
|
|
# Baseline option dict: what an empty argument list parses to under the
# patched defaults. cli_to_api() reports only deviations from this.
default_opts = parse_patched_options([]).ydl_opts


def cli_to_api(opts, cli_defaults=False):
    """Return the parsed options for ``opts`` that differ from the baseline.

    Args:
        opts: Argument list handed to the option parser.
        cli_defaults: If true, parse with ``yt_dlp.parse_options`` directly;
            otherwise parse through ``parse_patched_options``.

    Returns:
        A dict holding only the entries of the parsed ``ydl_opts`` whose value
        is not equal to the corresponding ``default_opts`` entry. If
        ``"postprocessors"`` is among them, its list is reduced to the items
        not present in the baseline's postprocessor list.
    """
    if cli_defaults:
        parse = yt_dlp.parse_options
    else:
        parse = parse_patched_options
    parsed_opts = parse(opts).ydl_opts

    changed = {}
    for key, value in parsed_opts.items():
        if default_opts[key] != value:
            changed[key] = value

    if "postprocessors" in changed:
        baseline_pps = default_opts["postprocessors"]
        extra_pps = []
        for pp in changed["postprocessors"]:
            if pp not in baseline_pps:
                extra_pps.append(pp)
        changed["postprocessors"] = extra_pps

    return changed
|
|