Spaces:
Running
Running
import numpy as np | |
import pydub | |
import yt_dlp | |
import yt_dlp.options | |
def mp3_write(f: str, sr: int, x: np.ndarray, normalized: bool = False):
    """Encode an audio array as a 256 kbit/s MP3 using pydub.

    Args:
        f: Output target handed to ``AudioSegment.export``.
        sr: Frame rate of the audio, passed to pydub as ``frame_rate``.
        x: Audio samples. A 2-D array whose second axis has length 2 is
            written as two channels; any other shape is written as one.
        normalized: If true, ``x`` is expected to hold floats in [-1, 1)
            and is scaled to the 16-bit range. Otherwise ``x`` is cast to
            int16 as-is.
    """
    channels = 2 if (x.ndim == 2 and x.shape[1] == 2) else 1
    if normalized:  # normalized array - each item should be a float in [-1, 1)
        # Saturate before casting: a sample of exactly 1.0 (or slightly
        # above) scales to 32768, which does not fit in int16 and would
        # otherwise wrap to a large negative value (an audible click).
        scaled = np.asarray(x, dtype=np.float64) * 2**15
        y = np.clip(scaled, -(2**15), 2**15 - 1).astype(np.int16)
    else:
        y = np.int16(x)
    song = pydub.AudioSegment(
        y.tobytes(), frame_rate=sr, sample_width=2, channels=channels
    )
    song.export(f, format="mp3", bitrate="256k")
def normalize(
    audio: np.ndarray, min_y: float = -1.0, max_y: float = 1.0, eps: float = 1e-8
):
    """Linearly rescale ``audio`` into ``[min_y + eps, max_y - eps]``.

    The smallest input sample maps to ``min_y + eps`` and the largest to
    ``max_y - eps``; ``eps`` keeps the result strictly inside the requested
    bounds.

    Args:
        audio: Samples to rescale.
        min_y: Lower bound of the target range.
        max_y: Upper bound of the target range.
        eps: Margin subtracted from ``max_y`` and added to ``min_y``.

    Returns:
        A new floating-point array with the same shape as ``audio``.
        A constant input (no dynamic range) maps to the midpoint of the
        target range instead of NaN; an empty input is returned empty.
    """
    max_y -= eps
    min_y += eps

    # Work in floating point from the start so integer inputs (e.g. int16
    # PCM) cannot overflow in ``audio - amin`` / ``amax - amin``.
    out_dtype = np.result_type(audio, 0.0)
    audio = audio.astype(out_dtype, copy=False)

    if audio.size == 0:
        # max()/min() are undefined for empty arrays; nothing to rescale.
        return audio.copy()

    amax = audio.max()
    amin = audio.min()
    span = amax - amin
    if span == 0:
        # Constant signal: avoid 0/0 and place it in the middle of the range.
        return np.full(audio.shape, (max_y + min_y) / 2, dtype=out_dtype)

    return (max_y - min_y) * (audio - amin) / span + min_y
# yt_dlp script copied from https://github.com/yt-dlp/yt-dlp/blob/28d485714fef88937c82635438afba5db81f9089/devscripts/cli_to_api.py
# Keep a reference to yt-dlp's original parser factory: parse_patched_options
# temporarily replaces yt_dlp.options.create_parser and restores it from this.
create_parser = yt_dlp.options.create_parser
def parse_patched_options(opts):
    """Parse ``opts`` with yt-dlp while a handful of parser defaults are overridden.

    A parser is built from the original factory, its defaults are updated,
    and ``yt_dlp.options.create_parser`` is swapped for a factory returning
    that parser only for the duration of the ``yt_dlp.parse_options`` call.
    The original factory is always restored, even if parsing raises.

    Args:
        opts: Command-line style arguments forwarded to
            ``yt_dlp.parse_options``.

    Returns:
        Whatever ``yt_dlp.parse_options`` returns for ``opts``.
    """
    overrides = {
        "ignoreerrors": False,
        "retries": 0,
        "fragment_retries": 0,
        "extract_flat": False,
        "concat_playlist": "never",
    }
    parser = create_parser()
    parser.defaults.update(overrides)

    def _patched_factory():
        return parser

    yt_dlp.options.create_parser = _patched_factory
    try:
        parsed = yt_dlp.parse_options(opts)
    finally:
        # Undo the monkeypatch regardless of the parse outcome.
        yt_dlp.options.create_parser = create_parser
    return parsed
# Baseline ydl_opts obtained by parsing an empty argument list with the
# patched parser; cli_to_api reports only options that differ from these.
default_opts = parse_patched_options([]).ydl_opts
def cli_to_api(opts, cli_defaults=False):
    """Return the parsed options for ``opts`` that differ from ``default_opts``.

    Args:
        opts: Command-line style arguments to parse.
        cli_defaults: If true, parse with ``yt_dlp.parse_options`` directly;
            otherwise parse with ``parse_patched_options``.

    Returns:
        A dict of the entries in the parsed ``ydl_opts`` whose values are not
        equal to the corresponding ``default_opts`` entry. If
        ``"postprocessors"`` is among them, it keeps only the postprocessors
        that are not present in ``default_opts["postprocessors"]``.
    """
    if cli_defaults:
        parse = yt_dlp.parse_options
    else:
        parse = parse_patched_options
    parsed_opts = parse(opts).ydl_opts

    changed = {}
    for key, value in parsed_opts.items():
        if default_opts[key] != value:
            changed[key] = value

    if "postprocessors" in changed:
        baseline_pps = default_opts["postprocessors"]
        changed["postprocessors"] = [
            pp for pp in changed["postprocessors"] if pp not in baseline_pps
        ]
    return changed