Spaces:
Running
Running
import argparse | |
import sys | |
from pathlib import Path | |
from typing import List | |
from dora.log import fatal | |
import torch as th | |
from demucs.apply import apply_model, BagOfModels | |
from demucs.audio import save_audio | |
from demucs.pretrained import get_model_from_args, ModelLoadingError | |
from demucs.separate import load_track | |
def separator( | |
tracks: List[Path], | |
out: Path, | |
model: str, | |
device: str, | |
shifts: int, | |
overlap: float, | |
stem: str, | |
int24: bool, | |
float32: bool, | |
clip_mode: str, | |
mp3: bool, | |
mp3_bitrate: int, | |
jobs: int, | |
verbose: bool, | |
): | |
"""Separate the sources for the given tracks | |
Args: | |
tracks (Path): Path to tracks | |
out (Path): Folder where to put extracted tracks. A subfolder with the model name will be created. | |
model (str): Model name | |
device (str): Device to use, default is cuda if available else cpu | |
shifts (int): Number of random shifts for equivariant stabilization. Increase separation time but improves quality for Demucs. 10 was used in the original paper. | |
overlap (float): Overlap | |
stem (str): Only separate audio into {STEM} and no_{STEM}. | |
int24 (bool): Save wav output as 24 bits wav. | |
float32 (bool): Save wav output as float32 (2x bigger). | |
clip_mode (str): Strategy for avoiding clipping: rescaling entire signal if necessary (rescale) or hard clipping (clamp). | |
mp3 (bool): Convert the output wavs to mp3. | |
mp3_bitrate (int): Bitrate of converted mp3. | |
jobs (int): Number of jobs. This can increase memory usage but will be much faster when multiple cores are available. | |
verbose (bool): Verbose | |
""" | |
args = argparse.Namespace() | |
args.tracks = tracks | |
args.out = out | |
args.model = model | |
args.device = device | |
args.shifts = shifts | |
args.overlap = overlap | |
args.stem = stem | |
args.int24 = int24 | |
args.float32 = float32 | |
args.clip_mode = clip_mode | |
args.mp3 = mp3 | |
args.mp3_bitrate = mp3_bitrate | |
args.jobs = jobs | |
args.verbose = verbose | |
args.filename = "{track}/{stem}.{ext}" | |
args.split = True | |
args.segment = None | |
args.name = model | |
args.repo = None | |
try: | |
model = get_model_from_args(args) | |
except ModelLoadingError as error: | |
fatal(error.args[0]) | |
if args.segment is not None and args.segment < 8: | |
fatal("Segment must greater than 8. ") | |
if ".." in args.filename.replace("\\", "/").split("/"): | |
fatal('".." must not appear in filename. ') | |
if isinstance(model, BagOfModels): | |
print( | |
f"Selected model is a bag of {len(model.models)} models. " | |
"You will see that many progress bars per track." | |
) | |
if args.segment is not None: | |
for sub in model.models: | |
sub.segment = args.segment | |
else: | |
if args.segment is not None: | |
model.segment = args.segment | |
model.cpu() | |
model.eval() | |
if args.stem is not None and args.stem not in model.sources: | |
fatal( | |
'error: stem "{stem}" is not in selected model. STEM must be one of {sources}.'.format( | |
stem=args.stem, sources=", ".join(model.sources) | |
) | |
) | |
out = args.out / args.name | |
out.mkdir(parents=True, exist_ok=True) | |
print(f"Separated tracks will be stored in {out.resolve()}") | |
for track in args.tracks: | |
if not track.exists(): | |
print( | |
f"File {track} does not exist. If the path contains spaces, " | |
'please try again after surrounding the entire path with quotes "".', | |
file=sys.stderr, | |
) | |
continue | |
print(f"Separating track {track}") | |
wav = load_track(track, model.audio_channels, model.samplerate) | |
ref = wav.mean(0) | |
wav = (wav - ref.mean()) / ref.std() | |
sources = apply_model( | |
model, | |
wav[None], | |
device=args.device, | |
shifts=args.shifts, | |
split=args.split, | |
overlap=args.overlap, | |
progress=True, | |
num_workers=args.jobs, | |
)[0] | |
sources = sources * ref.std() + ref.mean() | |
if args.mp3: | |
ext = "mp3" | |
else: | |
ext = "wav" | |
kwargs = { | |
"samplerate": model.samplerate, | |
"bitrate": args.mp3_bitrate, | |
"clip": args.clip_mode, | |
"as_float": args.float32, | |
"bits_per_sample": 24 if args.int24 else 16, | |
} | |
if args.stem is None: | |
for source, name in zip(sources, model.sources): | |
stem = out / args.filename.format( | |
track=track.name.rsplit(".", 1)[0], | |
trackext=track.name.rsplit(".", 1)[-1], | |
stem=name, | |
ext=ext, | |
) | |
stem.parent.mkdir(parents=True, exist_ok=True) | |
save_audio(source, str(stem), **kwargs) | |
else: | |
sources = list(sources) | |
stem = out / args.filename.format( | |
track=track.name.rsplit(".", 1)[0], | |
trackext=track.name.rsplit(".", 1)[-1], | |
stem=args.stem, | |
ext=ext, | |
) | |
stem.parent.mkdir(parents=True, exist_ok=True) | |
save_audio(sources.pop(model.sources.index(args.stem)), str(stem), **kwargs) | |
# Warning : after poping the stem, selected stem is no longer in the list 'sources' | |
other_stem = th.zeros_like(sources[0]) | |
for i in sources: | |
other_stem += i | |
stem = out / args.filename.format( | |
track=track.name.rsplit(".", 1)[0], | |
trackext=track.name.rsplit(".", 1)[-1], | |
stem="no_" + args.stem, | |
ext=ext, | |
) | |
stem.parent.mkdir(parents=True, exist_ok=True) | |
save_audio(other_stem, str(stem), **kwargs) | |