Spaces:
Running
on
Zero
Running
on
Zero
File size: 1,992 Bytes
c9ce2d9 2bbecd3 c9ce2d9 5c463b7 c9ce2d9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 |
import sys
import librosa
from transformers import Pop2PianoForConditionalGeneration, Pop2PianoProcessor, Pop2PianoTokenizer
import torch
from post_processor import post_process
import tempfile
import shutil
def generate_midi(song_path, output_dir=None):
if output_dir is None:
output_dir = "./Outputs"
print("Loading Model...")
device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using {device}")
model = Pop2PianoForConditionalGeneration.from_pretrained("Tim-gubski/Audio2Hero").to(device)
model.eval()
processor = Pop2PianoProcessor.from_pretrained("sweetcocoa/pop2piano")
tokenizer = Pop2PianoTokenizer.from_pretrained("sweetcocoa/pop2piano")
print("Processing Song...")
# load an example audio file and corresponding ground truth midi file
audio, sr = librosa.load(song_path, sr=44100) # feel free to change the sr to a suitable value.
inputs = processor(audio=audio, sampling_rate=sr, return_tensors="pt")
# generate model output
print("Generating output...")
model.generation_config.output_logits = True
model.generation_config.return_dict_in_generate = True
model_output = model.generate(inputs["input_features"].to(device))
tokenizer_output = processor.batch_decode(
token_ids=model_output.sequences.cpu(),
feature_extractor_output=inputs
)
# save to temp file
temp_dir = tempfile.TemporaryDirectory()
tokenizer_output["pretty_midi_objects"][0].write(f"{temp_dir.name}/temp.mid")
print("Post Processing...")
post_process(song_path, f"{temp_dir.name}/temp.mid", output_dir)
# zip folder
song_name = song_path.split("/")[-1]
song_name = ".".join(song_name.split(".")[0:-1])
shutil.make_archive(f"{output_dir}/{song_name}", 'zip', f"{output_dir}/{song_name}")
temp_dir.cleanup()
print("Done.")
return f"{output_dir}/{song_name}.zip"
if __name__=="__main__":
args = sys.argv[1:]
song_path = args[0]
output_dir = args[1]
generate_midi(song_path, output_dir)
|