MusicGen

Build error

App Files Files Community

adefossez committed on Jun 9, 2023

Commit

40689f8

2 Parent(s): 378cf0a 9d7284e

Merge branch 'main' into our_hf

Browse files

Files changed (3) hide show

app.py +16 -2
app_batched.py +14 -3
hf_loading.py +1 -4

app.py CHANGED Viewed

@@ -66,6 +66,16 @@ with gr.Blocks() as demo:
         1. Melody -- a music generation model capable of generating music condition on text and melody inputs. **Note**, you can also use text only.
         2. Small -- a 300M transformer decoder conditioned on text only.
         3. Medium -- a 1.5B transformer decoder conditioned on text only.
         See [github.com/facebookresearch/audiocraft](https://github.com/facebookresearch/audiocraft)
         for more details.
@@ -79,7 +89,7 @@ with gr.Blocks() as demo:
             with gr.Row():
                 submit = gr.Button("Submit")
             with gr.Row():
-                model = gr.Radio(["melody", "medium", "small"], label="Model", value="melody", interactive=True)
             with gr.Row():
                 duration = gr.Slider(minimum=1, maximum=30, value=10, label="Duration", interactive=True)
             with gr.Row():
@@ -107,7 +117,11 @@ with gr.Blocks() as demo:
                 "a light and cheerly EDM track, with syncopated drums, aery pads, and strong emotions",
                 "./assets/bach.mp3",
                 "melody"
-            ]
         ],
         inputs=[text, melody, model],
         outputs=[output]

         1. Melody -- a music generation model capable of generating music condition on text and melody inputs. **Note**, you can also use text only.
         2. Small -- a 300M transformer decoder conditioned on text only.
         3. Medium -- a 1.5B transformer decoder conditioned on text only.
+        4. Large -- a 3.3B transformer decoder conditioned on text only (might OOM for the longest sequences.)
+        When the optional melody conditioning wav is provided, the model will extract
+        a broad melody and try to follow it in the generated samples.
+        To skip the queue, you can duplicate this space and upgrade to a GPU in the settings.
+        <br/>
+        <a href="https://huggingface.co/spaces/musicgen/MusicGen?duplicate=true">
+        <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
+        </p>
         See [github.com/facebookresearch/audiocraft](https://github.com/facebookresearch/audiocraft)
         for more details.
             with gr.Row():
                 submit = gr.Button("Submit")
             with gr.Row():
+                model = gr.Radio(["melody", "medium", "small", "large"], label="Model", value="melody", interactive=True)
             with gr.Row():
                 duration = gr.Slider(minimum=1, maximum=30, value=10, label="Duration", interactive=True)
             with gr.Row():
                 "a light and cheerly EDM track, with syncopated drums, aery pads, and strong emotions",
                 "./assets/bach.mp3",
                 "melody"
+            ],
+            [
+                "lofi slow bpm electro chill with organic samples",
+                "medium",
+            ],
         ],
         inputs=[text, melody, model],
         outputs=[output]

app_batched.py CHANGED Viewed

@@ -71,8 +71,15 @@ with gr.Blocks() as demo:
         presented at: "Simple and Controllable Music Generation".
         Enter the description of the music you want and an optional audio used for melody conditioning.
-        This will generate a 12s extract with the `melody` model. For generating longer sequences
-        (up to 30 seconds), use the Colab demo or your own GPU.
         See [github.com/facebookresearch/audiocraft](https://github.com/facebookresearch/audiocraft)
         for more details.
@@ -100,9 +107,13 @@ with gr.Blocks() as demo:
                 None,
             ],
             [
-                "a light and cheerly EDM track, with syncopated drums, aery pads, and strong emotions",
                 "./assets/bach.mp3",
             ]
         ],
         inputs=[text, melody],
         outputs=[output]

         presented at: "Simple and Controllable Music Generation".
         Enter the description of the music you want and an optional audio used for melody conditioning.
+        The model will extract the broad melody from the uploaded wav if provided.
+        This will generate a 12s extract with the `melody` model.
+        To generate longer sequences (up to 30 seconds) and skip the queue, you can duplicate
+        the full demo space, which offers more controls, and upgrade to a GPU in the settings.
+        <br/>
+        <a href="https://huggingface.co/spaces/musicgen/MusicGen?duplicate=true">
+        <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
+        </p>
         See [github.com/facebookresearch/audiocraft](https://github.com/facebookresearch/audiocraft)
         for more details.
                 None,
             ],
             [
+                "a light and cheerly EDM track, with syncopated drums, aery pads, and strong emotions bpm: 130",
                 "./assets/bach.mp3",
             ]
+            [
+                "lofi slow bpm electro chill with organic samples",
+                None,
+            ],
         ],
         inputs=[text, melody],
         outputs=[output]

hf_loading.py CHANGED Viewed

@@ -1,10 +1,9 @@
 """Utility for loading the models from HF."""
-import os
 from pathlib import Path
 import typing as tp
 from omegaconf import OmegaConf
-from huggingface_hub import hf_hub_download, login
 import torch
 from audiocraft.models import builders, MusicGen
@@ -16,8 +15,6 @@ MODEL_CHECKPOINTS_MAP = {
     "melody": "facebook/musicgen-melody",
 }
-login(os.environ['ACCESS_TOKEN'])
 def _get_state_dict(file_or_url: tp.Union[Path, str],
                     filename="state_dict.bin", device='cpu'):

 """Utility for loading the models from HF."""
 from pathlib import Path
 import typing as tp
 from omegaconf import OmegaConf
+from huggingface_hub import hf_hub_download
 import torch
 from audiocraft.models import builders, MusicGen
     "melody": "facebook/musicgen-melody",
 }
 def _get_state_dict(file_or_url: tp.Union[Path, str],
                     filename="state_dict.bin", device='cpu'):