Spaces:

szili2011
/

ExtendSong

Runtime error

App Files Community

szili2011 committed on Oct 20, 2024

Commit

007a1b7

verified ·

1 Parent(s): 4710acd

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -19

app.py CHANGED Viewed

@@ -4,56 +4,46 @@ import librosa
 # Function to load audio using librosa
 def load_audio(file):
-    # Load the audio file and return the audio array and sample rate
     audio, sr = librosa.load(file, sr=None)
     return audio, sr
 # Function to get a relevant audio segment based on onset detection
 def get_segment(audio, sr):
-    # Calculate onset envelope and detect onsets
     onset_env = librosa.onset.onset_strength(y=audio, sr=sr)
     onset_frames = librosa.onset.onset_detect(onset_envelope=onset_env, sr=sr, backtrack=True)
-    # If no onsets are detected, return a segment from the beginning
     if len(onset_frames) == 0:
-        return audio[:2048], sr  # Return the first segment of 1 second
     # Calculate energy over time
     energy = np.array([np.sum(np.abs(audio[i:i + 2048]**2)) for i in range(0, len(audio), 2048)])
-    # Threshold to consider a segment musically relevant
     energy_threshold = np.mean(energy) + np.std(energy)
-    # Find onsets that exceed the energy threshold
     relevant_onsets = [f for f in onset_frames if f < len(energy) and energy[f] > energy_threshold]
-    # If no relevant onsets are found, fall back to the first detected onset
     start_frame = relevant_onsets[0] if relevant_onsets else onset_frames[0]
     start_sample = librosa.frames_to_samples(start_frame)
-    # Define a segment length in samples (1 second)
-    segment_length = sr  # 1 second segment
     end_sample = min(start_sample + segment_length, len(audio))
-    # Return the selected segment
     return audio[start_sample:end_sample], sr
 # Function to extend music by adding silence
 def extend_music(file, added_minutes):
     audio, sr = load_audio(file)
-    # Get a relevant segment from the audio
     segment, sr = get_segment(audio, sr)
-    # Calculate the number of samples to add based on the duration in minutes
     additional_samples = int(added_minutes * 60 * sr)
-    extended_audio = np.concatenate([segment, np.zeros(additional_samples)])  # Append zeros for silence
     # Normalize audio to the range of [-1, 1]
-    extended_audio = extended_audio / np.max(np.abs(extended_audio))  # Avoid overflow
     # Return the audio as a NumPy array and the sample rate as an integer
-    return extended_audio.astype(np.float32), sr
 # Gradio UI setup
 with gr.Blocks() as app:
@@ -66,5 +56,5 @@ with gr.Blocks() as app:
     submit_button = gr.Button("Extend Audio")
     submit_button.click(extend_music, inputs=[audio_input, added_minutes], outputs=audio_output)
-# Launch the app
-app.launch()

 # Function to load audio using librosa
 def load_audio(file):
     """Decode *file* with librosa and hand back its samples and sample rate.

     ``sr=None`` is passed so librosa keeps the file's own sample rate
     instead of resampling to its default rate.

     Returns:
         The ``(audio, sr)`` pair produced by ``librosa.load``.
     """
     return librosa.load(file, sr=None)
 # Function to get a relevant audio segment based on onset detection
 def get_segment(audio, sr, segment_seconds=1.0, window=2048):
     """Pick a short excerpt of *audio* that starts at a high-energy onset.

     Onsets are detected with librosa. Signal energy is measured over
     consecutive, non-overlapping windows of ``window`` samples; the first
     onset lying in a window whose energy exceeds ``mean + std`` of all
     window energies becomes the start of the excerpt. When no onset
     qualifies, the first detected onset is used instead.

     Args:
         audio: Sample array, indexed along its first axis. Presumably the
             1-D mono signal returned by ``load_audio`` -- confirm if
             multi-channel input is ever passed.
         sr: Sample rate of ``audio`` in Hz.
         segment_seconds: Length of the returned excerpt in seconds
             (default: 1 second).
         window: Samples per energy window. Also the length of the fallback
             excerpt returned when no onset is detected at all.

     Returns:
         A ``(segment, sr)`` tuple. ``segment`` is a slice of ``audio`` and
         may be shorter than requested when the onset is near the end.
     """
     onset_env = librosa.onset.onset_strength(y=audio, sr=sr)
     onset_frames = librosa.onset.onset_detect(
         onset_envelope=onset_env, sr=sr, backtrack=True
     )
     if len(onset_frames) == 0:
         # Nothing detected: fall back to the first energy window.
         return audio[:window], sr

     # Energy of each consecutive, non-overlapping window of samples.
     energy = np.array(
         [np.sum(audio[i:i + window] ** 2) for i in range(0, len(audio), window)]
     )
     energy_threshold = np.mean(energy) + np.std(energy)

     # Onset frames count librosa hops, not energy windows. Convert every
     # onset to a sample position first, then to the index of the energy
     # window that contains it, so the threshold is tested on the right window.
     onset_samples = librosa.frames_to_samples(onset_frames)
     onset_windows = onset_samples // window
     start_sample = next(
         (
             sample
             for sample, win in zip(onset_samples, onset_windows)
             if win < len(energy) and energy[win] > energy_threshold
         ),
         onset_samples[0],
     )
     start_sample = int(start_sample)

     segment_length = int(round(segment_seconds * sr))
     end_sample = min(start_sample + segment_length, len(audio))
     return audio[start_sample:end_sample], sr
 # Function to extend music by adding silence
 def extend_music(file, added_minutes):
     """Return an excerpt of *file* followed by a stretch of silence.

     The excerpt chosen by ``get_segment`` is peak-normalized to the range
     [-1, 1] and padded with ``added_minutes`` minutes of zeros.

     Args:
         file: Audio source forwarded unchanged to ``load_audio``.
         added_minutes: Minutes of silence to append; must be non-negative.

     Returns:
         ``(extended_audio, sr)``: a float32 NumPy array and the sample rate.

     Raises:
         ValueError: If ``added_minutes`` is missing or negative.
     """
     if added_minutes is None or added_minutes < 0:
         raise ValueError("added_minutes must be a non-negative number")

     audio, sr = load_audio(file)
     segment, sr = get_segment(audio, sr)

     additional_samples = int(added_minutes * 60 * sr)

     # Allocate the result once, already in float32 and already zero-filled,
     # so the silence needs no separate array and no float64 copy is made.
     extended_audio = np.zeros(len(segment) + additional_samples, dtype=np.float32)

     # The padding is all zeros, so the excerpt's peak is the overall peak.
     # A silent (or empty) excerpt is copied as-is to avoid dividing by zero.
     peak = np.max(np.abs(segment)) if len(segment) else 0.0
     extended_audio[:len(segment)] = segment / peak if peak > 0 else segment

     # NOTE(review): Gradio documents numpy audio output as
     # (sample_rate, data); this returns (data, sample_rate). The output
     # component is not visible here -- confirm the expected order.
     return extended_audio, sr
 # Gradio UI setup
 with gr.Blocks() as app:
     submit_button = gr.Button("Extend Audio")
     submit_button.click(extend_music, inputs=[audio_input, added_minutes], outputs=audio_output)
+# Launch the app with a public link
+# NOTE(review): share=True asks Gradio for a public tunnel link when the
+# script is run locally. On Hugging Face Spaces the option is reportedly
+# unsupported and only produces a warning -- confirm whether it is needed.
+app.launch(share=True)