Spaces:

tee342
/

AudioMaster

Sleeping

App Files Files Community

tee342 committed on Jun 14

Commit

825b041

verified ·

1 Parent(s): 26b8861

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -26

app.py CHANGED Viewed

@@ -26,6 +26,14 @@ import json
 # Suppress warnings
 warnings.filterwarnings("ignore")
 # === Helper Functions ===
 def audiosegment_to_array(audio):
     return np.array(audio.get_array_of_samples()), audio.frame_rate
@@ -33,7 +41,7 @@ def audiosegment_to_array(audio):
 def array_to_audiosegment(samples, frame_rate, channels=1):
     return AudioSegment(
         samples.tobytes(),
-        frame_rate=frame_rate,
         sample_width=samples.dtype.itemsize,
         channels=channels
     )
@@ -196,7 +204,7 @@ def ai_mastering_chain(audio_path, genre="Pop", target_lufs=-14.0):
     final_audio.export(out_path, format="wav")
     return out_path
-# === Harmonic Saturation / Exciter – Now Defined Before Use ===
 def harmonic_saturation(audio, saturation_type="Tube", intensity=0.2):
     samples = np.array(audio.get_array_of_samples()).astype(np.float32)
@@ -361,17 +369,9 @@ preset_choices = {
     "🌫 ASMR Vocal": ["Auto Gain", "Low-Pass Filter (3000Hz)", "Noise Gate"],
     "🎼 Stage Mode": ["Reverb", "Bass Boost", "Limiter"],
     "🎵 Auto-Tune Style": ["Pitch Shift (+1 semitone)", "Normalize", "Treble Boost"],
-    "🎷 Jazz Vocal": ["Bass Boost (-200-400Hz)", "Treble Boost (-3000Hz)", "Normalize"],
-    "🎹 Jazz Piano": ["Treble Boost (4000-6000Hz)", "Normalize", "Stereo Widening"],
-    "🎻 Classical Strings": ["Bass Boost (100-500Hz)", "Treble Boost (3000-6000Hz)", "Reverb"],
-    "☕ Chillhop": ["Noise Gate", "Treble Boost (-3000Hz)", "Reverb"],
-    "🌌 Ambient": ["Reverb", "Noise Gate", "Treble Boost (6000-12000Hz)"],
     "🎤 R&B Vocal": ["Noise Reduction", "Bass Boost (100-300Hz)", "Treble Boost (2000-4000Hz)"],
     "💃 Soul Vocal": ["Noise Reduction", "Bass Boost (80-200Hz)", "Treble Boost (1500-3500Hz)"],
-    "🕺 Funk Groove": ["Bass Boost (80-200Hz)", "Treble Boost (1000-3000Hz)", "Stereo Widening"],
-    "🎹 Jazz Piano Solo": ["Treble Boost (2000-5000Hz)", "Normalize", "Stage Mode"],
-    "🎸 Trap EDM": ["Bass Boost (60-120Hz)", "Treble Boost (2000-5000Hz)", "Limiter"],
-    "🎸 Indie Rock": ["Bass Boost (150-400Hz)", "Treble Boost (2000-5000Hz)", "Compress Dynamic Range"]
 }
 preset_names = list(preset_choices.keys())
@@ -404,10 +404,25 @@ def batch_process_audio(files, selected_effects, isolate_vocals, preset_name, ex
 # === Vocal Pitch Correction – Auto-Tune Style ===
 def auto_tune_vocal(audio_path, target_key="C"):
     try:
-        return apply_pitch_shift(AudioSegment.from_file(audio_path), 0.2)
     except Exception as e:
         return None
 # === Real-Time Spectrum Analyzer + Live EQ Preview ===
 def visualize_spectrum(audio_path):
     y, sr = torchaudio.load(audio_path)
@@ -472,7 +487,7 @@ with gr.Blocks(css="""
         border-radius: 10px;
         padding: 10px 20px;
         font-weight: bold;
-        box-shadow: 0 0 10px #2563eb88;
         border: none;
         font-size: 16px;
     }
@@ -560,7 +575,7 @@ with gr.Blocks(css="""
     }
 """) as demo:
-    # Header
     gr.HTML('''
     <div class="studio-header">
         <img src="logo.png" width="400" />
@@ -675,7 +690,7 @@ with gr.Blocks(css="""
         )
     # --- Vocal Pitch Correction – Auto-Tune Style ===
-    with gr.Tab("🧬 Vocal Pitch Correction"):
         gr.Interface(
             fn=auto_tune_vocal,
             inputs=[
@@ -683,8 +698,9 @@ with gr.Blocks(css="""
                 gr.Textbox(label="Target Key", value="C", lines=1)
             ],
             outputs=gr.Audio(label="Pitch-Corrected Output", type="filepath"),
-            title="Auto-Tune Style Pitch Correction",
-            description="Correct vocal pitch automatically"
         )
     # --- Frequency Spectrum Tab – Real-time Visualizer ===
@@ -737,8 +753,7 @@ with gr.Blocks(css="""
             ],
             outputs=gr.File(label="Project File (.aiproj)"),
             title="Save Everything Together",
-            description="Save your session, effects, and settings in one file to reuse later.",
-            allow_flagging="never"
         )
         gr.Interface(
@@ -756,13 +771,13 @@ with gr.Blocks(css="""
     with gr.Tab("🎛 Preset Gallery"):
         gr.Markdown("### Select a preset visually")
         preset_gallery = gr.Gallery(value=[
-            ("images/pop_card.png",  "Pop"),
-            ("images/edm_card.png",  "EDM"),
-            ("images/rock_card.png",  "Rock"),
-            ("images/hiphop_card.png",  "Hip-Hop"),
-            ("images/rnb_card.png",  "R&B"),
-            ("images/soul_card.png",  "Soul"),
-            ("images/funk_card.png",  "Funk")
         ], label="Preset Cards", columns=4, height="auto")
         preset_name_out = gr.Dropdown(choices=preset_names, label="Selected Preset")

 # Suppress warnings
 warnings.filterwarnings("ignore")
# Optional dependency bootstrap: import pyrubberband, installing it on first
# run if it is missing from the environment.
try:
    import pyrubberband as pyrb
except ImportError:
    import importlib
    import subprocess
    import sys

    print("Installing pyrubberband...")
    # Invoke pip through the interpreter that is running this app so the
    # package lands in the same environment; a bare "pip" on PATH may belong
    # to a different Python. check=True surfaces a failed install right here
    # instead of as a confusing second ImportError below.
    subprocess.run(
        [sys.executable, "-m", "pip", "install", "pyrubberband"],
        check=True,
    )
    # Make the import system notice the freshly installed package.
    importlib.invalidate_caches()
    import pyrubberband as pyrb
 # === Helper Functions ===
 def audiosegment_to_array(audio):
     return np.array(audio.get_array_of_samples()), audio.frame_rate
 def array_to_audiosegment(samples, frame_rate, channels=1):
     return AudioSegment(
         samples.tobytes(),
+        frame_rate=int(frame_rate),
         sample_width=samples.dtype.itemsize,
         channels=channels
     )
     final_audio.export(out_path, format="wav")
     return out_path
+# === Harmonic Saturation / Exciter – Now Included ===
 def harmonic_saturation(audio, saturation_type="Tube", intensity=0.2):
     samples = np.array(audio.get_array_of_samples()).astype(np.float32)
     "🌫 ASMR Vocal": ["Auto Gain", "Low-Pass Filter (3000Hz)", "Noise Gate"],
     "🎼 Stage Mode": ["Reverb", "Bass Boost", "Limiter"],
     "🎵 Auto-Tune Style": ["Pitch Shift (+1 semitone)", "Normalize", "Treble Boost"],
     "🎤 R&B Vocal": ["Noise Reduction", "Bass Boost (100-300Hz)", "Treble Boost (2000-4000Hz)"],
     "💃 Soul Vocal": ["Noise Reduction", "Bass Boost (80-200Hz)", "Treble Boost (1500-3500Hz)"],
+    "🕺 Funk Groove": ["Bass Boost (80-200Hz)", "Treble Boost (1000-3000Hz)"]
 }
 preset_names = list(preset_choices.keys())
 # === Vocal Pitch Correction – Auto-Tune Style ===
 def auto_tune_vocal(audio_path, target_key="C"):
     """Pitch-shift the audio at *audio_path* according to *target_key*.

     The key name is converted to a semitone offset with ``key_to_semitone``
     and the whole clip is passed once through ``apply_pitch_shift`` with that
     offset. The result is exported as a WAV file.

     Args:
         audio_path: Path to the input audio file.
         target_key: Key name understood by ``key_to_semitone``.

     Returns:
         Path to the exported WAV file, or ``None`` if any step failed (the
         error is printed).
     """
     try:
         audio = AudioSegment.from_file(audio_path)
         semitones = key_to_semitone(target_key)
         tuned_audio = apply_pitch_shift(audio, semitones)
         # Use a unique file per call: a fixed name in the shared temp
         # directory would let concurrent requests overwrite each other's
         # output before it is served.
         fd, out_path = tempfile.mkstemp(prefix="autotuned_", suffix=".wav")
         os.close(fd)  # export() reopens the path itself
         tuned_audio.export(out_path, format="wav")
         return out_path
     except Exception as e:
         # Deliberate best-effort boundary for the UI: report and return None.
         print(f"Auto-Tune Error: {e}")
         return None
def key_to_semitone(key="C"):
    """Return the semitone offset of a key name above C (C=0 ... B=11).

    Matching ignores surrounding whitespace and letter case, and accepts
    flat spellings ("Bb", "Eb", ...) as well as the Unicode sharp and flat
    signs. Anything unrecognised, including non-string input, maps to 0.

    Args:
        key: Key name such as "C", "F#", "bb" or " g ".

    Returns:
        Integer semitone offset in the range 0-11.
    """
    if not isinstance(key, str):
        return 0

    sharps = ("C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "A#", "B")
    keys = {name: offset for offset, name in enumerate(sharps)}
    # Enharmonic flat spellings of the five sharp keys.
    keys.update({"Db": 1, "Eb": 3, "Gb": 6, "Ab": 8, "Bb": 10})

    name = key.strip().replace("\u266f", "#").replace("\u266d", "b")
    # Upper-case only the note letter so a trailing "b" still means "flat".
    name = name[:1].upper() + name[1:].lower()
    return keys.get(name, 0)
 # === Real-Time Spectrum Analyzer + Live EQ Preview ===
 def visualize_spectrum(audio_path):
     y, sr = torchaudio.load(audio_path)
         border-radius: 10px;
         padding: 10px 20px;
         font-weight: bold;
+        box-shadow: 0 0 10px #2563eb44;
         border: none;
         font-size: 16px;
     }
     }
 """) as demo:
+    # Header with logo and tagline
     gr.HTML('''
     <div class="studio-header">
         <img src="logo.png" width="400" />
         )
     # --- Vocal Pitch Correction – Auto-Tune Style ===
+    with gr.Tab("🎤 AI Auto-Tune"):
         gr.Interface(
             fn=auto_tune_vocal,
             inputs=[
                 gr.Textbox(label="Target Key", value="C", lines=1)
             ],
             outputs=gr.Audio(label="Pitch-Corrected Output", type="filepath"),
+            title="AI Auto-Tune",
+            description="Correct vocal pitch automatically using AI",
+            allow_flagging="never"
         )
     # --- Frequency Spectrum Tab – Real-time Visualizer ===
             ],
             outputs=gr.File(label="Project File (.aiproj)"),
             title="Save Everything Together",
+            description="Save your session, effects, and settings in one file to reuse later."
         )
         gr.Interface(
     with gr.Tab("🎛 Preset Gallery"):
         gr.Markdown("### Select a preset visually")
         preset_gallery = gr.Gallery(value=[
+            ("https://picsum.photos/id/10/150/100",  "Pop"),
+            ("https://picsum.photos/id/20/150/100",  "EDM"),
+            ("https://picsum.photos/id/30/150/100",  "Rock"),
+            ("https://picsum.photos/id/40/150/100",  "Hip-Hop"),
+            ("https://picsum.photos/id/50/150/100",  "R&B"),
+            ("https://picsum.photos/id/60/150/100",  "Soul"),
+            ("https://picsum.photos/id/70/150/100",  "Funk")
         ], label="Preset Cards", columns=4, height="auto")
         preset_name_out = gr.Dropdown(choices=preset_names, label="Selected Preset")