Spaces:

tee342
/

AudioMaster

Sleeping

App Files Files Community

tee342 committed on Jun 12

Commit

7b9755f

verified ·

1 Parent(s): 98d55b3

Update app.py

Browse files

Files changed (1) hide show

app.py +74 -39

app.py CHANGED Viewed

@@ -85,7 +85,7 @@ def apply_bass_boost(audio, gain=10):
 def apply_treble_boost(audio, gain=10):
     return audio.high_pass_filter(4000).apply_gain(gain)
-def apply_noise_gate(audio, threshold=-50.0, attack=50, release=100):
     samples = np.array(audio.get_array_of_samples())
     rms = np.sqrt(np.mean(samples**2))
     if rms < 1:
@@ -99,8 +99,8 @@ def apply_limiter(audio, limit_dB=-1):
     limiter = audio._spawn(audio.raw_data, overrides={"frame_rate": audio.frame_rate})
     return limiter.apply_gain(limit_dB)
-def apply_phaser(audio, rate=0.5, depth=0.7, feedback=0.2, mix=0.5):
-    return audio._spawn(audio.raw_data, overrides={"frame_rate": int(audio.frame_rate * rate)})
 def apply_bitcrush(audio, bit_depth=8):
     samples = np.array(audio.get_array_of_samples()).astype(np.float32)
@@ -127,6 +127,23 @@ def apply_stage_mode(audio):
     processed = apply_bass_boost(processed, gain=6)
     return apply_limiter(processed, limit_dB=-2)
 # === Vocal Isolation Helpers ===
 def load_track_local(path, sample_rate, channels=2):
     sig, rate = torchaudio.load(path)
@@ -390,10 +407,49 @@ def mix_tracks(track1, track2, volume_offset=0):
     mixed.export(out_path, format="wav")
     return out_path
 # === Dummy Voice Cloning Tab – Works Locally Only ===
 def clone_voice(*args):
     return "⚠️ Voice cloning requires local install – use Python 3.9 or below"
 # === Speaker Diarization ("Who Spoke When?") ===
 try:
     from pyannote.audio import Pipeline as DiarizationPipeline
@@ -417,7 +473,6 @@ def diarize_and_transcribe(audio_path):
     audio.export(temp_wav, format="wav")
     try:
-        from pyannote.audio import Pipeline as DiarizationPipeline
         diarization = diarize_pipeline(temp_wav)
         result = whisper.transcribe(temp_wav)
@@ -525,6 +580,20 @@ with gr.Blocks(title="AI Audio Studio", css="style.css") as demo:
             clear_btn=None
         )
     # --- Transcribe & Edit Tab ===
     with gr.Tab("📝 Transcribe & Edit"):
         gr.Interface(
@@ -535,40 +604,6 @@ with gr.Blocks(title="AI Audio Studio", css="style.css") as demo:
             description="Convert voice to text and edit it before exporting again."
         )
-    # --- Vocal Presets for Singers ===
-    with gr.Tab("🎤 Vocal Presets for Singers"):
-        gr.Interface(
-            fn=process_audio,
-            inputs=[
-                gr.Audio(label="Upload Vocal Track", type="filepath"),
-                gr.CheckboxGroup(choices=[
-                    "Noise Reduction",
-                    "Normalize",
-                    "Compress Dynamic Range",
-                    "Bass Boost",
-                    "Treble Boost",
-                    "Reverb",
-                    "Auto Gain",
-                    "Vocal Distortion",
-                    "Harmony",
-                    "Stage Mode"
-                ]),
-                gr.Checkbox(label="Isolate Vocals After Effects"),
-                gr.Dropdown(choices=preset_names, label="Select Vocal Preset", value=preset_names[0] if preset_names else None),
-                gr.Dropdown(choices=["MP3", "WAV"], label="Export Format", value="MP3")
-            ],
-            outputs=[
-                gr.Audio(label="Processed Vocal", type="filepath"),
-                gr.Image(label="Waveform Preview"),
-                gr.Textbox(label="Session Log (JSON)", lines=5),
-                gr.Textbox(label="Detected Genre", lines=1),
-                gr.Textbox(label="Status", value="✅ Ready", lines=1)
-            ],
-            title="Create Studio-Quality Vocal Tracks",
-            description="Apply singer-friendly presets and effects to enhance vocals.",
-            allow_flagging="never"
-        )
     # --- Voice Cloning (Local Only) ===
     with gr.Tab("🎭 Voice Cloning (Local Only)"):
         gr.Interface(
@@ -679,7 +714,7 @@ with gr.Blocks(title="AI Audio Studio", css="style.css") as demo:
         )
     # --- Mix Two Tracks ===
-    with gr.Tab("🔀 Mix Two Tracks"):
         gr.Interface(
             fn=mix_tracks,
             inputs=[

 def apply_treble_boost(audio, gain=10):
     return audio.high_pass_filter(4000).apply_gain(gain)
+def apply_noise_gate(audio, threshold=-50.0):
     samples = np.array(audio.get_array_of_samples())
     rms = np.sqrt(np.mean(samples**2))
     if rms < 1:
     limiter = audio._spawn(audio.raw_data, overrides={"frame_rate": audio.frame_rate})
     return limiter.apply_gain(limit_dB)
+def apply_phaser(audio):
+    return audio._spawn(audio.raw_data, overrides={"frame_rate": int(audio.frame_rate * 1.1)})
 def apply_bitcrush(audio, bit_depth=8):
     samples = np.array(audio.get_array_of_samples()).astype(np.float32)
     processed = apply_bass_boost(processed, gain=6)
     return apply_limiter(processed, limit_dB=-2)
+# === Genre Mastering Presets ===
+genre_presets = {
+    "Soul": ["Warmth", "Bass Boost (+6dB)", "Mid Enhance"],
+    "Funk": ["Treble Boost (+6dB)", "Compression", "Stereo Widening"],
+    "Rock": ["Distortion", "Punchy Mids", "Reverb"],
+    "Pop": ["Vocal Clarity", "Limiter", "Stereo Expansion"],
+    "Acoustic": ["Natural Reverb", "Gentle Compression", "Mid Focus"],
+    "Dance": ["Loudness Maximizer", "Bass Emphasis", "Stereo Widen"],
+    "EDM": ["Heavy Bass", "Stereo Expansion", "Limiter", "Phaser"],
+    "Country": ["Clean Mix", "Subtle Reverb", "Mid Focus"],
+    "Disco": ["Rhythmic Echo", "Bass Thump", "Treble Boost (+8dB)"],
+    "Metal": ["Distortion", "High Gain", "Crisp Highs"],
+    "Hip-Hop": ["Deep Bass", "Vocal Presence", "Saturation"],
+    "Trap": ["808 Bass", "Reverb", "Lo-Fi Texture"],
+    "LoFi": ["Bitcrusher", "Tape Hiss", "Soft Compression"]
+}
 # === Vocal Isolation Helpers ===
 def load_track_local(path, sample_rate, channels=2):
     sig, rate = torchaudio.load(path)
     mixed.export(out_path, format="wav")
     return out_path
+# === Genre Mastering Tab ===
+def apply_genre_preset(audio, genre):
+    global preset_choices
+    selected_preset = preset_choices.get(genre, [])
+    return process_audio(audio, selected_preset, False, genre, "WAV")
+with gr.Tab("🎧 Genre Mastering"):
+    gr.Markdown("Apply pre-tuned mastering settings for different music genres.")
+    genre_dropdown = gr.Dropdown(
+        choices=list(genre_presets.keys()),
+        label="Select Genre",
+        value="Pop"
+    )
+    gr.Interface(
+        fn=lambda audio, genre: apply_genre_preset(audio, genre)[0],
+        inputs=[
+            gr.Audio(label="Upload Track", type="filepath"),
+            genre_dropdown
+        ],
+        outputs=gr.Audio(label="Mastered Output", type="filepath"),
+        title="Genre-Specific Mastering",
+        description="Apply professionally tuned presets for popular music genres."
+    )
 # === Dummy Voice Cloning Tab – Works Locally Only ===
 def clone_voice(*args):
     return "⚠️ Voice cloning requires local install – use Python 3.9 or below"
+with gr.Tab("🎭 Voice Cloning (Local Only)"):
+    gr.Interface(
+        fn=clone_voice,
+        inputs=[
+            gr.File(label="Source Voice Clip"),
+            gr.File(label="Target Voice Clip"),
+            gr.Textbox(label="Text to Clone", lines=5)
+        ],
+        outputs=gr.Audio(label="Cloned Output", type="filepath"),
+        title="Replace One Voice With Another",
+        description="Clone voice from source to target speaker using AI"
+    )
 # === Speaker Diarization ("Who Spoke When?") ===
 try:
     from pyannote.audio import Pipeline as DiarizationPipeline
     audio.export(temp_wav, format="wav")
     try:
         diarization = diarize_pipeline(temp_wav)
         result = whisper.transcribe(temp_wav)
             clear_btn=None
         )
+    # --- Genre Mastering Tab ===
+    with gr.Tab("🎧 Genre Mastering"):
+        gr.Interface(
+            fn=lambda audio, genre: apply_genre_preset(audio, genre)[0],
+            inputs=[
+                gr.Audio(label="Upload Track", type="filepath"),
+                gr.Dropdown(choices=list(genre_presets.keys()), label="Select Genre", value="Pop")
+            ],
+            outputs=gr.Audio(label="Mastered Output", type="filepath"),
+            title="Genre-Specific Mastering",
+            description="Apply professionally tuned presets for popular music genres.",
+            allow_flagging="never"
+        )
     # --- Transcribe & Edit Tab ===
     with gr.Tab("📝 Transcribe & Edit"):
         gr.Interface(
             description="Convert voice to text and edit it before exporting again."
         )
     # --- Voice Cloning (Local Only) ===
     with gr.Tab("🎭 Voice Cloning (Local Only)"):
         gr.Interface(
         )
     # --- Mix Two Tracks ===
+    with gr.Tab(" remix mode"),
         gr.Interface(
             fn=mix_tracks,
             inputs=[