Spaces:

gnosticdev
/

audio-a-video

Running

App Files Community

gnosticdev committed on Mar 30

Commit

9d50291

verified ·

1 Parent(s): bf377f6

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -11

app.py CHANGED Viewed

@@ -3,8 +3,8 @@ import moviepy.editor as mp
 import numpy as np
 import librosa
 from PIL import Image, ImageDraw
-import os
 import tempfile
 import logging
 # Configuración de logging
@@ -17,8 +17,11 @@ logger = logging.getLogger("audio_to_video")
 def generate_video(audio_file, image_file):
     try:
         # 1. Cargar audio
-        y, sr = librosa.load(audio_file)
         duration = librosa.get_duration(y=y, sr=sr)
         logger.info(f"Audio cargado: {duration:.1f} segundos")
@@ -32,10 +35,12 @@ def generate_video(audio_file, image_file):
         audio_envelope_zoom = audio_envelope * 0.2 + 0.9  # Para zoom
         audio_envelope_wave = audio_envelope * (img_h // 6)  # Para waveform
-        # 4. Generar frames
         def make_frame(t):
-            # --- Zoom automático ---
             time_idx = int(t * sr)
             zoom_factor = audio_envelope_zoom[time_idx] if time_idx < len(audio_envelope_zoom) else 1.0
             new_size = (int(img_w * zoom_factor), int(img_h * zoom_factor))
             zoomed_img = img.resize(new_size, Image.LANCZOS)
@@ -50,7 +55,7 @@ def generate_video(audio_file, image_file):
                 y_offset + img_h
             ))
-            # --- Waveform ---
             frame = ImageDraw.Draw(cropped_img)
             start_y = int(img_h * 0.8)  # 80% hacia abajo
@@ -68,7 +73,7 @@ def generate_video(audio_file, image_file):
                 points.extend([(x, y_pos), (x, y_neg)])
             if len(points) > 2:
-                frame.polygon(points, fill=(255, 0, 0, 150))
             return np.array(cropped_img)
@@ -77,10 +82,11 @@ def generate_video(audio_file, image_file):
         video.fps = 24
         video = video.set_audio(mp.AudioFileClip(audio_file))
-        # 6. Guardar video
         temp_dir = tempfile.mkdtemp()
         output_path = os.path.join(temp_dir, "output.mp4")
         video.write_videofile(
             output_path,
             codec="libx264",
@@ -89,12 +95,16 @@ def generate_video(audio_file, image_file):
             logger=None
         )
-        logger.info(f"Video guardado en: {output_path}")
         return output_path  # Retornar la ruta completa
     except Exception as e:
-        logger.error(f"Error crítico: {str(e)}")
-        return None  # Retornar None en caso de error
 # Interfaz Gradio
 iface = gr.Interface(
@@ -109,4 +119,4 @@ iface = gr.Interface(
 )
 if __name__ == "__main__":
-    iface.queue().launch()

 import numpy as np
 import librosa
 from PIL import Image, ImageDraw
 import tempfile
+import os
 import logging
 # Configuración de logging
 def generate_video(audio_file, image_file):
     try:
+        logger.info("Iniciando generación del video...")
         # 1. Cargar audio
+        logger.info(f"Cargando audio: {audio_file}")
+        y, sr = librosa.load(audio_file, sr=None, mono=True)  # Carga completa del audio
         duration = librosa.get_duration(y=y, sr=sr)
         logger.info(f"Audio cargado: {duration:.1f} segundos")
         audio_envelope_zoom = audio_envelope * 0.2 + 0.9  # Para zoom
         audio_envelope_wave = audio_envelope * (img_h // 6)  # Para waveform
+        # 4. Generar frames con zoom y waveform
         def make_frame(t):
+            # Calcular posición en el audio
             time_idx = int(t * sr)
+            # --- Efecto de Zoom ---
             zoom_factor = audio_envelope_zoom[time_idx] if time_idx < len(audio_envelope_zoom) else 1.0
             new_size = (int(img_w * zoom_factor), int(img_h * zoom_factor))
             zoomed_img = img.resize(new_size, Image.LANCZOS)
                 y_offset + img_h
             ))
+            # --- Dibujar Waveform ---
             frame = ImageDraw.Draw(cropped_img)
             start_y = int(img_h * 0.8)  # 80% hacia abajo
                 points.extend([(x, y_pos), (x, y_neg)])
             if len(points) > 2:
+                frame.polygon(points, fill=(255, 0, 0, 150))  # Rojo semitransparente
             return np.array(cropped_img)
         video.fps = 24
         video = video.set_audio(mp.AudioFileClip(audio_file))
+        # 6. Guardar video en un directorio temporal persistente
         temp_dir = tempfile.mkdtemp()
         output_path = os.path.join(temp_dir, "output.mp4")
+        logger.info(f"Exportando video a: {output_path}")
         video.write_videofile(
             output_path,
             codec="libx264",
             logger=None
         )
+        # Verificar que el archivo existe
+        if not os.path.exists(output_path):
+            raise Exception("Error: El archivo de video no se generó correctamente.")
+        logger.info(f"Video guardado correctamente: {output_path}")
         return output_path  # Retornar la ruta completa
     except Exception as e:
+        logger.error(f"Error crítico: {str(e)}", exc_info=True)
+        return None
 # Interfaz Gradio
 iface = gr.Interface(
 )
 if __name__ == "__main__":
+    iface.queue(max_size=1).launch(show_error=True)