"""FastAPI service that builds an MP4 slideshow from remote images and audio.

The single endpoint downloads the inputs into a per-request directory under
``staticfiles/``, renders the video with ffmpeg, and returns a public URL to
the result served by the ``/static`` mount.
"""

import asyncio
import contextlib
import logging
import os
import re
import shutil
import tempfile
import uuid
from typing import List
from urllib.parse import urlparse

import aiofiles
import aiohttp
from fastapi import FastAPI, HTTPException
from fastapi.staticfiles import StaticFiles
from pydantic import BaseModel, HttpUrl

logger = logging.getLogger(__name__)

# Public prefix under which the "/static" mount is reachable. Overridable via
# the environment so the service is not tied to a single deployment; the
# default is the original hard-coded value.
BASE_URL = os.environ.get(
    "SLIDESHOW_BASE_URL", "https://saq1b-api.hf.space/static"
)

# Matches the file id in the common Google Drive share-link shapes.
_DRIVE_ID_PATTERN = re.compile(r'(?:/file/d/|id=|/open\?id=)([^/&]+)')

# Create FastAPI app
app = FastAPI()

# Create and mount staticfiles directory
os.makedirs("staticfiles", exist_ok=True)
app.mount("/static", StaticFiles(directory="staticfiles"), name="static")


# Define input model for the request
class SlideshowRequest(BaseModel):
    """Request body for ``POST /make_slideshow``."""

    image_urls: List[HttpUrl]  # images, shown in the given order
    audio_url: HttpUrl  # audio track for the video
    duration: int  # seconds each image stays on screen
    zoom: bool = False  # apply the zoompan effect to every image


def extract_google_drive_id(url):
    """Extract file ID from a Google Drive URL.

    Returns the ID string, or ``None`` when the URL contains none of the
    recognised ``/file/d/<id>``, ``id=<id>`` or ``/open?id=<id>`` forms.
    """
    match = _DRIVE_ID_PATTERN.search(str(url))
    return match.group(1) if match else None


def _is_google_drive_url(url) -> bool:
    """Return True when the URL's host is drive.google.com (or a subdomain)."""
    host = urlparse(str(url)).hostname or ""
    return host == "drive.google.com" or host.endswith(".drive.google.com")


async def download_file(url, local_path):
    """Download a file from URL to local path asynchronously.

    Google Drive share links are rewritten to their direct-download form
    first. Returns ``True`` on success and ``False`` on any failure (the
    error is logged, never raised).

    NOTE(review): ``url`` is caller-supplied, so the server will fetch
    arbitrary hosts (SSRF exposure); consider an allow-list if this service
    is reachable from untrusted networks.
    """
    try:
        # Handle Google Drive URLs
        if _is_google_drive_url(url):
            file_id = extract_google_drive_id(url)
            if file_id:
                url = f"https://drive.google.com/uc?export=download&id={file_id}"

        async with aiohttp.ClientSession() as session:
            async with session.get(str(url)) as response:
                response.raise_for_status()
                async with aiofiles.open(local_path, 'wb') as f:
                    # Stream in 8 KiB chunks so large files are never held
                    # in memory as a whole.
                    async for chunk in response.content.iter_chunked(8192):
                        await f.write(chunk)
        return True
    except Exception as e:
        # Deliberate best-effort boundary: callers only need success/failure.
        logger.error("Error downloading %s: %s", url, e)
        return False


def _concat_quote(path: str) -> str:
    """Quote a path for an ffmpeg concat list (single quotes, ' escaped)."""
    escaped = path.replace("'", "'\\''")
    return f"'{escaped}'"


async def _write_concat_list(image_paths, duration) -> str:
    """Write a uniquely named concat demuxer list and return its path."""
    fd, concat_file = tempfile.mkstemp(prefix="slideshow_concat_", suffix=".txt")
    os.close(fd)

    lines = []
    for img in image_paths:
        # Absolute paths: the concat demuxer resolves relative entries
        # against the list file's directory, not the working directory.
        lines.append(f"file {_concat_quote(os.path.abspath(img))}\n")
        lines.append(f"duration {duration}\n")
    # Add the last image again without duration (required by ffmpeg)
    lines.append(f"file {_concat_quote(os.path.abspath(image_paths[-1]))}\n")

    async with aiofiles.open(concat_file, "w") as f:
        await f.write("".join(lines))
    return concat_file


def _build_plain_command(concat_file, audio_path, output_path, total_duration):
    """Build the ffmpeg argv for a slideshow without zoom (concat demuxer)."""
    return [
        "ffmpeg",
        "-f", "concat",
        "-safe", "0",
        "-i", concat_file,
        "-i", audio_path,
        "-c:v", "libx264",
        "-pix_fmt", "yuv420p",
        "-c:a", "aac",
        "-shortest",
        "-y",
        "-t", str(total_duration),
        output_path,
    ]


def _build_zoom_command(image_paths, audio_path, output_path, duration, zoom_ratio):
    """Build the ffmpeg argv for a slideshow using the zoompan filter."""
    fps = 25  # frames per second
    count = len(image_paths)

    cmd = ["ffmpeg"]
    # Add each image as an input that loops for 'duration' seconds.
    for img in image_paths:
        cmd.extend(["-loop", "1", "-t", str(duration), "-i", img])
    # Append the audio input. Its index will be len(image_paths).
    cmd.extend(["-i", audio_path])

    # Each input's video stream is processed with zoompan; the zoom grows by
    # zoom_ratio per frame, starting at 1.0.
    segments = [
        f"[{i}:v]zoompan=z='if(eq(on,0),1,zoom+{zoom_ratio})':"
        f"d={duration*fps}:s=hd720, setpts=PTS-STARTPTS[v{i}];"
        for i in range(count)
    ]
    # Concatenate all processed video segments.
    labels = "".join(f"[v{i}]" for i in range(count))
    filter_complex = (
        "".join(segments)
        + f"{labels}concat=n={count}:v=1:a=0,format=yuv420p[v]"
    )

    # Map the concatenated video and the audio stream.
    cmd.extend([
        "-filter_complex", filter_complex,
        "-map", "[v]",
        "-map", f"{count}:a",
        "-c:v", "libx264",
        "-pix_fmt", "yuv420p",
        "-c:a", "aac",
        "-shortest",
        "-y",
        output_path,
    ])
    return cmd


async def create_slideshow(image_paths, audio_path, output_path, duration, zoom=False, zoom_ratio=0.04):
    """Generate slideshow from images and audio using ffmpeg asynchronously.

    Args:
        image_paths: Local image files, shown in order.
        audio_path: Local audio file used as the soundtrack.
        output_path: Destination of the rendered MP4 (overwritten).
        duration: Seconds each image is shown.
        zoom: When true, apply a zoompan effect to every image.
        zoom_ratio: Zoom increment per frame when ``zoom`` is enabled.

    Returns:
        ``True`` when ffmpeg exits with status 0, ``False`` otherwise
        (including empty input, a non-positive duration, or ffmpeg failing
        to start).
    """
    if not image_paths or duration <= 0:
        logger.error("FFmpeg error: need at least one image and a positive duration")
        return False

    concat_file = None
    try:
        if zoom:
            cmd = _build_zoom_command(
                image_paths, audio_path, output_path, duration, zoom_ratio
            )
        else:
            # A per-call temp file keeps concurrent requests from clobbering
            # each other's concat list.
            concat_file = await _write_concat_list(image_paths, duration)
            cmd = _build_plain_command(
                concat_file, audio_path, output_path, len(image_paths) * duration
            )

        process = await asyncio.create_subprocess_exec(
            *cmd,
            stdout=asyncio.subprocess.PIPE,
            stderr=asyncio.subprocess.PIPE,
        )
        _, stderr = await process.communicate()

        if process.returncode != 0:
            # ffmpeg output is not guaranteed to be valid UTF-8.
            logger.error("FFmpeg error: %s", stderr.decode(errors="replace"))
            return False
        return True
    except OSError as e:
        # e.g. the ffmpeg binary is missing or the temp file is unwritable.
        logger.error("FFmpeg error: %s", e)
        return False
    finally:
        # Remove temporary concat file if it exists
        if concat_file is not None:
            with contextlib.suppress(OSError):
                os.remove(concat_file)


@app.post("/make_slideshow")
async def make_slideshow(request: SlideshowRequest):
    """
    Create a slideshow from images and audio with specified duration per image.
    Returns the URL of the generated video.

    Raises:
        HTTPException: 400 when the request has no images, a non-positive
            duration, or a download fails; 500 when rendering fails or an
            unexpected error occurs. The request directory is removed on
            every error path.
    """
    if not request.image_urls:
        raise HTTPException(status_code=400, detail="At least one image URL is required")
    if request.duration <= 0:
        raise HTTPException(status_code=400, detail="Duration must be a positive integer")

    # Create unique directory for this request
    request_id = str(uuid.uuid4())
    request_dir = os.path.join("staticfiles", request_id)
    os.makedirs(request_dir, exist_ok=True)

    try:
        # Download images
        image_paths = [
            os.path.join(request_dir, f"image_{i:03d}.png")
            for i in range(len(request.image_urls))
        ]
        download_tasks = [
            download_file(url, path)
            for url, path in zip(request.image_urls, image_paths)
        ]

        # Download audio
        audio_path = os.path.join(request_dir, "audio.mp3")
        download_tasks.append(download_file(request.audio_url, audio_path))

        # Wait for all downloads to complete; the audio result is last.
        *image_results, audio_ok = await asyncio.gather(*download_tasks)

        # Check if all downloads were successful
        if not all(image_results):
            raise HTTPException(status_code=400, detail="Failed to download one or more images")
        if not audio_ok:
            raise HTTPException(status_code=400, detail=f"Failed to download audio: {request.audio_url}")

        # Output video path
        output_path = os.path.join(request_dir, "slideshow.mp4")

        # Generate slideshow
        if not await create_slideshow(image_paths, audio_path, output_path, request.duration, request.zoom):
            raise HTTPException(status_code=500, detail="Failed to create slideshow")

        # Return URL to the video
        video_url = f"{BASE_URL}/{request_id}/slideshow.mp4"
        return {"url": video_url}
    except HTTPException:
        # Keep the intended status code (e.g. 400) instead of masking it
        # as a generic 500; still clean up the request directory.
        shutil.rmtree(request_dir, ignore_errors=True)
        raise
    except Exception as e:
        # Clean up on error
        shutil.rmtree(request_dir, ignore_errors=True)
        raise HTTPException(status_code=500, detail=f"Error: {str(e)}") from e


if __name__ == "__main__":
    import uvicorn

    uvicorn.run(app, host="0.0.0.0", port=7860)