Spaces:

AZLABS
/

Comic-2

Running

App Files Files Community

AZLABS commited on Nov 24, 2024

Commit

b4e25f5

verified ·

1 Parent(s): 53514f2

Update app.py

Browse files

Files changed (1) hide show

app.py +121 -249

app.py CHANGED Viewed

@@ -1,257 +1,129 @@
 import os
-import json
-import urllib.request
-from PIL import Image
-import cv2
-import moviepy.editor as mp
 import logging
-import requests
 import uuid
-import time
-import gradio as gr
-from moviepy.editor import *
-from moviepy.video.tools.subtitles import SubtitlesClip
-from hercai import Hercai  # Import the hercai library
-from gtts import gTTS  # Import gTTS for text-to-speech
-from hercai import Hercai  # Import the hercai module
-# Configure logging for both file and console
-log_dir = os.getenv('LOG_DIRECTORY', './')
-LOGGER_FILE_PATH = os.path.join(str(log_dir), 'utils.log')
-# Create a formatter
-formatter = logging.Formatter(
-    '[%(asctime)s] [%(levelname)s] [%(filename)s] [%(lineno)s:%(funcName)s()] %(message)s',
-    datefmt='%Y-%b-%d %H:%M:%S'
-)
-# Create and configure the logger
-LOGGER = logging.getLogger(__name__)
-# Create file handler
-file_handler = logging.FileHandler(LOGGER_FILE_PATH, mode='a')
-file_handler.setFormatter(formatter)
-# Create console handler
-console_handler = logging.StreamHandler()
-console_handler.setFormatter(formatter)
-# Add both handlers to logger
-LOGGER.addHandler(file_handler)
-LOGGER.addHandler(console_handler)
-# Set log level
-log_level_env = os.getenv('LOG_LEVEL', 'INFO')
-log_level_dict = {
-    'DEBUG': logging.DEBUG,
-    'INFO': logging.INFO,
-    'WARNING': logging.WARNING,
-    'ERROR': logging.ERROR,
-    'CRITICAL': logging.CRITICAL
-}
-if log_level_env in log_level_dict:
-    log_level = log_level_dict[log_level_env]
-else:
-    log_level = log_level_dict['INFO']
-LOGGER.setLevel(log_level)
-# Set the path to the ImageMagick binary
-# os.environ["IMAGE_MAGICK_BINARY"] = "/usr/local/bin/convert"  # Update this path as needed (No longer needed)
-class Text2Video:
-    """A class to generate videos from text prompts."""
-    def __init__(self) -> None:
-        """Initialize the Text2Video class."""
-        self.hercai_api_key = "YOUR_HERCAI_API_KEY"  # Replace with your Hercai API key
-        self.hercai = Hercai(self.hercai_api_key)  # Initialize Hercai
-        self.hercai_base_url = "https://hercai.onrender.com/v3/text2image"
-        LOGGER.info("🚀 Text2Video class initialized.")
-    def generate_text(self, prompt: str) -> str:
-        """Generate text using GPT-3.5-turbo."""
-        LOGGER.info(f"📝 Generating text for prompt: {prompt}")
-        # ... (This part is not needed for Hercai) ...
-        return ""
-    def get_image(self, img_prompt: str) -> str:
-        """Generate an image based on the provided text prompt."""
-        LOGGER.info(f"🖼️ Generating image for prompt: {img_prompt}")
-        try:
-            image_result = self.hercai.draw_image(
-                model="simurg",  # Choose a Hercai model
-                prompt=img_prompt,
-                negative_prompt="Dark and gloomy"
-            )
-            image_url = image_result['url']
-            LOGGER.info(f"✅ Generated image URL: {image_url}")
-            return image_url
-        except requests.exceptions.RequestException as e:
-            LOGGER.error(f"❌ Error generating image: {str(e)}")
-            return ""
-    def download_img_from_url(self, image_url: str, image_path: str) -> str:
-        """Download an image from a URL."""
-        LOGGER.info(f"⬇️ Downloading image from URL: {image_url} to path: {image_path}")
-        try:
-            urllib.request.urlretrieve(image_url, image_path)
-            # Resize after downloading
-            img = Image.open(image_path)
-            img = img.resize((640, 480))  # Adjust resolution for reduced size
-            img.save(image_path)
-            LOGGER.info(f"✅ Image downloaded to: {image_path}")
-            return image_path
-        except Exception as e:
-            LOGGER.error(f"❌ Error downloading image from URL: {e}")
-            return ""
-    def text_to_audio(self, text: str, audio_path: str) -> str:
-        """Convert text to speech using gTTS."""
-        LOGGER.info(f"🔊 Converting text to audio for text: {text}")
-        try:
-            tts = gTTS(text=text, lang='en')  # You can change the language ('en' for English)
-            tts.save(audio_path, bitrate="128k")  # Reduce `bitrate` for smaller file size
-            LOGGER.info(f"✅ Audio saved to: {audio_path}")
-            return audio_path
-        except Exception as e:
-            LOGGER.error(f"❌ Error generating speech: {str(e)}")
-            return ""
-    #  The transcription part has been removed as it's no longer needed
-    def get_images_and_audio(self, list_prompts: list) -> tuple:
-        """Generate images and corresponding audio files from a list of prompts."""
-        LOGGER.info(f"🖼️🔊 Generating images and audio for prompts: {list_prompts}")
-        img_list = []
-        audio_paths = []
-        for img_prompt in list_prompts:
-            try:
-                unique_id = uuid.uuid4().hex
-                image_path = f"{img_prompt[:9]}_{unique_id}.png"
-                img_url = self.get_image(img_prompt)
-                if img_url:  # Only process if img_url exists & is not None
-                    image = self.download_img_from_url(img_url, image_path)
-                    img_list.append(image)
-                audio_path = f"{img_prompt[:9]}_{unique_id}.mp3"
-                audio = self.text_to_audio(img_prompt, audio_path)
-                if audio:  # Only process if audio exists
-                    audio_paths.append(audio)
-                LOGGER.info(f"✅ Processed prompt: {img_prompt}, Image: {image}, Audio: {audio}")
-            except Exception as e:
-                LOGGER.error(f"❌ Error processing prompt: {img_prompt}, {e}")
-        return img_list, audio_paths
-    def create_video_from_images_and_audio(self, image_files: list, audio_files: list, output_path: str) -> None:
-        """Create a video from images and corresponding audio files with pop-up bubbles."""
-        LOGGER.info(f"🎥 Creating video from images: {image_files}, audio files: {audio_files}")
-        try:
-            if len(image_files) != len(audio_files):
-                LOGGER.error("❌ Error: Number of images and audio files don't match.")
-                return
-            video_clips = []
-            for image_file, audio_file in zip(image_files, audio_files):
-                # Create the base video from the image and audio
-                if not os.path.exists(audio_file) or not os.path.exists(image_file):
-                    LOGGER.error(f"❌ Audio or image file missing for {image_file} or {audio_file}")
-                    continue
-                audio_clip = mp.AudioFileClip(audio_file)
-                video_clip = mp.ImageClip(image_file).set_duration(audio_clip.duration)
-                video_clip = video_clip.set_audio(audio_clip)
-                # Apply image cropping and bubble creation
-                try:
-                    img = Image.open(image_file)
-                    width, height = img.size
-                    cropped_image = img.crop((0, 0, int(width * 0.80), height))  # Cropping image to make space for bubble
-                    bubble_clip = mp.ImageClip(image_file).resize((150, 150))
-                    bubble_clip = bubble_clip.set_position((int(width * 0.90), 0))
-                    # Now combine the original video with the bubble
-                    video_clip = CompositeVideoClip([video_clip, bubble_clip])
-                except Exception as ex:
-                    LOGGER.error(f"❌ Error adding comic bubble: {str(ex)}")
-                video_clips.append(video_clip)
-                LOGGER.info(f"✅ Created video clip for image: {image_file}, audio: {audio_file}")
-            # Combine the generated clips into a single video
-            if video_clips:  # Only process if clip exists
-                final_clip = mp.concatenate_videoclips(video_clips)
-                final_clip.write_videofile(output_path, codec='libx264', fps=24) # Optimized codec and fps settings
-                LOGGER.info(f"✅ Video created successfully at: {output_path}")
-        except Exception as e:
-            LOGGER.error(f"❌ Error creating video: {str(e)}")
-    def generate_video(self, text: str) -> str:
-        """
-        Generate a video from a list of text prompts.
-        Args:
-            text (str): Text prompts separated by double commas.
-        Returns:
-            str: Path to the generated video file.
-        """
-        LOGGER.info(f"🎬 Generating video for text: {text}")
-        try:
-            list_prompts = [sentence.strip() for sentence in text.split(",,") if sentence.strip()]
-            LOGGER.info(f"📝 List of prompts: {list_prompts}")
-            # Set the output path for the generated video
-            output_path = f"output_video_{uuid.uuid4().hex[:8]}.mp4"
-            LOGGER.info(f"📁 Output path for video: {output_path}")
-            # Generate images and audio
-            img_list, audio_paths = self.get_images_and_audio(list_prompts)
-            # Create video from images and audio
-            self.create_video_from_images_and_audio(img_list, audio_paths, output_path)
-            return output_path
-        except Exception as e:
-            LOGGER.error(f"❌ Error generating video: {str(e)}")
-            return ""
-    def gradio_interface(self):
-        """Create and launch the Gradio interface."""
-        LOGGER.info("🌐 Launching Gradio interface.")
-        with gr.Blocks(css="style.css", theme='abidlabs/dracula_revamped') as demo:
-            example_txt = """once upon a time there was a village. It was a nice place to live, except for one thing. people did not like to share.,, One day a visitor came to town.
-            'Hello. Does anybody have food to share?' He asked. 'No', said everyone.,,
-            That's okay', said the visitor. 'I will make stone soup for everyone'.Then he took a stone and dropped it into a giant pot,,"""
-            gr.HTML("""
-                <center><h1 style="color:#fff">Comics Video Generator</h1></center>""")
-            with gr.Row(elem_id="col-container"):
-                input_text = gr.Textbox(label="Comics Text", placeholder="Enter the comics by double comma separated")
-            with gr.Row(elem_id="col-container"):
-                button = gr.Button("Generate Video")
-            with gr.Row(elem_id="col-container"):
-                output = gr.Video()
-            with gr.Row(elem_id="col-container"):
-                example = gr.Examples([example_txt], input_text)
-            button.click(self.generate_video, [input_text], output)
-        demo.launch(debug=True)
-        LOGGER.info("✅ Gradio interface launched.")
 if __name__ == "__main__":
-    LOGGER.info("🚀 Starting Text2Video application.")
-    text2video = Text2Video()
-    text2video.gradio_interface()

 import os
 import logging
 import uuid
+from gtts import gTTS
+import moviepy.editor as mp
+import g4f
+from g4f import Provider
+import urllib.request
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+def generate_image(prompt):
+    try:
+        unique_id = uuid.uuid4().hex
+        safe_prompt = prompt[:30].replace(' ', '_')  # Take first 30 chars and make filename safe
+        image_filename = f"{safe_prompt}_{unique_id}.png"
+        response = g4f.Image.create(
+            prompt=f"{prompt} in comic style",
+            model="dalle",
+            provider=Provider.DeepAI
+        )
+        if response:
+            urllib.request.urlretrieve(response, image_filename)
+            logger.info(f"✅ Generated image: {image_filename}")
+            return image_filename
+        return None
+    except Exception as e:
+        logger.error(f"❌ Error generating image: {e}")
+        return None
+def generate_audio(text):
+    try:
+        unique_id = uuid.uuid4().hex
+        safe_text = text[:30].replace(' ', '_')  # Take first 30 chars and make filename safe
+        audio_filename = f"{safe_text}_{unique_id}.mp3"
+        tts = gTTS(text=text, lang='en')
+        tts.save(audio_filename)
+        logger.info(f"✅ Generated audio: {audio_filename}")
+        return audio_filename
+    except Exception as e:
+        logger.error(f"❌ Error generating audio: {e}")
+        return None
+def get_images_and_audio(text):
+    segments = [s.strip() for s in text.split(",,") if s.strip()]
+    images = []
+    audio_files = []
+    for segment in segments:
+        image_file = generate_image(segment)
+        audio_file = generate_audio(segment)
+        if image_file and audio_file:
+            images.append(image_file)
+            audio_files.append(audio_file)
+            logger.info(f"✅ Processed prompt: {segment}, Image: {image_file}, Audio: {audio_file}")
+    return images, audio_files
+def create_video_from_images_and_audio(images, audio_files):
+    try:
+        if len(images) != len(audio_files):
+            raise ValueError("Number of images and audio files don't match.")
+        clips = []
+        for img, aud in zip(images, audio_files):
+            # Create audio clip
+            audio_clip = mp.AudioFileClip(aud)
+            # Create image clip
+            image_clip = mp.ImageClip(img).set_duration(audio_clip.duration)
+            # Combine image and audio
+            video_clip = image_clip.set_audio(audio_clip)
+            clips.append(video_clip)
+        # Concatenate all clips
+        final_clip = mp.concatenate_videoclips(clips)
+        # Write final video
+        output_filename = f"output_{uuid.uuid4().hex[:8]}.mp4"
+        final_clip.write_videofile(output_filename, fps=24)
+        # Clean up
+        final_clip.close()
+        for clip in clips:
+            clip.close()
+        # Clean up temporary files
+        for file in images + audio_files:
+            if os.path.exists(file):
+                os.remove(file)
+        logger.info(f"✅ Video created successfully: {output_filename}")
+        return output_filename
+    except Exception as e:
+        logger.error(f"❌ Error: {e}")
+        return None
+def create_video(text):
+    try:
+        # Get images and audio files
+        images, audio_files = get_images_and_audio(text)
+        # Create video
+        video_file = create_video_from_images_and_audio(images, audio_files)
+        return video_file
+    except Exception as e:
+        logger.error(f"❌ Error in create_video: {e}")
+        return None
 if __name__ == "__main__":
+    # Test the functionality
+    test_text = """Once upon a time there was a village.,,
+    One day a visitor came to town.,,
+    That's okay', said the visitor. 'I will make stone soup for everyone'."""
+    result = create_video(test_text)
+    if result:
+        print(f"Video created successfully: {result}")
+    else:
+        print("Failed to create video")