text2svg-demo-app

Running

App Files Files Community

Jinglong Xiong committed on Apr 21

Commit

bb5a422

1 Parent(s): 33dda45

can generate multiple variations

Browse files

Files changed (1) hide show

gen_image.py +40 -7

gen_image.py CHANGED Viewed

@@ -3,6 +3,15 @@ import torch
 class ImageGenerator:
     def __init__(self, model_id="stabilityai/stable-diffusion-2-1-base", device="cuda"):
         scheduler = EulerDiscreteScheduler.from_pretrained(model_id, subfolder="scheduler")
         self.pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
@@ -10,25 +19,49 @@ class ImageGenerator:
             torch_dtype=torch.float16
         )
         self.pipe = self.pipe.to(device)
-    def generate(self, prompt, negative_prompt=None, output_path=None):
-        image = self.pipe(prompt, negative_prompt=negative_prompt).images[0]
         if output_path:
-            image.save(output_path)
         return image
 # Example usage
 if __name__ == "__main__":
     generator = ImageGenerator()
     import time
     start_time = time.time()
     image = generator.generate(
-        prompt="magenta trapezoids layered on a transluscent silver sheet, simple, icon",
-        negative_prompt="3d, blurry, complex geometry, realistic",
-        output_path="sheet.png"
     )
     end_time = time.time()
     print(f"Time taken: {end_time - start_time} seconds")

 class ImageGenerator:
     def __init__(self, model_id="stabilityai/stable-diffusion-2-1-base", device="cuda"):
+        """
+        Initialize the image generator with a specific model.
+        Args:
+            model_id (str): The model identifier for the stable diffusion model.
+                Default is "stabilityai/stable-diffusion-2-1-base".
+            device (str): The device to run the model on, either "cuda" or "cpu".
+                Default is "cuda".
+        """
         scheduler = EulerDiscreteScheduler.from_pretrained(model_id, subfolder="scheduler")
         self.pipe = StableDiffusionPipeline.from_pretrained(
             model_id,
             torch_dtype=torch.float16
         )
         self.pipe = self.pipe.to(device)
+        self.positive_prompt = "simple, icon"
+        self.negative_prompt = "3d, blurry, complex geometry, realistic"
+    def generate(self, prompt, negative_prompt=None, output_path=None, num_images=1, num_inference_steps=50):
+        """
+        Generate an image based on the provided prompt.
+        Args:
+            prompt (str): The text description to generate an image from.
+            negative_prompt (str, optional): Elements to avoid in the generated image.
+                If None, uses the default negative prompt.
+            output_path (str, optional): Path to save the generated image.
+                If None, the image is not saved to disk.
+            num_images (int, optional): Number of images to generate.
+        Returns:
+            PIL.Image.Image: The generated image.
+        """
+        prompt = f"{prompt}, {self.positive_prompt}"
+        if negative_prompt is None:
+            negative_prompt = self.negative_prompt
+        images = self.pipe(
+            prompt,
+            negative_prompt=negative_prompt,
+            num_inference_steps=50,
+            num_images_per_prompt=num_images
+        ).images
         if output_path:
+            for i, image in enumerate(images):
+                image.save(f".cache/{output_path.replace('.png', f'_{i}.png')}")
         return image
 # Example usage: generate four variations of one prompt and report the wall-clock time.
 if __name__ == "__main__":
     import time

     generator = ImageGenerator()
     # Arguments for the timed call, gathered up front so the timed region
     # contains only the generate() call itself.
     request = {
         "prompt": "magenta trapezoids layered on a transluscent silver sheet",
         "output_path": "sheet.png",
         "num_images": 4,
     }
     start_time = time.time()
     image = generator.generate(**request)
     end_time = time.time()
     print(f"Time taken: {end_time - start_time} seconds")