Spaces:

slabstech
/

ghost-vision

Paused

App Files Files Community

sachin commited on 23 days ago

Commit

cb5e4aa

1 Parent(s): c43570d

add-genrate

Browse files

Files changed (1) hide show

intruct.py +117 -0

intruct.py CHANGED Viewed

@@ -5,6 +5,18 @@ import math
 from PIL import Image, ImageOps
 import torch
 from diffusers import StableDiffusionInstructPix2PixPipeline
 # Initialize FastAPI app
 app = FastAPI()
@@ -21,6 +33,111 @@ DEFAULT_TEXT_CFG = 7.5
 DEFAULT_IMAGE_CFG = 1.5
 DEFAULT_SEED = 1371
 def process_image(input_image: Image.Image, instruction: str, steps: int, text_cfg_scale: float, image_cfg_scale: float, seed: int):
     """
     Process the input image with the given instruction using InstructPix2Pix.

 from PIL import Image, ImageOps
 import torch
 from diffusers import StableDiffusionInstructPix2PixPipeline
+from fastapi import FastAPI, Response
+from fastapi.responses import FileResponse
+import torch
+from diffusers import StableDiffusionXLPipeline, UNet2DConditionModel, EulerDiscreteScheduler
+from huggingface_hub import hf_hub_download, login
+from safetensors.torch import load_file
+from io import BytesIO
+import os
+import base64  # Added for encoding images as base64
+from typing import List  # Added for type hinting the list of prompts
 # Initialize FastAPI app
 app = FastAPI()
 DEFAULT_IMAGE_CFG = 1.5
 DEFAULT_SEED = 1371
+HF_TOKEN = os.getenv("HF_TOKEN")
+def load_model():
+    try:
+        # Login to Hugging Face if token is provided
+        if HF_TOKEN:
+            login(token=HF_TOKEN)
+        base = "stabilityai/stable-diffusion-xl-base-1.0"
+        repo = "ByteDance/SDXL-Lightning"
+        ckpt = "sdxl_lightning_4step_unet.safetensors"
+        # Load model with explicit error handling
+        unet = UNet2DConditionModel.from_config(
+            base,
+            subfolder="unet"
+        ).to("cuda", torch.float16)
+        unet.load_state_dict(load_file(hf_hub_download(repo, ckpt), device="cuda"))
+        pipe = StableDiffusionXLPipeline.from_pretrained(
+            base,
+            unet=unet,
+            torch_dtype=torch.float16,
+            variant="fp16"
+        ).to("cuda")
+        # Configure scheduler
+        pipe.scheduler = EulerDiscreteScheduler.from_config(
+            pipe.scheduler.config,
+            timestep_spacing="trailing"
+        )
+        return pipe
+    except Exception as e:
+        raise Exception(f"Failed to load model: {str(e)}")
+# Load model at startup with error handling
+try:
+    pipe = load_model()
+except Exception as e:
+    print(f"Model initialization failed: {str(e)}")
+    raise
+@app.get("/generate")
+async def generate_image(prompt: str):
+    try:
+        # Generate image
+        image = pipe(
+            prompt,
+            num_inference_steps=4,
+            guidance_scale=0
+        ).images[0]
+        # Save image to buffer
+        buffer = BytesIO()
+        image.save(buffer, format="PNG")
+        buffer.seek(0)
+        return Response(content=buffer.getvalue(), media_type="image/png")
+    except Exception as e:
+        return {"error": str(e)}
+# New endpoint to handle a list of prompts
+@app.get("/generate_multiple")
+async def generate_multiple_images(prompts: List[str]):
+    try:
+        # List to store base64-encoded images
+        generated_images = []
+        # Generate an image for each prompt
+        for prompt in prompts:
+            image = pipe(
+                prompt,
+                num_inference_steps=4,
+                guidance_scale=0
+            ).images[0]
+            # Save image to buffer
+            buffer = BytesIO()
+            image.save(buffer, format="PNG")
+            buffer.seek(0)
+            # Encode the image as base64
+            image_base64 = base64.b64encode(buffer.getvalue()).decode("utf-8")
+            generated_images.append({
+                "prompt": prompt,
+                "image_base64": image_base64
+            })
+        return {"images": generated_images}
+    except Exception as e:
+        return {"error": str(e)}
+@app.get("/health")
+async def health_check():
+    return {"status": "healthy"}
 def process_image(input_image: Image.Image, instruction: str, steps: int, text_cfg_scale: float, image_cfg_scale: float, seed: int):
     """
     Process the input image with the given instruction using InstructPix2Pix.