amos1088 committed on
Commit
545ba28
·
1 Parent(s): 51f8f41
Files changed (2) hide show
  1. app.py +12 -2
  2. requirements.txt +2 -1
app.py CHANGED
@@ -6,6 +6,7 @@ import spaces
6
  from PIL import Image
7
  from huggingface_hub import login
8
  from diffusers.utils import load_image
 
9
 
10
  from models.transformer_sd3 import SD3Transformer2DModel
11
  from pipeline_stable_diffusion_3_ipa import StableDiffusion3Pipeline
@@ -50,9 +51,18 @@ pipe.init_ipadapter(
50
 
51
  @spaces.GPU
52
  def gui_generation(prompt, ref_img, guidance_scale, ipadapter_scale):
53
- # Load and convert reference image
 
 
 
 
 
 
 
54
  ref_img = Image.open(ref_img.name).convert('RGB')
 
55
 
 
56
  with torch.no_grad():
57
  image = pipe(
58
  width=1024,
@@ -62,7 +72,7 @@ def gui_generation(prompt, ref_img, guidance_scale, ipadapter_scale):
62
  num_inference_steps=24,
63
  guidance_scale=guidance_scale,
64
  generator=torch.Generator("cuda").manual_seed(42),
65
- clip_image=ref_img,
66
  ipadapter_scale=ipadapter_scale
67
  ).images[0]
68
 
 
6
  from PIL import Image
7
  from huggingface_hub import login
8
  from diffusers.utils import load_image
9
+ from torchvision import transforms
10
 
11
  from models.transformer_sd3 import SD3Transformer2DModel
12
  from pipeline_stable_diffusion_3_ipa import StableDiffusion3Pipeline
 
51
 
52
  @spaces.GPU
53
  def gui_generation(prompt, ref_img, guidance_scale, ipadapter_scale):
54
+
55
+ # Load and preprocess the reference image
56
+ preprocess = transforms.Compose([
57
+ transforms.Resize((384, 384)),
58
+ transforms.ToTensor(),
59
+ transforms.ConvertImageDtype(torch.float16)
60
+ ])
61
+
62
  ref_img = Image.open(ref_img.name).convert('RGB')
63
+ ref_img_tensor = preprocess(ref_img).unsqueeze(0).to("cuda")
64
 
65
+ # Generate the image
66
  with torch.no_grad():
67
  image = pipe(
68
  width=1024,
 
72
  num_inference_steps=24,
73
  guidance_scale=guidance_scale,
74
  generator=torch.Generator("cuda").manual_seed(42),
75
+ clip_image=ref_img_tensor,
76
  ipadapter_scale=ipadapter_scale
77
  ).images[0]
78
 
requirements.txt CHANGED
@@ -8,4 +8,5 @@ sentencepiece
8
  spaces
9
  pillow
10
  peft
11
- openai
 
 
8
  spaces
9
  pillow
10
  peft
11
+ openai
12
+ torchvision