hysts HF staff commited on
Commit
5708a7c
·
1 Parent(s): 7075804
Files changed (1) hide show
  1. edit_app.py +139 -139
edit_app.py CHANGED
@@ -46,154 +46,154 @@ example_instructions = [
46
  model_id = "timbrooks/instruct-pix2pix"
47
 
48
 
49
- def main():
50
- pipe = StableDiffusionInstructPix2PixPipeline.from_pretrained(
51
- model_id, torch_dtype=torch.float16, safety_checker=None
52
- ).to("cuda")
53
- example_image = Image.open("imgs/example.jpg").convert("RGB")
54
-
55
- def load_example(
56
- steps: int,
57
- randomize_seed: bool,
58
- seed: int,
59
- randomize_cfg: bool,
60
- text_cfg_scale: float,
61
- image_cfg_scale: float,
62
- ):
63
- example_instruction = random.choice(example_instructions)
64
- return [example_image, example_instruction] + generate(
65
- example_image,
66
- example_instruction,
67
- steps,
68
- randomize_seed,
69
- seed,
70
- randomize_cfg,
71
- text_cfg_scale,
72
- image_cfg_scale,
73
- )
74
-
75
- def generate(
76
- input_image: Image.Image,
77
- instruction: str,
78
- steps: int,
79
- randomize_seed: bool,
80
- seed: int,
81
- randomize_cfg: bool,
82
- text_cfg_scale: float,
83
- image_cfg_scale: float,
84
- ):
85
- seed = random.randint(0, 100000) if randomize_seed else seed
86
- text_cfg_scale = round(random.uniform(6.0, 9.0), ndigits=2) if randomize_cfg else text_cfg_scale
87
- image_cfg_scale = round(random.uniform(1.2, 1.8), ndigits=2) if randomize_cfg else image_cfg_scale
88
-
89
- width, height = input_image.size
90
- factor = 512 / max(width, height)
91
- factor = math.ceil(min(width, height) * factor / 64) * 64 / min(width, height)
92
- width = int((width * factor) // 64) * 64
93
- height = int((height * factor) // 64) * 64
94
- input_image = ImageOps.fit(input_image, (width, height), method=Image.Resampling.LANCZOS)
95
-
96
- if instruction == "":
97
- return [input_image, seed]
98
-
99
- generator = torch.manual_seed(seed)
100
- edited_image = pipe(
101
- instruction,
102
- image=input_image,
103
- guidance_scale=text_cfg_scale,
104
- image_guidance_scale=image_cfg_scale,
105
- num_inference_steps=steps,
106
- generator=generator,
107
- ).images[0]
108
- return [seed, text_cfg_scale, image_cfg_scale, edited_image]
109
-
110
- def reset():
111
- return [0, "Randomize Seed", 1371, "Fix CFG", 7.5, 1.5, None]
112
-
113
- with gr.Blocks() as demo:
114
- gr.HTML(
115
- """<h1 style="font-weight: 900; margin-bottom: 7px;">
116
- InstructPix2Pix: Learning to Follow Image Editing Instructions
 
 
 
117
  </h1>
118
  <p>For faster inference without waiting in queue, you may duplicate the space and upgrade to GPU in settings.
119
  <br/>
120
  <a href="https://huggingface.co/spaces/timbrooks/instruct-pix2pix?duplicate=true">
121
  <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
122
  <p/>"""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  )
124
- with gr.Row():
125
- with gr.Column(scale=1, min_width=100):
126
- generate_button = gr.Button("Generate")
127
- with gr.Column(scale=1, min_width=100):
128
- load_button = gr.Button("Load Example")
129
- with gr.Column(scale=1, min_width=100):
130
- reset_button = gr.Button("Reset")
131
- with gr.Column(scale=3):
132
- instruction = gr.Textbox(lines=1, label="Edit Instruction", interactive=True)
133
-
134
- with gr.Row():
135
- input_image = gr.Image(label="Input Image", type="pil", interactive=True)
136
- edited_image = gr.Image(label="Edited Image", type="pil", interactive=False)
137
- input_image.style(height=512, width=512)
138
- edited_image.style(height=512, width=512)
139
-
140
- with gr.Row():
141
- steps = gr.Number(value=50, precision=0, label="Steps", interactive=True)
142
- randomize_seed = gr.Radio(
143
- ["Fix Seed", "Randomize Seed"],
144
- value="Randomize Seed",
145
- type="index",
146
- show_label=False,
147
- interactive=True,
148
- )
149
- seed = gr.Number(value=1371, precision=0, label="Seed", interactive=True)
150
- randomize_cfg = gr.Radio(
151
- ["Fix CFG", "Randomize CFG"],
152
- value="Fix CFG",
153
- type="index",
154
- show_label=False,
155
- interactive=True,
156
- )
157
- text_cfg_scale = gr.Number(value=7.5, label="Text CFG", interactive=True)
158
- image_cfg_scale = gr.Number(value=1.5, label="Image CFG", interactive=True)
159
-
160
- gr.Markdown(help_text)
161
-
162
- load_button.click(
163
- fn=load_example,
164
- inputs=[
165
- steps,
166
- randomize_seed,
167
- seed,
168
- randomize_cfg,
169
- text_cfg_scale,
170
- image_cfg_scale,
171
- ],
172
- outputs=[input_image, instruction, seed, text_cfg_scale, image_cfg_scale, edited_image],
173
- )
174
- generate_button.click(
175
- fn=generate,
176
- inputs=[
177
- input_image,
178
- instruction,
179
- steps,
180
- randomize_seed,
181
- seed,
182
- randomize_cfg,
183
- text_cfg_scale,
184
- image_cfg_scale,
185
- ],
186
- outputs=[seed, text_cfg_scale, image_cfg_scale, edited_image],
187
- )
188
- reset_button.click(
189
- fn=reset,
190
- inputs=[],
191
- outputs=[steps, randomize_seed, seed, randomize_cfg, text_cfg_scale, image_cfg_scale, edited_image],
192
  )
 
 
 
 
193
 
194
- demo.queue(concurrency_count=1)
195
- demo.launch(share=False)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
196
 
197
 
198
  if __name__ == "__main__":
199
- main()
 
46
  model_id = "timbrooks/instruct-pix2pix"
47
 
48
 
49
+ pipe = StableDiffusionInstructPix2PixPipeline.from_pretrained(
50
+ model_id, torch_dtype=torch.float16, safety_checker=None
51
+ ).to("cuda")
52
+ example_image = Image.open("imgs/example.jpg").convert("RGB")
53
+
54
+
55
+ def load_example(
56
+ steps: int,
57
+ randomize_seed: bool,
58
+ seed: int,
59
+ randomize_cfg: bool,
60
+ text_cfg_scale: float,
61
+ image_cfg_scale: float,
62
+ ):
63
+ example_instruction = random.choice(example_instructions)
64
+ return [example_image, example_instruction] + generate(
65
+ example_image,
66
+ example_instruction,
67
+ steps,
68
+ randomize_seed,
69
+ seed,
70
+ randomize_cfg,
71
+ text_cfg_scale,
72
+ image_cfg_scale,
73
+ )
74
+
75
+
76
+ def generate(
77
+ input_image: Image.Image,
78
+ instruction: str,
79
+ steps: int,
80
+ randomize_seed: bool,
81
+ seed: int,
82
+ randomize_cfg: bool,
83
+ text_cfg_scale: float,
84
+ image_cfg_scale: float,
85
+ ):
86
+ seed = random.randint(0, 100000) if randomize_seed else seed
87
+ text_cfg_scale = round(random.uniform(6.0, 9.0), ndigits=2) if randomize_cfg else text_cfg_scale
88
+ image_cfg_scale = round(random.uniform(1.2, 1.8), ndigits=2) if randomize_cfg else image_cfg_scale
89
+
90
+ width, height = input_image.size
91
+ factor = 512 / max(width, height)
92
+ factor = math.ceil(min(width, height) * factor / 64) * 64 / min(width, height)
93
+ width = int((width * factor) // 64) * 64
94
+ height = int((height * factor) // 64) * 64
95
+ input_image = ImageOps.fit(input_image, (width, height), method=Image.Resampling.LANCZOS)
96
+
97
+ if instruction == "":
98
+ return [input_image, seed]
99
+
100
+ generator = torch.manual_seed(seed)
101
+ edited_image = pipe(
102
+ instruction,
103
+ image=input_image,
104
+ guidance_scale=text_cfg_scale,
105
+ image_guidance_scale=image_cfg_scale,
106
+ num_inference_steps=steps,
107
+ generator=generator,
108
+ ).images[0]
109
+ return [seed, text_cfg_scale, image_cfg_scale, edited_image]
110
+
111
+
112
+ def reset():
113
+ return [0, "Randomize Seed", 1371, "Fix CFG", 7.5, 1.5, None]
114
+
115
+
116
+ with gr.Blocks() as demo:
117
+ gr.HTML(
118
+ """<h1 style="font-weight: 900; margin-bottom: 7px;">
119
+ InstructPix2Pix: Learning to Follow Image Editing Instructions
120
  </h1>
121
  <p>For faster inference without waiting in queue, you may duplicate the space and upgrade to GPU in settings.
122
  <br/>
123
  <a href="https://huggingface.co/spaces/timbrooks/instruct-pix2pix?duplicate=true">
124
  <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>
125
  <p/>"""
126
+ )
127
+ with gr.Row():
128
+ with gr.Column(scale=1, min_width=100):
129
+ generate_button = gr.Button("Generate")
130
+ with gr.Column(scale=1, min_width=100):
131
+ load_button = gr.Button("Load Example")
132
+ with gr.Column(scale=1, min_width=100):
133
+ reset_button = gr.Button("Reset")
134
+ with gr.Column(scale=3):
135
+ instruction = gr.Textbox(lines=1, label="Edit Instruction", interactive=True)
136
+
137
+ with gr.Row():
138
+ input_image = gr.Image(label="Input Image", type="pil", interactive=True)
139
+ edited_image = gr.Image(label="Edited Image", type="pil", interactive=False)
140
+ input_image.style(height=512, width=512)
141
+ edited_image.style(height=512, width=512)
142
+
143
+ with gr.Row():
144
+ steps = gr.Number(value=50, precision=0, label="Steps", interactive=True)
145
+ randomize_seed = gr.Radio(
146
+ ["Fix Seed", "Randomize Seed"],
147
+ value="Randomize Seed",
148
+ type="index",
149
+ show_label=False,
150
+ interactive=True,
151
  )
152
+ seed = gr.Number(value=1371, precision=0, label="Seed", interactive=True)
153
+ randomize_cfg = gr.Radio(
154
+ ["Fix CFG", "Randomize CFG"],
155
+ value="Fix CFG",
156
+ type="index",
157
+ show_label=False,
158
+ interactive=True,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  )
160
+ text_cfg_scale = gr.Number(value=7.5, label="Text CFG", interactive=True)
161
+ image_cfg_scale = gr.Number(value=1.5, label="Image CFG", interactive=True)
162
+
163
+ gr.Markdown(help_text)
164
 
165
+ load_button.click(
166
+ fn=load_example,
167
+ inputs=[
168
+ steps,
169
+ randomize_seed,
170
+ seed,
171
+ randomize_cfg,
172
+ text_cfg_scale,
173
+ image_cfg_scale,
174
+ ],
175
+ outputs=[input_image, instruction, seed, text_cfg_scale, image_cfg_scale, edited_image],
176
+ )
177
+ generate_button.click(
178
+ fn=generate,
179
+ inputs=[
180
+ input_image,
181
+ instruction,
182
+ steps,
183
+ randomize_seed,
184
+ seed,
185
+ randomize_cfg,
186
+ text_cfg_scale,
187
+ image_cfg_scale,
188
+ ],
189
+ outputs=[seed, text_cfg_scale, image_cfg_scale, edited_image],
190
+ )
191
+ reset_button.click(
192
+ fn=reset,
193
+ inputs=[],
194
+ outputs=[steps, randomize_seed, seed, randomize_cfg, text_cfg_scale, image_cfg_scale, edited_image],
195
+ )
196
 
197
 
198
  if __name__ == "__main__":
199
+ demo.queue(max_size=20).launch()