ginipick commited on
Commit
15cc8b5
ยท
verified ยท
1 Parent(s): f8cac3e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +64 -25
app.py CHANGED
@@ -7,6 +7,8 @@ import base64
7
  import mimetypes
8
  import json
9
  import io
 
 
10
 
11
  import torch
12
  from PIL import Image
@@ -122,7 +124,7 @@ def generate_by_google_genai(text, file_name, model="gemini-2.0-flash-exp"):
122
  # ์ž„์‹œ ํŒŒ์ผ๋กœ ์ด๋ฏธ์ง€ ๋ฐ›์„ ์ค€๋น„
123
  with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
124
  temp_path = tmp.name
125
- # ์‘๋‹ต ์ŠคํŠธ๋ฆผ์„ ๋ฐ›์œผ๋ฉด์„œ ์ด๋ฏธ์ง€/ํ…์ŠคํŠธ ๊ตฌ๋ถ„ ์ฒ˜๋ฆฌ
126
  for chunk in client.models.generate_content_stream(
127
  model=model,
128
  contents=contents,
@@ -148,8 +150,28 @@ def generate_by_google_genai(text, file_name, model="gemini-2.0-flash-exp"):
148
  return image_path, text_response
149
 
150
  #######################################
151
- # 3. Gradio ํ•จ์ˆ˜
152
- # (1) FLUX๋กœ ์ด๋ฏธ์ง€ ์ƒ์„ฑ -> (2) Google GenAI๋กœ ํ…์ŠคํŠธ ๊ต์ฒด
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
153
  #######################################
154
 
155
  def generate_initial_image(prompt, text, height, width, steps, scale, seed):
@@ -162,8 +184,7 @@ def generate_initial_image(prompt, text, height, width, steps, scale, seed):
162
  combined_prompt = prompt.replace("<text>", text)
163
  else:
164
  combined_prompt = f"{prompt} with clear readable text that says '{text}'"
165
-
166
- # ๋””๋ฒ„๊ทธ์šฉ: ์ตœ์ข… ๋“ค์–ด๊ฐ€๋Š” ํ”„๋กฌํ”„ํŠธ๋ฅผ ํ™•์ธ
167
  print(f"[DEBUG] Final combined_prompt: {combined_prompt}")
168
 
169
  with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
@@ -183,47 +204,43 @@ def change_text_in_image(original_image, new_text):
183
  """
184
  Google GenAI์˜ gemini ๋ชจ๋ธ์„ ํ†ตํ•ด,
185
  ์—…๋กœ๋“œ๋œ ์ด๋ฏธ์ง€ ๋‚ด๋ถ€์˜ ๋ฌธ๊ตฌ๋ฅผ `new_text`๋กœ ๋ณ€๊ฒฝํ•ด์ฃผ๋Š” ํ•จ์ˆ˜.
 
186
  """
187
  try:
188
  with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
189
  original_path = tmp.name
190
  original_image.save(original_path)
191
 
192
- # Gemini ๋ชจ๋ธ ํ˜ธ์ถœ
193
  image_path, text_response = generate_by_google_genai(
194
  text=f"Change the text in this image to: '{new_text}'",
195
  file_name=original_path
196
  )
197
 
198
  if image_path:
199
- # Gradio ๊ตฌ๋ฒ„์ „์—๋Š” decode_base64_to_image๊ฐ€ ์—†์œผ๋ฏ€๋กœ PIL๋กœ ์ฒ˜๋ฆฌ
200
  with open(image_path, "rb") as f:
201
  image_data = f.read()
202
  modified_img = Image.open(io.BytesIO(image_data))
203
  return modified_img, ""
204
  else:
205
- # ์ด๋ฏธ์ง€๊ฐ€ ์—†์ด ํ…์ŠคํŠธ๋งŒ ๋ฐ˜ํ™˜๋œ ๊ฒฝ์šฐ
206
  return None, text_response
207
 
208
  except Exception as e:
209
  raise gr.Error(f"Error: {e}")
210
 
211
  #######################################
212
- # 4. Gradio ์ธํ„ฐํŽ˜์ด์Šค ๊ตฌ์„ฑ
213
  #######################################
214
 
215
- with gr.Blocks(title="Flux + Google GenAI Text Replacement") as demo:
216
  gr.Markdown(
217
  """
218
- # Flux ๊ธฐ๋ฐ˜ ์ด๋ฏธ์ง€ ์ƒ์„ฑ + Google GenAI๋ฅผ ํ†ตํ•œ ํ…์ŠคํŠธ ๋ณ€ํ™˜
219
 
220
- **Usage**:
221
- - You can include `<text>` in the prompt. For example:
222
- `white cat with speech bubble says <text>`
223
- - Then, type the actual text in "Text to Include in the Image" (ex: "Hello" or "์•ˆ๋…•").
224
- - If `<text>` is not found in your prompt, the text will be automatically appended as:
225
- `with clear readable text that says '<text>'`.
226
- - Finally, you can optionally change the text again via Gemini.
227
 
228
  ---
229
  """
@@ -253,25 +270,47 @@ with gr.Blocks(title="Flux + Google GenAI Text Replacement") as demo:
253
  generated_image = gr.Image(label="Generated Image (with text)", type="pil")
254
 
255
  with gr.Column():
256
- gr.Markdown("## 2) Step 2: ์ƒ์„ฑ๋œ ์ด๋ฏธ์ง€ ๋‚ด ํ…์ŠคํŠธ ์ˆ˜์ •")
 
 
 
 
 
257
  new_text_input = gr.Textbox(
258
- label="์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ",
259
- placeholder="์˜ˆ) Hello world"
260
  )
261
- modify_btn = gr.Button("Change Text in Image via Gemini", variant="secondary")
 
 
 
 
 
262
  output_img = gr.Image(label="Modified Image", type="pil")
263
  output_txt = gr.Textbox(label="(If only text returned)")
264
 
265
- # ๋ฒ„ํŠผ ์•ก์…˜ ์—ฐ๊ฒฐ
 
 
266
  generate_btn.click(
267
  fn=generate_initial_image,
268
  inputs=[prompt_input, text_input, height, width, steps, scale, seed],
269
  outputs=[generated_image]
270
  )
271
 
272
- modify_btn.click(
 
 
 
 
 
 
 
 
 
 
273
  fn=change_text_in_image,
274
- inputs=[generated_image, new_text_input],
275
  outputs=[output_img, output_txt]
276
  )
277
 
 
7
  import mimetypes
8
  import json
9
  import io
10
+ import random
11
+ import string
12
 
13
  import torch
14
  from PIL import Image
 
124
  # ์ž„์‹œ ํŒŒ์ผ๋กœ ์ด๋ฏธ์ง€ ๋ฐ›์„ ์ค€๋น„
125
  with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
126
  temp_path = tmp.name
127
+ # ์‘๋‹ต ์ŠคํŠธ๋ฆผ ์ฒ˜๋ฆฌ
128
  for chunk in client.models.generate_content_stream(
129
  model=model,
130
  contents=contents,
 
150
  return image_path, text_response
151
 
152
  #######################################
153
+ # 3. ์ž„์˜ ์•ŒํŒŒ๋ฒณ ์ƒ์„ฑ์šฉ ํ•จ์ˆ˜
154
+ #######################################
155
+
156
+ def generate_random_letters(length: int) -> str:
157
+ """
158
+ length ๊ธธ์ด์˜ ์ž„์˜์˜ ์•ŒํŒŒ๋ฒณ ๋ฌธ์ž์—ด์„ ์ƒ์„ฑํ•ด ๋ฐ˜ํ™˜.
159
+ ๋Œ€๋ฌธ์ž+์†Œ๋ฌธ์ž(a-z, A-Z) ๋ฒ”์œ„์—์„œ ๋žœ๋ค ๋ฝ‘๊ธฐ.
160
+ """
161
+ letters = string.ascii_uppercase + string.ascii_lowercase
162
+ return "".join(random.choice(letters) for _ in range(length))
163
+
164
+ def fill_text_input_with_random(new_text: str) -> str:
165
+ """
166
+ "์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ"์˜ ๊ธธ์ด๋ฅผ ์„ธ์–ด, ๊ทธ ๊ธธ์ด๋งŒํผ ์ž„์˜์˜ ์•ŒํŒŒ๋ฒณ ๋ฌธ์ž์—ด ์ƒ์„ฑ ํ›„ ๋ฐ˜ํ™˜.
167
+ ์ด ๋ฐ˜ํ™˜๊ฐ’์ด ๊ณง "์ด๋ฏธ์ง€ ์•ˆ์— ๋“ค์–ด๊ฐˆ ํ…์ŠคํŠธ" UI(=text_input)์— ํ‘œ์‹œ๋จ.
168
+ """
169
+ length = len(new_text)
170
+ random_letters = generate_random_letters(length)
171
+ return random_letters
172
+
173
+ #######################################
174
+ # 4. Gradio ํ•จ์ˆ˜
175
  #######################################
176
 
177
  def generate_initial_image(prompt, text, height, width, steps, scale, seed):
 
184
  combined_prompt = prompt.replace("<text>", text)
185
  else:
186
  combined_prompt = f"{prompt} with clear readable text that says '{text}'"
187
+
 
188
  print(f"[DEBUG] Final combined_prompt: {combined_prompt}")
189
 
190
  with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
 
204
  """
205
  Google GenAI์˜ gemini ๋ชจ๋ธ์„ ํ†ตํ•ด,
206
  ์—…๋กœ๋“œ๋œ ์ด๋ฏธ์ง€ ๋‚ด๋ถ€์˜ ๋ฌธ๊ตฌ๋ฅผ `new_text`๋กœ ๋ณ€๊ฒฝํ•ด์ฃผ๋Š” ํ•จ์ˆ˜.
207
+ (์—ฌ๊ธฐ์„œ๋Š” new_text๊ฐ€ ์ด๋ฏธ ์ž„์˜์˜ ์•ŒํŒŒ๋ฒณ์œผ๋กœ ์ฑ„์›Œ์ง„ ์ƒํƒœ๊ฐ€ ๋จ)
208
  """
209
  try:
210
  with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
211
  original_path = tmp.name
212
  original_image.save(original_path)
213
 
 
214
  image_path, text_response = generate_by_google_genai(
215
  text=f"Change the text in this image to: '{new_text}'",
216
  file_name=original_path
217
  )
218
 
219
  if image_path:
 
220
  with open(image_path, "rb") as f:
221
  image_data = f.read()
222
  modified_img = Image.open(io.BytesIO(image_data))
223
  return modified_img, ""
224
  else:
 
225
  return None, text_response
226
 
227
  except Exception as e:
228
  raise gr.Error(f"Error: {e}")
229
 
230
  #######################################
231
+ # 5. Gradio ์ธํ„ฐํŽ˜์ด์Šค ๊ตฌ์„ฑ
232
  #######################################
233
 
234
+ with gr.Blocks(title="Flux + Google GenAI + Random Text Replacement") as demo:
235
  gr.Markdown(
236
  """
237
+ # Flux ๊ธฐ๋ฐ˜ ์ด๋ฏธ์ง€ ์ƒ์„ฑ + Google GenAI + ์ž„์˜ ์•ŒํŒŒ๋ฒณ ์น˜ํ™˜
238
 
239
+ **๊ธฐ๋Šฅ ์š”์•ฝ**
240
+ 1) "์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ"์— ์ž…๋ ฅ๋œ ๋ฌธ์ž์—ด ๊ธธ์ด๋ฅผ ์ธก์ •
241
+ 2) ๊ทธ ๊ธธ์ด๋งŒํผ **๋ฌด์ž‘์œ„ ์•ŒํŒŒ๋ฒณ**(๋Œ€์†Œ๋ฌธ์ž)์œผ๋กœ ๊ตฌ์„ฑ๋œ ๋ฌธ์ž์—ด์„ ๋งŒ๋“ค์–ด
242
+ 3) "์ด๋ฏธ์ง€ ์•ˆ์— ๋“ค์–ด๊ฐˆ ํ…์ŠคํŠธ" ์นธ์— ์ž๋™์œผ๋กœ ์ž…๋ ฅ (์ฆ‰, ์‹ค์ œ ๋ฐ”๋€” ํ…์ŠคํŠธ๋Š” ์™„์ „ํžˆ ๋žœ๋ค)
243
+ 4) ๊ทธ ํ›„ Google GenAI(gemini)๋กœ ์ด๋ฏธ์ง€ ๋ฌธ์ž๋ฅผ ๊ต์ฒด
 
 
244
 
245
  ---
246
  """
 
270
  generated_image = gr.Image(label="Generated Image (with text)", type="pil")
271
 
272
  with gr.Column():
273
+ gr.Markdown(
274
+ """
275
+ ## 2) Step 2: "์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ" ๊ธธ์ด๋ฅผ ๊ธฐ์ค€์œผ๋กœ
276
+ ์ž„์˜ ์•ŒํŒŒ๋ฒณ์„ "์ด๋ฏธ์ง€ ์•ˆ์— ๋“ค์–ด๊ฐˆ ํ…์ŠคํŠธ"๋กœ ์ž๋™ ์„ค์ • โ†’ ์ด๋ฏธ์ง€ ๊ต์ฒด
277
+ """
278
+ )
279
  new_text_input = gr.Textbox(
280
+ label="์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ (์ž…๋ ฅ๋œ ๊ธธ์ด๋ฅผ ๊ธฐ์ค€์œผ๋กœ ๋ฌด์ž‘์œ„ ์•ŒํŒŒ๋ฒณ ์ƒ์„ฑ)",
281
+ placeholder="์˜ˆ) Hello123 (๊ธธ์ด 8์ด๋ฉด, 8๊ธ€์ž ๋žœ๋ค)"
282
  )
283
+
284
+ # (A) ๋จผ์ € "์ƒˆ๋กœ ๋ฐ”๊ฟ€ ํ…์ŠคํŠธ" ๊ธ€์ž์ˆ˜๋ฅผ ์„ธ์–ด, ๋ฌด์ž‘์œ„ ์•ŒํŒŒ๋ฒณ์œผ๋กœ text_input ์ฑ„์šฐ๊ธฐ
285
+ # (B) ๊ทธ๋Ÿฐ ๋’ค change_text_in_image() ์‹คํ–‰
286
+ modify_btn = gr.Button("Generate Random Letters & Change Text in Image", variant="secondary")
287
+
288
+ # ์ตœ์ข… ๊ฒฐ๊ณผ
289
  output_img = gr.Image(label="Modified Image", type="pil")
290
  output_txt = gr.Textbox(label="(If only text returned)")
291
 
292
+ ###########################
293
+ # 1) Step1 ๋ฒ„ํŠผ ์•ก์…˜
294
+ ###########################
295
  generate_btn.click(
296
  fn=generate_initial_image,
297
  inputs=[prompt_input, text_input, height, width, steps, scale, seed],
298
  outputs=[generated_image]
299
  )
300
 
301
+ ###########################
302
+ # 2) Step2 ๋ฒ„ํŠผ ์•ก์…˜
303
+ ###########################
304
+ # (A) ๋ฌด์ž‘์œ„ ์•ŒํŒŒ๋ฒณ ์ƒ์„ฑํ•ด text_input์— ๋ฐ˜์˜
305
+ chain = modify_btn.click(
306
+ fn=fill_text_input_with_random,
307
+ inputs=[new_text_input],
308
+ outputs=[text_input]
309
+ )
310
+ # (B) ๋ฐฉ๊ธˆ ์—…๋ฐ์ดํŠธ๋œ text_input ๊ฐ’์„ ์ด์šฉํ•ด, ์ด๋ฏธ์ง€ ํ…์ŠคํŠธ ๊ต์ฒด
311
+ chain.then(
312
  fn=change_text_in_image,
313
+ inputs=[generated_image, text_input],
314
  outputs=[output_img, output_txt]
315
  )
316