SeedEdit-APP / app.py
Peng-Wang's picture
text
d86ec56
raw
history blame
6 kB
# Copyright (2024) Bytedance Ltd. and/or its affiliates
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
from __future__ import annotations
import os
import random
import uuid
import gradio as gr
import numpy as np
from loguru import logger
from caller import (
SeedT2ICaller,
SeedEditCaller
)
from PIL import Image
help_text = """
## How to use this Demo
Step 1. Type in the caption/instruction text box, and click "Generate" to generate an initial image using Seed-T2I.
Step 2. Type in the caption/instruction text box, and click "Edit" to edit the current image using Seed-Edit.
This is a demo with limited QPS and a simple interface.
For a better experience, please use [Doubao](https://www.doubao.com/chat/)/[Dreamina](https://dreamina.capcut.com/ai-tool/image/generate) APP.
- The current demo does not support multi-round editing, which may lead to overexposure with multiple rounds of upload and download edits.
- Higher-quality input images will produce higher-quality edited results. For low-quality images, unwanted changes, e.g. facial id, may occur.
<font size=2>Note: This demo is governed by the license of CC BY-NC \
We strongly advise users not to knowingly generate or allow others to knowingly generate harmful content, \
including hate speech, violence, pornography, deception, etc. \
(注:本演示受CC BY-NC的许可协议限制。我们强烈建议,用户不应传播及不应允许他人传播以下内容,\
包括但不限于仇恨言论、暴力、色情、欺诈相关的有害信息。)
"""
example_instructions = [
"Make it a picasso painting",
"close its eye",
"convert to a bronze statue",
"make it wearing a hat",
"make it wearing a PhD suit",
"Turn it into an anime.",
"have it look like a graphic novel",
"make it gain weight",
"what would he look like bald?",
"Have it smile",
"Put in a cocktail party.",
"move to the beach.",
"add dramatic lighting",
"Convert to black and white",
"What if it were snowing?",
"Give a leather jacket",
"Turn into a cyborg!",
]
def main():
resolution = 1024
cfg = {"resolution": resolution}
model_t2i = SeedT2ICaller(cfg)
cfg_edit = {}
model_edit = SeedEditCaller(cfg_edit)
logger.info("All models loaded")
def load_example():
example_image = Image.open(f"uni_test/test.jpg").convert("RGB")
example_instruction = random.choice(example_instructions)
edited_image, example_instruction = generate(example_image,
example_instruction,
cfg_scale=0.5)
return example_image, example_instruction, edited_image
def generate_t2i(instruction: str, cfg_scale: float = 0.5):
if not instruction:
return None, ""
logger.info("Generate images ...")
# Call model and capture the status
gen_image, success = model_t2i.generate(instruction, batch_size=1, cfg_scale=cfg_scale)
if not success or gen_image is None:
logger.error("Image generation failed or returned None. please retry")
return None, instruction
return gen_image, instruction
def generate(input_image: Image.Image, instruction: str = None, cfg_scale: float = 0.5):
logger.info("Generating images ...")
if not instruction or input_image is None:
return input_image, ""
logger.info("Running diffusion models ...")
edited_image, success = model_edit.edit(input_image, instruction, batch_size=1, cfg_scale=cfg_scale)
if not success or edited_image is None:
logger.error("Image editting failed or returned None.")
return None, instruction
return edited_image, instruction
def reset():
return None, None, ""
with gr.Blocks(css="footer {visibility: hidden}") as demo:
with gr.Row():
with gr.Column(scale=1, min_width=100):
generate_button = gr.Button("Generate")
with gr.Column(scale=1, min_width=100):
edit_button = gr.Button("Edit")
with gr.Column(scale=1, min_width=100):
load_button = gr.Button("Load Example")
with gr.Column(scale=1, min_width=100):
reset_button = gr.Button("Reset")
with gr.Row():
with gr.Column(scale=3):
instruction = gr.Textbox(lines=1, label="Caption/Edit Instruction", interactive=True, value=None)
with gr.Column(scale=1):
cfg_scale = gr.Slider(value=0.5, minimum=0.0, maximum=1.0, step=0.1, label="Edit/Text Strength (CFG)", interactive=True)
with gr.Row():
input_image = gr.Image(label="Input Image", type="pil", interactive=True,
height=resolution, width=resolution)
edited_image = gr.Image(label="Edited Image", type="pil", interactive=False,
height=resolution, width=resolution)
gr.Markdown(help_text)
load_button.click(
fn=load_example,
inputs=[],
outputs=[input_image, instruction, edited_image]
)
generate_button.click(
fn=generate_t2i,
inputs=[instruction, cfg_scale],
outputs=[input_image, instruction]
)
edit_button.click(
fn=generate,
inputs=[input_image, instruction, cfg_scale],
outputs=[edited_image, instruction]
)
reset_button.click(
fn=reset,
inputs=[],
outputs=[input_image, edited_image, instruction]
)
# demo.launch(server_name="0.0.0.0", server_port=8024)
demo.queue().launch(share=False)
if __name__ == "__main__":
main()