Spaces:

ByteDance
/

SeedEdit-APP

Running

App Files Files Community

SeedEdit-APP / app.py

Peng-Wang

text

d86ec56 13 days ago

raw

history blame

6 kB

	# Copyright (2024) Bytedance Ltd. and/or its affiliates
	#
	# This source code is licensed under the license found in the
	# LICENSE file in the root directory of this source tree.

	from __future__ import annotations
	import os
	import random
	import uuid

	import gradio as gr
	import numpy as np

	from loguru import logger
	from caller import (
	SeedT2ICaller,
	SeedEditCaller
	)
	from PIL import Image

	# Markdown shown under the image panes: usage steps, known limitations, and
	# the bilingual (English/Chinese) licence and content notice.
	help_text = """
	## How to use this Demo
	Step 1. Type in the caption/instruction text box, and click "Generate" to generate an initial image using Seed-T2I.

	Step 2. Type in the caption/instruction text box, and click "Edit" to edit the current image using Seed-Edit.

	This is a demo with limited QPS and a simple interface.
	For a better experience, please use [Doubao](https://www.doubao.com/chat/)/[Dreamina](https://dreamina.capcut.com/ai-tool/image/generate) APP.

	- The current demo does not support multi-round editing, which may lead to overexposure with multiple rounds of upload and download edits.
	- Higher-quality input images will produce higher-quality edited results. For low-quality images, unwanted changes, e.g. facial id, may occur.

	<font size=2>Note: This demo is governed by the license of CC BY-NC. \
	We strongly advise users not to knowingly generate or allow others to knowingly generate harmful content, \
	including hate speech, violence, pornography, deception, etc. \
	(注：本演示受CC BY-NC的许可协议限制。我们强烈建议，用户不应传播及不应允许他人传播以下内容，\
	包括但不限于仇恨言论、暴力、色情、欺诈相关的有害信息。)</font>
	"""

	# Pool of sample edit instructions; load_example() in main() picks one at
	# random (random.choice) and applies it to the bundled example image.
	example_instructions = [
	"Make it a picasso painting",
	"close its eye",
	"convert to a bronze statue",
	"make it wearing a hat",
	"make it wearing a PhD suit",
	"Turn it into an anime.",
	"have it look like a graphic novel",
	"make it gain weight",
	"what would he look like bald?",
	"Have it smile",
	"Put in a cocktail party.",
	"move to the beach.",
	"add dramatic lighting",
	"Convert to black and white",
	"What if it were snowing?",
	"Give a leather jacket",
	"Turn into a cyborg!",
	]

	def main():
	    """Build the Gradio demo for Seed-T2I generation and Seed-Edit editing, then launch it.

	    Creates one ``SeedT2ICaller`` and one ``SeedEditCaller``, defines the
	    button callbacks as closures over them, lays out the UI, wires the
	    buttons to the callbacks, and starts the app with queuing enabled.
	    """
	    resolution = 1024
	    cfg = {"resolution": resolution}
	    model_t2i = SeedT2ICaller(cfg)

	    cfg_edit = {}
	    model_edit = SeedEditCaller(cfg_edit)
	    logger.info("All models loaded")

	    def load_example():
	        """Load the bundled example image and edit it with a random instruction.

	        Returns:
	            ``(example_image, instruction, edited_image)``, matching the
	            outputs wired to the "Load Example" button. ``edited_image``
	            is ``None`` when the edit fails.
	        """
	        # Open inside a context manager so the file handle is released
	        # deterministically; convert() returns a separate, loaded image
	        # that stays valid after the file is closed.
	        with Image.open("uni_test/test.jpg") as source:
	            example_image = source.convert("RGB")
	        example_instruction = random.choice(example_instructions)
	        edited_image, example_instruction = generate(
	            example_image,
	            example_instruction,
	            cfg_scale=0.5,
	        )
	        return example_image, example_instruction, edited_image

	    def generate_t2i(instruction: str, cfg_scale: float = 0.5):
	        """Generate an initial image from a caption with the text-to-image model.

	        Args:
	            instruction: Caption text from the instruction box.
	            cfg_scale: Strength value taken from the slider.

	        Returns:
	            ``(image, instruction)``. The image is ``None`` when the
	            caption is empty (the instruction is then returned as ``""``)
	            or when the model call reports failure.
	        """
	        if not instruction:
	            return None, ""

	        logger.info("Generate images ...")
	        # The caller returns the image together with a success flag.
	        gen_image, success = model_t2i.generate(instruction, batch_size=1, cfg_scale=cfg_scale)
	        if not success or gen_image is None:
	            logger.error("Image generation failed or returned None. please retry")
	            return None, instruction
	        return gen_image, instruction

	    def generate(
	        input_image: Image.Image | None,
	        instruction: str | None = None,
	        cfg_scale: float = 0.5,
	    ):
	        """Edit ``input_image`` according to ``instruction`` with the edit model.

	        Args:
	            input_image: Image currently in the input pane, or ``None``.
	            instruction: Edit instruction text.
	            cfg_scale: Strength value taken from the slider.

	        Returns:
	            ``(edited_image, instruction)``. With no instruction or no
	            input image, the input image is passed through unchanged and
	            the instruction is returned as ``""``. When the model call
	            reports failure, the image is ``None``.
	        """
	        logger.info("Generating images ...")
	        if not instruction or input_image is None:
	            return input_image, ""

	        logger.info("Running diffusion models ...")
	        edited_image, success = model_edit.edit(input_image, instruction, batch_size=1, cfg_scale=cfg_scale)
	        if not success or edited_image is None:
	            logger.error("Image editting failed or returned None.")
	            return None, instruction

	        return edited_image, instruction

	    def reset():
	        """Clear both image panes and the instruction box."""
	        return None, None, ""

	    with gr.Blocks(css="footer {visibility: hidden}") as demo:
	        # Row 1: the four action buttons, one per equally weighted column.
	        with gr.Row():
	            with gr.Column(scale=1, min_width=100):
	                generate_button = gr.Button("Generate")
	            with gr.Column(scale=1, min_width=100):
	                edit_button = gr.Button("Edit")
	            with gr.Column(scale=1, min_width=100):
	                load_button = gr.Button("Load Example")
	            with gr.Column(scale=1, min_width=100):
	                reset_button = gr.Button("Reset")

	        # Row 2: instruction text box next to the strength slider.
	        with gr.Row():
	            with gr.Column(scale=3):
	                instruction = gr.Textbox(lines=1, label="Caption/Edit Instruction", interactive=True, value=None)
	            with gr.Column(scale=1):
	                cfg_scale = gr.Slider(value=0.5, minimum=0.0, maximum=1.0, step=0.1, label="Edit/Text Strength (CFG)", interactive=True)

	        # Row 3: editable input image beside the read-only result.
	        with gr.Row():
	            input_image = gr.Image(label="Input Image", type="pil", interactive=True,
	                                   height=resolution, width=resolution)
	            edited_image = gr.Image(label="Edited Image", type="pil", interactive=False,
	                                    height=resolution, width=resolution)

	        gr.Markdown(help_text)

	        # Event wiring: each output list is ordered to match the tuple
	        # returned by the corresponding callback.
	        load_button.click(
	            fn=load_example,
	            inputs=[],
	            outputs=[input_image, instruction, edited_image],
	        )
	        generate_button.click(
	            fn=generate_t2i,
	            inputs=[instruction, cfg_scale],
	            outputs=[input_image, instruction],
	        )
	        edit_button.click(
	            fn=generate,
	            inputs=[input_image, instruction, cfg_scale],
	            outputs=[edited_image, instruction],
	        )
	        reset_button.click(
	            fn=reset,
	            inputs=[],
	            outputs=[input_image, edited_image, instruction],
	        )

	    # NOTE: to bind an explicit host/port instead, use
	    # demo.launch(server_name="0.0.0.0", server_port=8024).
	    demo.queue().launch(share=False)

	# Start the demo only when this file is executed as a script, not on import.
	if __name__ == "__main__":
	    main()