Peng-Wang committed
Commit 959541f · 0 Parent(s)

Start fresh from current state

Files changed (8)
  1. .gitignore +1 -0
  2. LICENSE +11 -0
  3. README.md +35 -0
  4. app.py +152 -0
  5. app_future.py +168 -0
  6. caller.py +124 -0
  7. requirements.txt +5 -0
  8. uni_test/test.jpg +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
+ *.pyc
LICENSE ADDED
@@ -0,0 +1,11 @@
+ This work is licensed under a Creative Commons Attribution-NonCommercial 4.0 International License.
+
+ You are free to:
+ - Share — copy and redistribute the material in any medium or format
+ - Adapt — remix, transform, and build upon the material
+
+ Under the following terms:
+ - Attribution — You must give appropriate credit, provide a link to the license, and indicate if changes were made. You may do so in any reasonable manner, but not in any way that suggests the licensor endorses you or your use.
+ - NonCommercial — You may not use the material for commercial purposes.
+
+ No additional restrictions — You may not apply legal terms or technological measures that legally restrict others from doing anything the license permits.
README.md ADDED
@@ -0,0 +1,35 @@
+ # Seed-Edit-APP
+
+ This repository contains the code for the **Seed-Edit** application. Seed-Edit is designed to simplify and enhance image editing using advanced algorithms and data-driven insights.
+
+ ## Overview
+
+ Seed-Edit provides an intuitive interface and integrates with state-of-the-art tools to streamline your editing experience. The app leverages robust models to offer editing options tailored to user needs.
+
+ ## Additional Resources
+
+ For more information and trials, please visit the official [Seed-Edit webpage](https://team.doubao.com/seed-edit) or use the **[Doubao](https://www.doubao.com/chat/)** and **[Dreamina](https://dreamina.capcut.com/ai-tool/image/generate)** apps.
+
+ ## License
+
+ This project is licensed under the CC BY-NC license. See `LICENSE` for more information.
+
+ ## Safety
+
+ <font size=2>
+ We strongly advise users not to knowingly generate, or allow others to knowingly generate, harmful content,
+ including hate, violence, pornography, deception, etc.
+ (注:本演示受CC BY-NC的许可协议限制。我们强烈建议,用户不应传播及不应允许他人传播以下内容,包括但不限于仇恨、暴力、色情、欺诈相关的有害信息。)
+
+ ---
+ title: Seed-Edit
+ emoji: 🌖
+ colorFrom: blue
+ colorTo: red
+ sdk: gradio
+ sdk_version: 4.44.1
+ app_file: app.py
+ pinned: false
+ license: other
+ ---
app.py ADDED
@@ -0,0 +1,152 @@
+ # Copyright (2024) Bytedance Ltd. and/or its affiliates
+ #
+ # This source code is licensed under the license found in the
+ # LICENSE file in the root directory of this source tree.
+
+ from __future__ import annotations
+ import os
+ import random
+ import uuid
+
+ import gradio as gr
+ import numpy as np
+
+ from loguru import logger
+ from caller import (
+     SeedT2ICaller,
+     SeedEditCaller
+ )
+ from PIL import Image
+
+ help_text = """
+ ## How to use this Demo
+ 1. Type in the caption/instruction text box, and click "Generate" to generate an initial image using Seed-T2I.
+ 2. Type in the caption/instruction text box, and click "Edit" to edit the current image using Seed-Edit.
+
+ This is a demo with limited QPS and a simple interface.
+ For a better experience, please use the Doubao/Dreamina app.
+
+ <font size=2>Note: This demo is governed by the CC BY-NC license. \
+ We strongly advise users not to knowingly generate or allow others to knowingly generate harmful content, \
+ including hate speech, violence, pornography, deception, etc. \
+ (注:本演示受CC BY-NC的许可协议限制。我们强烈建议,用户不应传播及不应允许他人传播以下内容,\
+ 包括但不限于仇恨言论、暴力、色情、欺诈相关的有害信息。)
+ """
+
+ example_instructions = [
+     "Make it a picasso painting",
+     "close its eye",
+     "convert to a bronze statue",
+     "make it wearing a hat",
+     "make it wearing a PhD suit",
+     "Turn it into an anime.",
+     "have it look like a graphic novel",
+     "make it gain weight",
+     "what would he look like bald?",
+     "Have it smile",
+     "Put in a cocktail party.",
+     "move to the beach.",
+     "add dramatic lighting",
+     "Convert to black and white",
+     "What if it were snowing?",
+     "Give a leather jacket",
+     "Turn into a cyborg!",
+ ]
+
+ def main():
+     resolution = 1024
+     cfg = {"resolution": resolution}
+     model_t2i = SeedT2ICaller(cfg)
+
+     cfg_edit = {}
+     model_edit = SeedEditCaller(cfg_edit)
+     logger.info("All models loaded")
+
+     def load_example():
+         example_image = Image.open("uni_test/test.jpg").convert("RGB")
+         example_instruction = random.choice(example_instructions)
+         edited_image, example_instruction = generate(example_image,
+                                                      example_instruction,
+                                                      cfg_scale=0.5)
+         return example_image, example_instruction, edited_image
+
+     def generate_t2i(instruction: str, cfg_scale: float = 0.5):
+         if not instruction:
+             return None, ""
+
+         logger.info("Generating images ...")
+         # Call the model and capture the status flag it returns.
+         gen_image, success = model_t2i.generate(instruction, batch_size=1, cfg_scale=cfg_scale)
+         if not success or gen_image is None:
+             logger.error("Image generation failed or returned None. Please retry.")
+             return None, instruction
+         return gen_image, instruction
+
+     def generate(input_image: Image.Image, instruction: str = None, cfg_scale: float = 0.5):
+         logger.info("Generating images ...")
+         if not instruction or input_image is None:
+             return input_image, ""
+
+         logger.info("Running diffusion models ...")
+         edited_image, success = model_edit.edit(input_image, instruction, batch_size=1, cfg_scale=cfg_scale)
+         if not success or edited_image is None:
+             logger.error("Image editing failed or returned None.")
+             return None, instruction
+
+         return edited_image, instruction
+
+     def reset():
+         return None, None, ""
+
+     with gr.Blocks(css="footer {visibility: hidden}") as demo:
+         with gr.Row():
+             with gr.Column(scale=1, min_width=100):
+                 generate_button = gr.Button("Generate")
+             with gr.Column(scale=1, min_width=100):
+                 edit_button = gr.Button("Edit")
+             with gr.Column(scale=1, min_width=100):
+                 load_button = gr.Button("Load Example")
+             with gr.Column(scale=1, min_width=100):
+                 reset_button = gr.Button("Reset")
+
+         with gr.Row():
+             with gr.Column(scale=3):
+                 instruction = gr.Textbox(lines=1, label="Edit/Caption Instruction", interactive=True, value=None)
+             with gr.Column(scale=1):
+                 cfg_scale = gr.Slider(value=0.5, minimum=0.0, maximum=1.0, step=0.1, label="Edit/Text Strength (CFG)", interactive=True)
+
+         with gr.Row():
+             input_image = gr.Image(label="Input Image", type="pil", interactive=True,
+                                    height=resolution, width=resolution)
+             edited_image = gr.Image(label="Edited Image", type="pil",
+                                     interactive=False, height=resolution, width=resolution)
+
+         gr.Markdown(help_text)
+
+         load_button.click(
+             fn=load_example,
+             inputs=[],
+             outputs=[input_image, instruction, edited_image]
+         )
+         generate_button.click(
+             fn=generate_t2i,
+             inputs=[instruction, cfg_scale],
+             outputs=[input_image, instruction]
+         )
+         edit_button.click(
+             fn=generate,
+             inputs=[input_image, instruction, cfg_scale],
+             outputs=[edited_image, instruction]
+         )
+         reset_button.click(
+             fn=reset,
+             inputs=[],
+             outputs=[input_image, edited_image, instruction]
+         )
+
+     # demo.launch(server_name="0.0.0.0", server_port=8024)
+     demo.queue().launch(share=False)
+
+ if __name__ == "__main__":
+     main()
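The two button callbacks above are thin wrappers around `SeedT2ICaller.generate` and `SeedEditCaller.edit`. As a rough illustration, the same generate-then-edit flow can be exercised without the Gradio UI; this is a minimal sketch only, the prompt strings are placeholders, and it assumes `caller.py` from this commit is importable and the remote API is reachable:

```python
# Minimal sketch of app.py's Generate -> Edit flow, run headlessly.
# Assumes caller.py from this commit is on the import path and the backend API is reachable.
from caller import SeedT2ICaller, SeedEditCaller


def run_once(caption: str, instruction: str, cfg_scale: float = 0.5):
    t2i = SeedT2ICaller({"resolution": 1024})
    editor = SeedEditCaller({})

    # Step 1: text-to-image, mirroring generate_t2i() above.
    image, ok = t2i.generate(caption, batch_size=1, cfg_scale=cfg_scale)
    if not ok or image is None:
        raise RuntimeError("text-to-image call failed")

    # Step 2: instruction-based edit, mirroring generate() above.
    edited, ok = editor.edit(image, instruction, batch_size=1, cfg_scale=cfg_scale)
    if not ok or edited is None:
        raise RuntimeError("edit call failed")
    return image, edited


if __name__ == "__main__":
    # Placeholder prompts for illustration only.
    original, edited = run_once("a corgi wearing sunglasses", "convert to a bronze statue")
    edited.save("edited.jpg")
```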
app_future.py ADDED
@@ -0,0 +1,168 @@
+ # Copyright (2024) Bytedance Ltd. and/or its affiliates
+ #
+ # This source code is licensed under the license found in the
+ # LICENSE file in the root directory of this source tree.
+
+ from __future__ import annotations
+ import uuid
+
+ from loguru import logger
+ import hashlib
+ import gradio as gr
+
+ import io
+ import base64
+
+ from caller import (
+     SeedT2ICaller,
+     SeedEditCaller
+ )
+ from PIL import Image
+
+ API_KEY = ""
+ help_text = """
+ ## How to use this Demo
+ 1. Type in the caption/instruction text box, and click "Generate" to generate an initial image using Seed_T2I_V14 (CFG and steps are not used here).
+ 2. Type in the caption/instruction text box, and click "Edit" to edit the current image.
+ 3. Click "Undo" if you are not satisfied with the current result and want to re-edit; otherwise, the next edit is applied to the current result.
+ 4. Currently, we do not support many rounds of editing [as shown in our video], since the current API has not yet been updated to the new model.
+
+ This is a demo with limited QPS and a simple interface.
+ For a better experience, please use the Doubao/Dreamina app.
+
+ <font size=2>Note: This demo is governed by the CC BY-NC license. \
+ We strongly advise users not to knowingly generate or allow others to knowingly generate harmful content, \
+ including hate speech, violence, pornography, deception, etc. \
+ (注:本演示受CC BY-NC的许可协议限制。我们强烈建议,用户不应传播及不应允许他人传播以下内容,\
+ 包括但不限于仇恨言论、暴力、色情、欺诈相关的有害信息。)
+ """
+
+ def image2str(image):
+     buf = io.BytesIO()
+     image.save(buf, format="PNG")
+     i_str = base64.b64encode(buf.getvalue()).decode()
+     return f'<div style="float:left"><img src="data:image/png;base64, {i_str}"></div>'
+
+ def main():
+     resolution = 1024
+     max_edit_iter = 3
+
+     cfg_t2i = {
+         "resolution": resolution
+     }
+     model_t2i = SeedT2ICaller(cfg_t2i)
+
+     cfg_edit = cfg_t2i
+
+     model_edit = SeedEditCaller(cfg_edit)
+     logger.info("All models loaded")
+
+     def generate_t2i(instruction: str, state):
+         logger.info("Generating images ...")
+         # Call the model to generate an image and capture the result.
+         gen_image, success = model_t2i.generate(instruction, batch_size=1)
+
+         # Check whether generation succeeded and the returned image is valid.
+         if not success or gen_image is None:
+             logger.error("Image generation failed or returned None.")
+             raise ValueError("Image generation was unsuccessful.")
+
+         # Write cache
+         if state is None:
+             state = {}
+
+         output_md5 = hashlib.md5(gen_image.tobytes()).hexdigest()
+         logger.info(output_md5)
+         state[output_md5] = gen_image
+
+         return instruction, gen_image, state
+
+     def generate(prev_image, cur_image, cfg_scale, instruction, state):
+         if len(state.keys()) >= max_edit_iter:
+             return prev_image, cur_image, instruction, state
+
+         try:
+             if cur_image is None:
+                 cur_image = prev_image
+
+             logger.info("Generating edited images ...")
+             if not instruction:
+                 return prev_image, cur_image, instruction, state
+
+             logger.info("Running diffusion models ...")
+
+             image_out = f"./cache/{'-'.join(instruction.split()[:10])[:50]}_{uuid.uuid4()}.jpg"
+             logger.info(f"Input size {cur_image.size}")
+
+             edited_image, success = model_edit.edit(cur_image, instruction, batch_size=1, cfg_scale=cfg_scale, filename=image_out)
+             if not success or edited_image is None:
+                 logger.error("Image editing failed or returned None.")
+                 raise ValueError("Image editing was unsuccessful.")
+
+             output_md5 = hashlib.md5(edited_image.tobytes()).hexdigest()
+             logger.info(f"EDIT adding {output_md5}")
+             state[output_md5] = edited_image
+
+             return cur_image, edited_image, instruction, state
+
+         except Exception as e:
+             logger.error(e)
+             return prev_image, cur_image, instruction, state
+
+     def reset():
+         return 0.5, None, None, "", {}
+
+     def undo(prev_image, cur_image, instruction, state):
+         if cur_image is not None:
+             cur_md5 = hashlib.md5(cur_image.tobytes()).hexdigest()
+             if cur_md5 in state:
+                 logger.info(f"UNDO removing {cur_md5}")
+                 state.pop(cur_md5, None)
+         return prev_image, prev_image, instruction, state
+
+     def show_state(state):
+         num_cache = len(state.keys())
+         return f"Num Cache: {num_cache}" if num_cache < max_edit_iter else "Max edit number reached. Please reset for testing."
+
+     with gr.Blocks(css="footer {visibility: hidden}") as demo:
+         state = gr.State({})
+
+         with gr.Row():
+             with gr.Column(scale=2):
+                 prev_image = gr.Image(label="Input Image", type="pil", interactive=True, visible=False, height=resolution, width=resolution)
+                 cur_image = gr.Image(label="Edited Image", type="pil", interactive=True, height=resolution, width=resolution)
+
+             with gr.Column(scale=1):
+                 with gr.Row():
+                     generate_t2i_button = gr.Button("Generate")
+                     generate_button = gr.Button("Edit")
+                     reset_button = gr.Button("Reset")
+                     undo_button = gr.Button("Undo")
+
+                 with gr.Row():
+                     instruction = gr.Textbox(lines=1, label="Caption (Generate) / Instruction (Edit)", interactive=True)
+
+                 with gr.Row():
+                     cfg_scale = gr.Slider(value=0.5, minimum=0.0, maximum=1.0, step=0.1, label="Edit Strength (CFG)", interactive=True)
+
+                 with gr.Row():
+                     output_label = gr.Label()
+
+         gr.Markdown(help_text)
+
+         # Function bindings
+         generate_t2i_button.click(generate_t2i, [instruction, state], [instruction, cur_image, state])
+         generate_button.click(generate, [prev_image, cur_image, cfg_scale, instruction, state], [prev_image, cur_image, instruction, state])
+         reset_button.click(reset, [], [cfg_scale, prev_image, cur_image, instruction, state])
+         undo_button.click(undo, [prev_image, cur_image, instruction, state], [prev_image, cur_image, instruction, state])
+
+         # Update state display
+         generate_t2i_button.click(show_state, [state], output_label)
+         generate_button.click(show_state, [state], output_label)
+         reset_button.click(show_state, [state], output_label)
+         undo_button.click(show_state, [state], output_label)
+
+     demo.launch(server_name="0.0.0.0", server_port=8024)
+
+ if __name__ == "__main__":
+     main()
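app_future.py tracks edit history in a plain dict keyed by the MD5 of each image's pixel bytes; that is what drives both the Undo button and the `max_edit_iter` cap. Below is a small standalone sketch of the same pattern; the `EditHistory` class is hypothetical and not part of this commit:

```python
# Sketch of the MD5-keyed edit-history cache that app_future.py keeps in gr.State.
# EditHistory is a hypothetical helper, not part of this commit.
import hashlib

from PIL import Image


class EditHistory:
    def __init__(self, max_edits: int = 3):
        self.max_edits = max_edits
        self.cache: dict[str, Image.Image] = {}

    def _key(self, image: Image.Image) -> str:
        # Same fingerprint the demo uses: MD5 of the raw pixel bytes.
        return hashlib.md5(image.tobytes()).hexdigest()

    def full(self) -> bool:
        # Mirrors the len(state) >= max_edit_iter guard in generate().
        return len(self.cache) >= self.max_edits

    def add(self, image: Image.Image) -> None:
        self.cache[self._key(image)] = image

    def undo(self, current: Image.Image) -> None:
        # Dropping the latest result frees a slot and makes the previous image current again.
        self.cache.pop(self._key(current), None)
```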
caller.py ADDED
@@ -0,0 +1,124 @@
+ # Copyright (2024) Bytedance Ltd. and/or its affiliates
+ #
+ # This source code is licensed under the license found in the
+ # LICENSE file in the root directory of this source tree.
+
+ from PIL import Image, ImageFilter
+ from loguru import logger
+ import requests
+ import base64
+ import json
+ import io
+
+ # API endpoint URL
+ t2i_url = 'https://magicarena.bytedance.com/api/evaluate/v1/algo/process'
+
+ # Note: these headers must not be set in the production environment.
+ headers = {
+     'X-TT-ENV': 'ppe_general_20',
+     'X-USE-PPE': '1'
+ }
+
+ class SeedT2ICaller():
+     def __init__(self, cfg, *args, **kwargs):
+         self.cfg = cfg
+
+     def generate(self, text, *args, **kwargs):
+         try:
+             logger.info("Generate images ...")
+             req_json = json.dumps({
+                 "prompt": str(text),
+                 "use_sr": True,
+                 "model_version": "general_v2.0_L",
+                 "req_schedule_conf": "general_v20_9B_pe"
+                 # "width": 64,
+                 # "height": 64
+             })
+             logger.info(f"{req_json}")
+             # Send the request
+             response = requests.post(
+                 t2i_url,
+                 headers=headers,
+                 data={
+                     'AlgoType': 1,
+                     'ReqJson': req_json,
+                 }
+             )
+             logger.info(f"header: {response.headers}")
+             if response.status_code != 200:
+                 return None, False
+             resp = response.json()
+             if resp.get('code', -1) != 0:
+                 logger.error(f"response error {resp}")
+                 return None, False
+
+             binary_data1 = resp.get('data', {}).get('BinaryData')
+             binary_data = binary_data1[0]
+             # logger.info(f"binary_data: {binary_data}")
+             image = Image.open(io.BytesIO(base64.b64decode(binary_data)))
+             # image.save('./t2i_image.png')
+             image = image.resize((self.cfg['resolution'], self.cfg['resolution']))
+             return image, True
+
+         except Exception as e:
+             logger.exception("An error occurred during image generation.")
+             return None, False
+
+ class SeedEditCaller():
+     def __init__(self, cfg, *args, **kwargs):
+         self.cfg = cfg
+
+     def edit(self, image, edit, cfg_scale=0.5, *args, **kwargs):
+         try:
+             image_bytes = io.BytesIO()
+             image.save(image_bytes, format='JPEG')  # or format='PNG'
+             logger.info("Edit images ...")
+             req_json = json.dumps({
+                 "prompt": str(edit),
+                 "model_version": "byteedit_v2.0",
+                 "scale": cfg_scale,
+             })
+             logger.info(f"{req_json}")
+             binary = base64.b64encode(image_bytes.getvalue()).decode('utf-8')
+             # Send the request
+             response = requests.post(
+                 t2i_url,
+                 headers=headers,
+                 data=json.dumps({
+                     'AlgoType': 2,
+                     'ReqJson': req_json,
+                     'BinaryData': [binary]
+                     # 'Base': base
+                 })
+             )
+
+             logger.info(f"header: {response.headers}")
+             if response.status_code != 200:
+                 return None, False
+             resp = response.json()
+             if resp.get('code', -1) != 0:
+                 logger.error(f"response error {resp}")
+                 return None, False
+
+             binary_data = resp.get('data', {}).get('BinaryData')
+             image = Image.open(io.BytesIO(base64.b64decode(binary_data[0])))
+             return image, True
+
+         except Exception as e:
+             logger.exception("An error occurred during image editing.")
+             return None, False
+
+
+ if __name__ == "__main__":
+     cfg_t2i = {
+         "resolution": 611
+     }
+     model_t2i = SeedT2ICaller(cfg_t2i)
+     gen_image, ok = model_t2i.generate("a beautiful girl")
+
+     # edit() expects a PIL Image, so pass the generated image directly
+     # instead of raw file bytes.
+     model_edit = SeedEditCaller(cfg_t2i)
+     if ok and gen_image is not None:
+         model_edit.edit(image=gen_image, edit="please edit to a good man")
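Both callers move images to and from the service as base64 strings inside the `BinaryData` field. A minimal, network-free sketch of that encode/decode round trip follows; the helper names are illustrative and not part of this commit:

```python
# Sketch of the base64 <-> PIL round trip that caller.py performs on BinaryData.
# Helper names are illustrative only.
import base64
import io

from PIL import Image


def pil_to_b64(image: Image.Image, fmt: str = "JPEG") -> str:
    # Matches SeedEditCaller.edit: serialize to bytes, then base64-encode to a UTF-8 string.
    buf = io.BytesIO()
    image.save(buf, format=fmt)
    return base64.b64encode(buf.getvalue()).decode("utf-8")


def b64_to_pil(payload: str) -> Image.Image:
    # Matches the response handling: base64-decode, then let PIL parse the bytes.
    return Image.open(io.BytesIO(base64.b64decode(payload)))


if __name__ == "__main__":
    img = Image.new("RGB", (64, 64), "red")
    assert b64_to_pil(pil_to_b64(img)).size == (64, 64)
```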
requirements.txt ADDED
@@ -0,0 +1,5 @@
+ gradio
+ numpy
+ loguru
+ Pillow
+ requests
uni_test/test.jpg ADDED