# Hugging Face Space: jdh-algo/JoyType (status: Runtime error; file size: 15,591 Bytes; revision 3c3804b)
# encoding=utf8


import os
import cv2
import gradio as gr
import numpy as np
import re
import json

from huggingface_hub import login
from functions import *
from gradio.components import Component

# Log in to the Hugging Face Hub with the token read from the LOGIN_TOKEN
# environment variable (None is passed through when the variable is unset).
login(token=os.environ.get('LOGIN_TOKEN'))

# Stylesheet path handed to the Blocks constructor below.
css = './css/style.css'

# Create the top-level Gradio Blocks app with the Base theme and the custom
# stylesheet, then enable queuing on it.
block = gr.Blocks(theme=gr.themes.Base(), css=css)
block = block.queue()

# Read the bboxHint.js plugin source and JSON-encode it, so the text can be
# embedded as a quoted JavaScript string literal later on.
js_plugin_path = 'javascript/bboxHint.js'
with open(js_plugin_path, encoding='utf-8') as file:
    value = file.read()
escaped_value = json.dumps(value)

with block:
    # Page-load hook with no Python callback: the JavaScript snippet wraps the
    # JSON-encoded plugin source in a <script> element and appends it to <head>.
    inject_plugin_js = f"""() => {{
                const script = document.createElement("script");
                const text =  document.createTextNode({escaped_value});
                script.appendChild(text);
                document.head.appendChild(script);
            }}"""
    block.load(fn=None, _js=inject_plugin_js)
    # Centered title banner. The literal pieces (including the leading spaces
    # of each fragment) concatenate to exactly the markup rendered before.
    banner_html = (
        '<div style="text-align: center; margin: 20px auto;"> '
        '        <h1 style="font-size:5em">JoyType</h1> '
        '        <h1 style="font-size:2.5em">A Robust Design for Multilingual Visual Text Creation</h1> '
        '        </div>'
    )
    gr.HTML(banner_html)
    with gr.Row():
        with gr.Column(scale=3):
            # Basic settings panel (expanded on load): the user prompt and the
            # base-model selector.
            with gr.Accordion('Basic Settings(基础设置)', open=True):
                with gr.Row(variant='compact'):
                    usr_prompt = gr.Textbox(
                        elem_id='usr_prompt',
                        label='Prompt(提示词)',
                    )
                with gr.Row(variant='compact'):
                    # Choices come from model_list; free-form values are rejected.
                    base_model = gr.Dropdown(
                        label='Base Model(基模型)',
                        elem_id='base_model',
                        choices=model_list,
                        value='JoyType.v1.0',
                        allow_custom_value=False,
                    )

            # Advanced settings panel (collapsed on load): image size, sampling
            # parameters, scheduler and the added/negative prompts.
            with gr.Accordion('Advanced Settings(高级设置)', open=False):
                # Image size sliders: 256..768 in steps of 32, default 512.
                with gr.Row(variant='compact'):
                    image_width = gr.Slider(
                        label='Image Width(宽度)',
                        minimum=256, maximum=768, step=32, value=512,
                    )
                    image_height = gr.Slider(
                        label='Image Height(高度)',
                        minimum=256, maximum=768, step=32, value=512,
                    )
                # Number of samples and number of inference steps.
                with gr.Row(variant='compact'):
                    num_samples = gr.Slider(
                        label='Samples(生成数量)',
                        minimum=1, maximum=4, step=1, value=2,
                    )
                    inference_steps = gr.Slider(
                        label='Steps(推理步数)',
                        minimum=10, maximum=50, step=1, value=20,
                    )
                # Text conditioning strength and CFG scale.
                with gr.Row(variant='compact'):
                    conditioning_scale = gr.Slider(
                        label='Text Strength(文字强度)',
                        minimum=0.1, maximum=2.0, step=0.1, value=1.0,
                    )
                    cfg_scale = gr.Slider(
                        label='CFG Scale(CFG制强度)',
                        minimum=1, maximum=20, step=0.5, value=7.5,
                    )
                # Seed (default -1) and scheduler selector.
                with gr.Row(variant='compact'):
                    seed = gr.Slider(
                        label='Seed(随机种子)',
                        minimum=-1, maximum=2147483647, step=1, value=-1,
                    )
                    scheduler_choices = [
                        'PNDM', 'LMS', 'Euler', 'DPM', 'DDIM', 'Heun', 'Euler-Ancestral'
                    ]
                    scheduler_name = gr.Dropdown(
                        label='Scheduler(采样器)',
                        choices=scheduler_choices,
                        value='PNDM',
                        allow_custom_value=False,
                    )
                # Default text for the added prompt.
                with gr.Row(variant='compact'):
                    default_added_prompt = (
                        'best quality, extremely detailed, supper legible text, '
                        'clear text edges, clear strokes, neat writing, no watermarks'
                    )
                    a_prompt = gr.Textbox(
                        label='Added Prompt(附加提示词)',
                        value=default_added_prompt,
                        max_lines=2,
                    )
                # Default text for the negative prompt.
                with gr.Row(variant='compact'):
                    default_negative_prompt = (
                        'low-res, bad anatomy, extra digit, fewer digits, cropped, worst quality, '
                        'low quality, watermark, unreadable text, messy words, distorted text, '
                        'disorganized writing, advertising picture'
                    )
                    n_prompt = gr.Textbox(
                        label='Negative Prompt(负向提示词)',
                        value=default_negative_prompt,
                        max_lines=2,
                    )

                # Selecting another base model calls change_settings, whose
                # outputs update the steps, CFG scale and scheduler widgets.
                base_model.change(
                    fn=change_settings,
                    inputs=base_model,
                    outputs=[inference_steps, cfg_scale, scheduler_name],
                )

            with gr.Row():
                with gr.Tab('Text Editing(文字编辑)', elem_id='MD-tab-t2i'):
                    # Slider selecting how many text boxes are editable (0..8). Its change
                    # handler is registered further down, once the per-box components exist.
                    with gr.Row(variant='compact'):
                        choice = gr.Slider(
                            label='Text Boxes(可编辑文字框)',
                            minimum=0, maximum=8, step=1, value=BBOX_INI_NUM
                        )

                    with gr.Row():
                        with gr.Column(scale=2):
                            # Canvas image, initialised with the result of create_canvas().
                            rect_img = gr.Image(
                                value=create_canvas(), label='Rect Position',
                                elem_id='MD-bbox-rect-t2i', show_label=False, visible=True,
                                height=300
                            )
                        with gr.Column(scale=3):
                            # Per-box components, collected so they can be used as inputs and
                            # outputs of the event handlers registered on this page.
                            rect_cb_list: list[Component] = []         # hidden "enabled" checkboxes
                            rect_box_list: list[Component] = []        # hidden x, y, w, h sliders (4 per box)
                            rect_font_name_list: list[Component] = []  # font dropdowns
                            rect_usr_text_list: list[Component] = []   # text inputs

                            # (label, initial value) of the four hidden geometry sliders of a box.
                            box_axes = (('x', 0.4), ('y', 0.4), ('w', 0.2), ('h', 0.2))

                            with gr.Column():
                                # Header row labelling the font and text columns.
                                with gr.Row(elem_id='row_show'):
                                    with gr.Column(scale=1, min_width=20):
                                        gr.Markdown('<p align="center">Font(字体)</p>', elem_id='markdown_1')
                                    with gr.Column(scale=2, min_width=20):
                                        gr.Markdown('<p align="center">Text(文字内容)</p>', elem_id='markdown_2')

                                # All row containers are created up front, so they precede the
                                # hidden per-box components created inside the loop.
                                row_layout = [gr.Row() for _ in range(BBOX_MAX_NUM)]
                                for i, row in enumerate(row_layout):
                                    # Only the first BBOX_INI_NUM boxes start out visible and enabled.
                                    visible = i < BBOX_INI_NUM
                                    with row:
                                        fn = gr.Dropdown(
                                            choices=font_list,
                                            label='Font(字体)', value='CHN-华文行楷', visible=visible,
                                            show_label=False, scale=1, allow_custom_value=False,
                                            min_width=90, elem_id=f'font_input_{i}', container=False
                                        )
                                        ut = gr.Textbox(
                                            label='Text(文字内容)', visible=visible, scale=2,
                                            show_label=False, elem_id=f'text_input_{i}', container=False, max_lines=1
                                        )
                                    # Hidden checkbox holding the enabled state of box i.
                                    e = gr.Checkbox(label=str(i), value=visible, visible=False, min_width=10)

                                    # Hidden sliders with values in [0, 1], created in x, y, w, h order.
                                    box_sliders = [
                                        gr.Slider(
                                            label=axis, value=initial, minimum=0.0, maximum=1.0, step=0.0001,
                                            elem_id=f'MD-t2i-{i}-{axis}', visible=False
                                        )
                                        for axis, initial in box_axes
                                    ]
                                    # Client-side-only handlers (fn=None): each change calls the
                                    # JavaScript functions onBoxChange / onBoxEnableClick, which are
                                    # presumably provided by javascript/bboxHint.js — TODO confirm.
                                    for (axis, _initial), slider in zip(box_axes, box_sliders):
                                        slider.change(
                                            fn=None, inputs=slider, outputs=slider,
                                            _js=f'v => onBoxChange({i}, "{axis}", v)',
                                            show_progress=False, queue=False
                                        )
                                    e.change(
                                        fn=None, inputs=e, outputs=e,
                                        _js=f'e => onBoxEnableClick({i}, e)',
                                        queue=False
                                    )

                                    rect_cb_list.append(e)
                                    rect_box_list.extend(box_sliders)
                                    rect_font_name_list.append(fn)
                                    rect_usr_text_list.append(ut)

                            # Changing the number of boxes calls update_box_num, whose outputs
                            # target every per-box component (checkboxes, fonts, texts, sliders).
                            choice.change(
                                fn=update_box_num,
                                inputs=[choice],
                                outputs=[
                                    *rect_cb_list, *rect_font_name_list, *rect_usr_text_list, *rect_box_list
                                ]
                            )
                    # Run button, flanked by two empty Markdown components
                    # (presumably used as spacers — TODO confirm against the CSS).
                    with gr.Row():
                        gr.Markdown('')
                        run_edit = gr.Button(value='Run(运行)', elem_id='run_edit', elem_classes='run')
                        gr.Markdown('')
                    with gr.Row():
                        with gr.Accordion(label='Examples(示例)', open=True):
                            # Hidden components that receive the example's layout image and id.
                            img_container = gr.Image(label='Text Layout(文字布局)', visible=False)
                            example_id = gr.Textbox(label='ID(编号)', value=-1, visible=False)

                            # (prompt, index into model_list, seed, number of text boxes) per example.
                            # Example k (1-based) uses the layout image templates/k.png and 1 sample.
                            example_specs = [
                                ('landscape, Chinese style, ink peaks, poster', 0, 1648703813, 3),
                                ('a clock and medicine bottle has texts and "time"', 0, 1654615998, 2),
                                ('漂亮的风景照，很多山峰，清澈的湖水', 3, 2078698098, 3),
                                ('a vodka, on the bar, dim background', 2, 443791646, 3),
                                ('画有玫瑰的卡片，明亮的背景', 4, 516210890, 2),
                                ('posters on the table, with pens, clear background, starry sky, moon', 1, 228167646, 4),
                                ('snowy landscape, domed cabin, winter scene, cozy atmosphere, soft lighting', 5, 695897181, 3),
                                ('一张关于健康教育的卡片，上面有一些文字，有一些食物图标，背景里有一些水果喝饮料的图标，且背景是模糊的', 1, 936188591, 6),
                            ]
                            example_rows = [
                                [ex_id, f'templates/{ex_id}.png', ex_prompt, model_list[model_idx], ex_seed, box_count, 1]
                                for ex_id, (ex_prompt, model_idx, ex_seed, box_count)
                                in enumerate(example_specs, start=1)
                            ]
                            gen_examples = gr.Examples(
                                examples=example_rows,
                                inputs=[example_id, img_container, usr_prompt, base_model, seed, choice, num_samples],
                                examples_per_page=5,
                                label='',
                            )

                        # A change of the hidden example id calls load_box_list, whose outputs
                        # target every per-box component and example_id itself.
                        example_outputs = [
                            *rect_cb_list, *rect_font_name_list, *rect_usr_text_list, *rect_box_list, example_id
                        ]
                        example_id.change(
                            fn=load_box_list,
                            inputs=[example_id, choice],
                            outputs=example_outputs,
                        )

                    # Clearing the canvas calls re_edit; releasing a size slider calls
                    # resize_w / resize_h with the new size and the current canvas.
                    rect_img.clear(
                        fn=re_edit,
                        inputs=None,
                        outputs=[*rect_box_list, rect_img, image_width, image_height],
                    )
                    image_width.release(fn=resize_w, inputs=[image_width, rect_img], outputs=rect_img)
                    image_height.release(fn=resize_h, inputs=[image_height, rect_img], outputs=rect_img)
                    
        # Second column: result gallery, usage notes in English and Chinese,
        # and a hidden Markdown component that receives process()'s second output.
        with gr.Column(scale=2):
            with gr.Row():
                result_gallery = gr.Gallery(
                    label='Result(结果)',
                    show_label=True,
                    elem_id='gallery',
                    columns=8,
                    preview=True,
                    allow_preview=True,
                )
            with gr.Row():
                # Each tab renders its snippets as separate Markdown components, in order.
                intro_en = (
                    '<span style="color:#3B5998;font-size:20px">What we can do</span>',
                    '<span style="color:black;font-size:15px">Generating images with accurately represented text in multi-language.</span>',
                    '<span style="color:#3B5998;font-size:20px">How to use</span>',
                    '<span style="color:black;font-size:15px">Enter a description of the image you want to generate in the "Prompt" text box.</span>',
                    '<span style="color:#3B5998;font-size:18px">Text Editing</span>',
                    '<span style="color:black;font-size:15px">You can drag the "Text Boxes" slider to set the number of text to be laid out, '
                    'and set the corresponding font and text content respectively, Note that there must be no overlap between the text boxes, '
                    'or the model will not generate an image.</span>',
                    '<span style="color:black;font-size:15px">Finally, click the Run button to generate a picture!</span>',
                )
                intro_zh = (
                    '<span style="color:#3B5998;font-size:20px">我们能做什么</span>',
                    '<span style="color:black;font-size:15px">在多种语言上生成具有准确文本的图像</span>',
                    '<span style="color:#3B5998;font-size:20px">如何使用</span>',
                    '<span style="color:black;font-size:15px">在“提示词”文本框中输入你想要生成的图片所对应的文字描述。</span>',
                    '<span style="color:#3B5998;font-size:18px">文本编辑</span>',
                    '<span style="color:black;font-size:15px">你可以拖动“可编辑文字框”滑块来设置需要布局的文字数量，并分别设置对应的字体和文字内容；'
                    '请注意，文本框之间不能有重叠，否则模型将不会生成图片。</span>',
                    '<span style="color:black;font-size:15px">最后点击运行按钮，即可生成图片！</span>',
                )
                with gr.Tab("Introduction"):
                    for snippet in intro_en:
                        gr.Markdown(snippet)
                with gr.Tab("说明"):
                    for snippet in intro_zh:
                        gr.Markdown(snippet)
            with gr.Row():
                result_info = gr.Markdown('debug', visible=False)

    # Inputs passed to process(), in order: the scalar settings, the canvas,
    # model and scheduler, a State holding BBOX_MAX_NUM, then all per-box
    # components grouped as checkboxes, geometry sliders, fonts and texts.
    scalar_inputs = [
        num_samples, a_prompt, n_prompt,
        conditioning_scale, cfg_scale, inference_steps, seed, usr_prompt,
        rect_img, base_model, scheduler_name,
    ]
    args = [
        *scalar_inputs,
        gr.State(BBOX_MAX_NUM),
        *rect_cb_list,
        *rect_box_list,
        *rect_font_name_list,
        *rect_usr_text_list,
    ]
    # Clicking Run calls process(); its outputs fill the gallery and the
    # hidden info Markdown component.
    run_edit.click(fn=process, inputs=args, outputs=[result_gallery, result_info])


if __name__ == "__main__":
    # Start the server bound to 0.0.0.0 and request a share link.
    launch_options = {'server_name': '0.0.0.0', 'share': True}
    block.launch(**launch_options)