# encoding=utf8 import os import cv2 import gradio as gr import numpy as np import re import json from huggingface_hub import login from functions import * from gradio.components import Component login(token=os.getenv('LOGIN_TOKEN')) css = './css/style.css' # Initial a Gradio Block with specific theme block = gr.Blocks( theme=gr.themes.Base(), css=css ).queue() # Load javascript plugin with open('javascript/bboxHint.js', 'r', encoding="utf-8") as file: value = file.read() escaped_value = json.dumps(value) with block: block.load( fn=None, _js=f"""() => {{ const script = document.createElement("script"); const text = document.createTextNode({escaped_value}); script.appendChild(text); document.head.appendChild(script); }}""" ) gr.HTML( '

JoyType

A Robust Design for Multilingual Visual Text Creation

' ) with gr.Row(): with gr.Column(scale=3): with gr.Accordion('Basic Settings(基础设置)', open=True): with gr.Row(variant='compact'): usr_prompt = gr.Textbox(label='Prompt(提示词)', elem_id='usr_prompt') with gr.Row(variant='compact'): base_model = gr.Dropdown( value='JoyType.v1.0', choices=model_list, label='Base Model(基模型)', elem_id='base_model', allow_custom_value=False ) with gr.Accordion('Advanced Settings(高级设置)', open=False): with gr.Row(variant='compact'): image_width = gr.Slider(label='Image Width(宽度)', minimum=256, maximum=768, value=512, step=32) image_height = gr.Slider(label='Image Height(高度)', minimum=256, maximum=768, value=512, step=32) with gr.Row(variant='compact'): num_samples = gr.Slider(label='Samples(生成数量)', minimum=1, maximum=4, value=2, step=1) inference_steps = gr.Slider(label='Steps(推理步数)', minimum=10, maximum=50, value=20, step=1) with gr.Row(variant='compact'): conditioning_scale = gr.Slider(label='Text Strength(文字强度)', minimum=0.1, maximum=2., value=1., step=0.1) cfg_scale = gr.Slider(label='CFG Scale(CFG制强度)', minimum=1, maximum=20, value=7.5, step=0.5) with gr.Row(variant='compact'): seed = gr.Slider(label='Seed(随机种子)', minimum=-1, maximum=2147483647, value=-1, step=1) scheduler_name = gr.Dropdown( value='PNDM', choices=[ 'PNDM', 'LMS', 'Euler', 'DPM', 'DDIM', 'Heun', 'Euler-Ancestral' ], label='Scheduler(采样器)', allow_custom_value=False ) with gr.Row(variant='compact'): a_prompt = gr.Textbox( label='Added Prompt(附加提示词)', max_lines=2, value='best quality, extremely detailed, supper legible text, ' 'clear text edges, clear strokes, neat writing, no watermarks' ) with gr.Row(variant='compact'): n_prompt = gr.Textbox( label='Negative Prompt(负向提示词)', max_lines=2, value='low-res, bad anatomy, extra digit, fewer digits, cropped, worst quality, ' 'low quality, watermark, unreadable text, messy words, distorted text, ' 'disorganized writing, advertising picture' ) base_model.change( fn=change_settings, inputs=base_model, outputs=[inference_steps, cfg_scale, scheduler_name] ) with gr.Row(): with gr.Tab('Text Editing(文字编辑)', elem_id='MD-tab-t2i'): with gr.Row(variant='compact'): choice = gr.Slider( label=f'Text Boxes(可编辑文字框)', minimum=0, maximum=8, step=1, value=BBOX_INI_NUM ) with gr.Row(): with gr.Column(scale=2): rect_img = gr.Image( value=create_canvas(), label='Rect Position', elem_id='MD-bbox-rect-t2i', show_label=False, visible=True, height=300 ) with gr.Column(scale=3): rect_cb_list: list[Component] = [] rect_box_list: list[Component] = [] rect_font_name_list: list[Component] = [] rect_usr_text_list: list[Component] = [] with gr.Column(): with gr.Row(elem_id='row_show'): with gr.Column(scale=1, min_width=20): gr.Markdown('

Font(字体)

', elem_id='markdown_1') with gr.Column(scale=2, min_width=20): gr.Markdown('

Text(文字内容)

', elem_id='markdown_2') row_layout = [gr.Row() for _ in range(BBOX_MAX_NUM)] for i in range(BBOX_MAX_NUM): visible = True if i < BBOX_INI_NUM else False with row_layout[i]: fn = gr.Dropdown( choices=font_list, label='Font(字体)', value='CHN-华文行楷', visible=visible, show_label=False, scale=1, allow_custom_value=False, min_width=90, elem_id=f'font_input_{i}', container=False ) ut = gr.Textbox( label='Text(文字内容)', visible=visible, scale=2, show_label=False, elem_id=f'text_input_{i}', container=False, max_lines=1 ) e = gr.Checkbox(label=f'{i}', value=visible, visible=False, min_width=10) x = gr.Slider(label='x', value=0.4, minimum=0.0, maximum=1.0, step=0.0001, elem_id=f'MD-t2i-{i}-x', visible=False) y = gr.Slider(label='y', value=0.4, minimum=0.0, maximum=1.0, step=0.0001, elem_id=f'MD-t2i-{i}-y', visible=False) w = gr.Slider(label='w', value=0.2, minimum=0.0, maximum=1.0, step=0.0001, elem_id=f'MD-t2i-{i}-w', visible=False) h = gr.Slider(label='h', value=0.2, minimum=0.0, maximum=1.0, step=0.0001, elem_id=f'MD-t2i-{i}-h', visible=False) x.change(fn=None, inputs=x, outputs=x, _js=f'v => onBoxChange({i}, "x", v)', show_progress=False, queue=False) y.change(fn=None, inputs=y, outputs=y, _js=f'v => onBoxChange({i}, "y", v)', show_progress=False, queue=False) w.change(fn=None, inputs=w, outputs=w, _js=f'v => onBoxChange({i}, "w", v)', show_progress=False, queue=False) h.change(fn=None, inputs=h, outputs=h, _js=f'v => onBoxChange({i}, "h", v)', show_progress=False, queue=False) e.change(fn=None, inputs=e, outputs=e, _js=f'e => onBoxEnableClick({i}, e)', queue=False) rect_cb_list.extend([e]) rect_box_list.extend([x, y, w, h]) rect_font_name_list.extend([fn]) rect_usr_text_list.extend([ut]) choice.change( fn=update_box_num, inputs=[choice], outputs=[ *rect_cb_list, *rect_font_name_list, *rect_usr_text_list, *rect_box_list ] ) with gr.Row(): gr.Markdown('') run_edit = gr.Button(value='Run(运行)', elem_classes='run', elem_id='run_edit') gr.Markdown('') with gr.Row(): with gr.Accordion(label='Examples(示例)', open=True): img_container = gr.Image(visible=False, label='Text Layout(文字布局)') example_id = gr.Textbox(value=-1, visible=False, label='ID(编号)') gen_examples = gr.Examples( [ [1, 'templates/1.png', 'landscape, Chinese style, ink peaks, poster', model_list[0], 1648703813, 3, 1], [2, 'templates/2.png', 'a clock and medicine bottle has texts and "time"', model_list[0], 1654615998, 2, 1], [3, 'templates/3.png', '漂亮的风景照，很多山峰，清澈的湖水', model_list[3], 2078698098, 3, 1], [4, 'templates/4.png', 'a vodka, on the bar, dim background', model_list[2], 443791646, 3, 1], [5, 'templates/5.png', '画有玫瑰的卡片，明亮的背景', model_list[4], 516210890, 2, 1], [6, 'templates/6.png', 'posters on the table, with pens, clear background, starry sky, moon', model_list[1], 228167646, 4, 1], [7, 'templates/7.png', 'snowy landscape, domed cabin, winter scene, cozy atmosphere, soft lighting', model_list[5], 695897181, 3, 1], [8, 'templates/8.png', '一张关于健康教育的卡片，上面有一些文字，有一些食物图标，背景里有一些水果喝饮料的图标，且背景是模糊的', model_list[1], 936188591, 6, 1], ], [example_id, img_container, usr_prompt, base_model, seed, choice, num_samples], examples_per_page=5, label='' ) example_id.change( fn=load_box_list, inputs=[example_id, choice], outputs=[ *rect_cb_list, *rect_font_name_list, *rect_usr_text_list, *rect_box_list, example_id ] ) rect_img.clear(re_edit, None, [*rect_box_list, rect_img, image_width, image_height]) image_width.release(resize_w, [image_width, rect_img], rect_img) image_height.release(resize_h, [image_height, rect_img], rect_img) with gr.Column(scale=2): with gr.Row(): result_gallery = gr.Gallery( label='Result(结果)', show_label=True, preview=True, columns=8, allow_preview=True, elem_id='gallery' ) with gr.Row(): with gr.Tab("Introduction"): gr.Markdown('What we can do') gr.Markdown( 'Generating images with accurately represented text in multi-language.') gr.Markdown('How to use') gr.Markdown( 'Enter a description of the image you want to generate in the "Prompt" text box.') gr.Markdown('Text Editing') gr.Markdown( 'You can drag the "Text Boxes" slider to set the number of text to be laid out, ' 'and set the corresponding font and text content respectively, Note that there must be no overlap between the text boxes, ' 'or the model will not generate an image.') gr.Markdown( 'Finally, click the Run button to generate a picture!') with gr.Tab("说明"): gr.Markdown('我们能做什么') gr.Markdown('在多种语言上生成具有准确文本的图像') gr.Markdown('如何使用') gr.Markdown( '在“提示词”文本框中输入你想要生成的图片所对应的文字描述。') gr.Markdown('文本编辑') gr.Markdown( '你可以拖动“可编辑文字框”滑块来设置需要布局的文字数量，并分别设置对应的字体和文字内容；' '请注意，文本框之间不能有重叠，否则模型将不会生成图片。') gr.Markdown('最后点击运行按钮，即可生成图片！') with gr.Row(): result_info = gr.Markdown('debug', visible=False) args = [ num_samples, a_prompt, n_prompt, conditioning_scale, cfg_scale, inference_steps, seed, usr_prompt, rect_img, base_model, scheduler_name, gr.State(BBOX_MAX_NUM), *(rect_cb_list + rect_box_list + rect_font_name_list + rect_usr_text_list) ] run_edit.click( fn=process, inputs=args, outputs=[result_gallery, result_info] ) if __name__ == "__main__": block.launch( server_name='0.0.0.0', share=True, )