File size: 9,740 Bytes
b7cfcd0
641c88c
6118f2d
641c88c
 
 
 
 
3c811bc
a0fc1c5
1aaeb30
641c88c
39c8500
 
 
 
 
 
6d52164
a0fc1c5
 
3c811bc
1aaeb30
 
 
 
6d52164
641c88c
 
 
 
 
1fc0a5a
641c88c
 
 
 
 
 
 
6d52164
641c88c
 
 
 
 
 
 
 
 
6d52164
c8be5fc
 
 
 
320761b
6118f2d
320761b
 
4503ce7
 
 
f34a981
4503ce7
f34a981
4503ce7
f34a981
4503ce7
 
6118f2d
 
465251b
6118f2d
 
 
 
 
 
641c88c
6118f2d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
641c88c
6118f2d
 
 
 
 
 
 
 
 
 
641c88c
6118f2d
 
465251b
6118f2d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1aaeb30
 
 
 
 
 
 
6118f2d
 
 
 
af3605b
6118f2d
 
 
 
af3605b
6118f2d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
641c88c
6118f2d
 
 
 
 
 
641c88c
6118f2d
 
 
 
 
 
641c88c
1aaeb30
 
c8be5fc
 
1aaeb30
 
320761b
6118f2d
fae7447
08e8da7
fae7447
6118f2d
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
import gradio as gr
import io
import os
from PIL import Image
import base64
from scripts.process_utils import initialize, process_image_as_base64, image_to_base64
from scripts.anime import init_model
from scripts.generate_prompt import load_wd14_tagger_model
from datetime import datetime
from pytz import timezone
from scripts.survey import handle_form_submission, handle_visit_choice, handle_proceed, localize, script, generate_image, send_feedback

def initialize_models():
    # 初期化
    initialize(_use_local=False, use_gpu=True, use_dotenv=True)
    init_model(use_local=False)
    load_wd14_tagger_model()

def process_image(input_image, mode, weight1=None, weight2=None):
    tokyo_time = datetime.now(timezone('Asia/Tokyo')).strftime("%Y-%m-%d %H:%M:%S")  # 日本時間のタイムスタンプ
    print(f"[{tokyo_time}] Processing image with mode={mode}, weight1={weight1}, weight2={weight2}")

    # feedback用のファイル名
    tokyo_time = datetime.now(timezone('Asia/Tokyo')).strftime("%Y%m%d_%H%M%S")
    filename = f"{tokyo_time}_mode={mode}_weight1={weight1}_weight2={weight2}.png"

    # 既存の画像処理ロジック
    if mode == "original":
        sotai_image, sketch_image = process_image_as_base64(input_image, mode, None, None)
    elif mode == "refine":
        sotai_image, sketch_image = process_image_as_base64(input_image, mode, weight1, weight2)

    return sotai_image, sketch_image, None, filename

def mix_images(sotai_image_data, sketch_image_data, opacity1, opacity2):
    sotai_image = Image.open(io.BytesIO(base64.b64decode(sotai_image_data))).convert('RGBA')
    sketch_image = Image.open(io.BytesIO(base64.b64decode(sketch_image_data))).convert('RGBA')

    if sotai_image.size != sketch_image.size:
        sketch_image = sketch_image.resize(sotai_image.size, Image.Resampling.LANCZOS)

    mixed_image = Image.new('RGBA', sotai_image.size, (255, 255, 255, 255))

    sotai_alpha = sotai_image.getchannel('A').point(lambda x: int(x * opacity1))
    sketch_alpha = sketch_image.getchannel('A').point(lambda x: int(x * opacity2))

    mixed_image.paste(sketch_image, (0, 0), mask=sketch_alpha)
    mixed_image.paste(sotai_image, (0, 0), mask=sotai_alpha)

    return mixed_image

def send_mixed_feedback(sotai_image_data, sketch_image_data, filename):
    mixed_image = mix_images(sotai_image_data, sketch_image_data, 0.5, 0.5)
    return send_feedback(mixed_image, filename)

with gr.Blocks() as demo:
    form_visible_flag = gr.Textbox(value="false", elem_id="form_flag", visible=False)
    # title
    gr.HTML("<h1>Image2Body demo</h1>")
    # description with translations and additional notes
    gr.HTML("""
        <p>Upload an image and select processing options to generate body and sketch images.</p>
        <p>まだstandingタグのついた女性キャラクターの1000枚の画像しか学習していないため、他のポーズは上手くできないことをご了承ください。</p>
        <p>さらなる情報は<a href="https://x.com/Yeq6X" target="_blank">@Yeq6X</a>までお問い合わせください。</p>
        <p>Note: Currently, the model has been trained on only 1000 images of female characters with the 'standing' tag, so other poses may not be processed accurately.</p>
        <p>For more information, please contact <a href="https://x.com/Yeq6X" target="_blank">@Yeq6X</a>.</p>
        <p>注意:目前模型仅使用带有“standing”标签的1000张女性角色图像进行训练,因此其他姿势可能无法准确处理。</p>
        <p>如需更多信息,请联系<a href="https://x.com/Yeq6X" target="_blank">@Yeq6X</a>。</p>
    """)

    # 訪問回数の選択
    with gr.Column(visible=False) as visit_section:
        # 言語選択セクション
        with gr.Row():
            language_choice = gr.Radio(
                choices=["en", "ja", "zh"],
                label="Select Language / 言語を選択 / 选择语言",
                value="en"
            )

        localized = localize("en")
        welcome_message = gr.HTML(localized["welcome_message"])
        visit_choice = gr.Radio(choices=localized["visit_choices"], label="")

    # 初回訪問のアンケートセクション
    with gr.Column(visible=False) as survey_section:
        # フォームセクション
        form_section = gr.HTML(localize("en")["form_html"])

    # 2回目以降の進むボタンセクション
    with gr.Column(visible=False) as proceed_section:
        # gr.HTML("<h2>再訪ありがとうございます!</h2>")
        # proceed_button = gr.Button("進む")
        proceed_message = gr.HTML(localize("en")["returning_message"])
        proceed_button = gr.Button(localize("en")["proceed_button"], variant="primary")

    # 言語選択変更時の更新
    def update_language(language):
        localized = localize(language)
        return (
            gr.update(value=localized["welcome_message"]),
            gr.update(choices=localized["visit_choices"]),
            gr.update(value=localized["returning_message"]),
            gr.update(value=localized["proceed_button"]),
            gr.update(value=localized["form_html"])
        )

    language_choice.change(
        update_language,
        inputs=[language_choice],
        outputs=[welcome_message, visit_choice, proceed_message, proceed_button, form_section]
    )

    # フォーム送信時の画面切り替え
    def handle_submit():
        return gr.update(visible=False), gr.update(visible=True)

    submit_flag = gr.Textbox(visible=False, value="false")
    submit_flag.change(
        handle_submit,
        inputs=[],
        outputs=[form_section]
    )

    # メイン画面セクション
    with gr.Column(visible=True) as main_section:
        # interface
        submit = None
        with gr.Row():
            with gr.Column() as input_col:
                input_image = gr.Image(type="pil", label="Input Image", height=512)
                with gr.Tab("original"):
                    original_mode = gr.Text("original", label="Mode", visible=False)
                    original_submit = gr.Button("Submit", variant="primary")
                with gr.Tab("refine"):
                    refine_input = [
                        gr.Text("refine", label="Mode", visible=False),
                        gr.Slider(0, 2, value=0.6, step=0.05, label="Weight 1 (Sketch)"),
                        gr.Slider(0, 1, value=0.05, step=0.025, label="Weight 2 (Body)")
                    ]
                    refine_submit = gr.Button("Submit", variant="primary")
                gr.Examples(
                    examples=[f"images/sample{i}.png" for i in [1, 2, 4, 5, 6, 7, 10, 16, 18, 19]],
                    inputs=[input_image]
                )
            with gr.Column() as output_col:
                sotai_image_data = gr.Text(label="Sotai Image data", visible=False)
                sketch_image_data = gr.Text(label="Sketch Image data", visible=False)
                mixed_image = gr.Image(label="Output Image", elem_id="output_image")
                opacity_slider1 = gr.Slider(0, 1, value=0.5, step=0.05, label="Opacity (Sotai)")
                opacity_slider2 = gr.Slider(0, 1, value=0.5, step=0.05, label="Opacity (Sketch)")
                send_filename = gr.Textbox(label="Feedback", visible=False)
                gr.HTML("<h3>Send Feedback Image/画像を送信</h3>")
                gr.HTML("<p>Images are used only for developer review and will not be shared.</p>")
                gr.HTML("<p>画像は開発者が確認するためだけに使用され、公開されません。</p>")
                send_feedback_button = gr.Button("Contribute as Feedback to Developer/開発者へのフィードバックとして協力する")
                feed_back_result = gr.Textbox(label="Feedback Result")


        original_submit.click(
            process_image,
            inputs=[input_image, original_mode],
            outputs=[sotai_image_data, sketch_image_data, mixed_image, send_filename]
        )
        refine_submit.click(
            process_image,
            inputs=[input_image, refine_input[0], refine_input[1], refine_input[2]],
            outputs=[sotai_image_data, sketch_image_data, mixed_image, send_filename]
        )
        sotai_image_data.change(
            mix_images,
            inputs=[sotai_image_data, sketch_image_data, opacity_slider1, opacity_slider2],
            outputs=mixed_image
        )
        opacity_slider1.change(
            mix_images,
            inputs=[sotai_image_data, sketch_image_data, opacity_slider1, opacity_slider2],
            outputs=mixed_image
        )
        opacity_slider2.change(
            mix_images,
            inputs=[sotai_image_data, sketch_image_data, opacity_slider1, opacity_slider2],
            outputs=mixed_image
        )

    # フラグ変更時に画面切り替え
    form_visible_flag.change(
        handle_form_submission,
        inputs=[form_visible_flag],
        outputs=[survey_section, main_section]
    )

    # 選択肢に応じてセクションを切り替え
    visit_choice.change(
        handle_visit_choice,
        inputs=[visit_choice, language_choice],
        outputs=[visit_section, survey_section, proceed_section]
    )

    # 進むボタン押下時の画面遷移
    proceed_button.click(
        handle_proceed,
        inputs=[],
        outputs=[proceed_section, main_section]
    )
    
    send_feedback_button.click(
        send_mixed_feedback,
        inputs=[sotai_image_data, sketch_image_data, send_filename],
        outputs=[feed_back_result],
    )

    # JavaScriptの読み込み
    demo.load(js=script)

initialize_models()
demo.launch()