Update app.py
app.py
CHANGED
@@ -1,7 +1,306 @@
# The original code was brought over from Illusion Diffusion for reference.

import spaces
import torch
import gradio as gr
from gradio import processing_utils, utils
from PIL import Image
import random

from diffusers import (
    DiffusionPipeline,
    AutoencoderKL,
    StableDiffusionControlNetPipeline,
    ControlNetModel,
    StableDiffusionLatentUpscalePipeline,
    StableDiffusionImg2ImgPipeline,
    StableDiffusionControlNetImg2ImgPipeline,
    DPMSolverMultistepScheduler,
    EulerDiscreteScheduler
)
import tempfile
import time
from share_btn import community_icon_html, loading_icon_html, share_js
import user_history
from illusion_style import css
import os
# from transformers import CLIPImageProcessor
from diffusers.pipelines.stable_diffusion.safety_checker import StableDiffusionSafetyChecker

BASE_MODEL = ""
# BASE_MODEL = "SG161222/Realistic_Vision_V5.1_noVAE"

# Initialize both pipelines
vae = AutoencoderKL.from_pretrained("stabilityai/sd-vae-ft-mse", torch_dtype=torch.float16)
controlnet = ControlNetModel.from_pretrained("monster-labs/control_v1p_sd15_qrcode_monster", torch_dtype=torch.float16)

# Initialize the safety checker conditionally
# Safety-related.
SAFETY_CHECKER_ENABLED = os.environ.get("SAFETY_CHECKER", "0") == "1"
safety_checker = None
# feature_extractor = None
if SAFETY_CHECKER_ENABLED:
    safety_checker = StableDiffusionSafetyChecker.from_pretrained("CompVis/stable-diffusion-safety-checker").to("cuda")
    # feature_extractor = CLIPImageProcessor.from_pretrained("openai/clip-vit-base-patch32")

main_pipe = StableDiffusionControlNetPipeline.from_pretrained(
    BASE_MODEL,
    controlnet=controlnet,
    vae=vae,
    safety_checker=safety_checker,
    # feature_extractor=feature_extractor,
    torch_dtype=torch.float16,
).to("cuda")

# Function to check NSFW images
#def check_nsfw_images(images: list[Image.Image]) -> tuple[list[Image.Image], list[bool]]:
#    if SAFETY_CHECKER_ENABLED:
#        safety_checker_input = feature_extractor(images, return_tensors="pt").to("cuda")
#        has_nsfw_concepts = safety_checker(
#            images=[images],
#            clip_input=safety_checker_input.pixel_values.to("cuda")
#        )
#        return images, has_nsfw_concepts
#    else:
#        return images, [False] * len(images)

#main_pipe.unet = torch.compile(main_pipe.unet, mode="reduce-overhead", fullgraph=True)
#main_pipe.unet.to(memory_format=torch.channels_last)
#main_pipe.unet = torch.compile(main_pipe.unet, mode="reduce-overhead", fullgraph=True)
#model_id = "stabilityai/sd-x2-latent-upscaler"
image_pipe = StableDiffusionControlNetImg2ImgPipeline(**main_pipe.components)

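# Note: building the img2img pipeline from main_pipe.components reuses the already loaded
# UNet, VAE, text encoder and ControlNet, so the second pipeline does not allocate another
# copy of the weights on the GPU.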
#image_pipe.unet = torch.compile(image_pipe.unet, mode="reduce-overhead", fullgraph=True)
#upscaler = StableDiffusionLatentUpscalePipeline.from_pretrained(model_id, torch_dtype=torch.float16)
#upscaler.to("cuda")

# Sampler map
SAMPLER_MAP = {
    "DPM++ Karras SDE": lambda config: DPMSolverMultistepScheduler.from_config(config, use_karras_sigmas=True, algorithm_type="sde-dpmsolver++"),
    "Euler": lambda config: EulerDiscreteScheduler.from_config(config),
}

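# The Gradio dropdown below passes one of these keys to inference(), which rebuilds
# main_pipe's scheduler from its current config via the matching lambda.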
# Crop the image to a centered square whose side is the shorter edge, resize it, and return the result.
def center_crop_resize(img, output_size=(512, 512)):
    width, height = img.size

    # Calculate dimensions to crop to the center
    new_dimension = min(width, height)
    left = (width - new_dimension)/2
    top = (height - new_dimension)/2
    right = (width + new_dimension)/2
    bottom = (height + new_dimension)/2

    # Crop and resize
    img = img.crop((left, top, right, bottom))
    img = img.resize(output_size)

    return img

# Fills the empty space with interpolated pixels when enlarging, so the upscaled result looks natural.
def common_upscale(samples, width, height, upscale_method, crop=False):
    if crop == "center":
        old_width = samples.shape[3]
        old_height = samples.shape[2]
        old_aspect = old_width / old_height
        new_aspect = width / height
        x = 0
        y = 0
        if old_aspect > new_aspect:
            x = round((old_width - old_width * (new_aspect / old_aspect)) / 2)
        elif old_aspect < new_aspect:
            y = round((old_height - old_height * (old_aspect / new_aspect)) / 2)
        s = samples[:,:,y:old_height-y,x:old_width-x]
    else:
        s = samples

    return torch.nn.functional.interpolate(s, size=(height, width), mode=upscale_method)

# Upscaling, same as above (applied to the latents from the first pass).
def upscale(samples, upscale_method, scale_by):
    #s = samples.copy()
    width = round(samples["images"].shape[3] * scale_by)
    height = round(samples["images"].shape[2] * scale_by)
    s = common_upscale(samples["images"], width, height, upscale_method, "disabled")
    return s

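# For reference: with the 512x512 first pass below, the Stable Diffusion VAE produces
# 64x64 latents (a factor-of-8 downsample), so scale_by=2 interpolates them to 128x128
# before the img2img refinement pass decodes them at roughly 1024x1024.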
# Check whether the user left the prompt or the input image empty.
def check_inputs(prompt: str, control_image: Image.Image):
    if control_image is None:
        raise gr.Error("Please select or upload an Input Illusion")
    if prompt is None or prompt == "":
        raise gr.Error("Prompt is required")

# Base64 -> PIL
def convert_to_pil(base64_image):
    pil_image = Image.open(base64_image)
    return pil_image


# PIL -> Base64
def convert_to_base64(pil_image):
    with tempfile.NamedTemporaryFile(suffix='.png', delete=False) as temp_file:
        pil_image.save(temp_file.name)
        return temp_file.name

# Inference function
@spaces.GPU
def inference(
    control_image: Image.Image,
    prompt: str,
    negative_prompt: str,
    guidance_scale: float = 8.0,
    controlnet_conditioning_scale: float = 1,
    control_guidance_start: float = 1,
    control_guidance_end: float = 1,
    upscaler_strength: float = 0.5,
    seed: int = -1,
    sampler = "DPM++ Karras SDE",
    progress = gr.Progress(track_tqdm=True),
    profile: gr.OAuthProfile | None = None,
):
    start_time = time.time()
    start_time_struct = time.localtime(start_time)
    start_time_formatted = time.strftime("%H:%M:%S", start_time_struct)
    print(f"Inference started at {start_time_formatted}")

    # Generate the initial image
    #init_image = init_pipe(prompt).images[0]

    # Rest of your existing code
    control_image_small = center_crop_resize(control_image)
    control_image_large = center_crop_resize(control_image, (1024, 1024))

    main_pipe.scheduler = SAMPLER_MAP[sampler](main_pipe.scheduler.config)
    my_seed = random.randint(0, 2**32 - 1) if seed == -1 else seed
    generator = torch.Generator(device="cuda").manual_seed(my_seed)

    out = main_pipe(
        prompt=prompt,
        negative_prompt=negative_prompt,
        image=control_image_small,
        guidance_scale=float(guidance_scale),
        controlnet_conditioning_scale=float(controlnet_conditioning_scale),
        generator=generator,
        control_guidance_start=float(control_guidance_start),
        control_guidance_end=float(control_guidance_end),
        num_inference_steps=15,
        output_type="latent"
    )
    upscaled_latents = upscale(out, "nearest-exact", 2)
    out_image = image_pipe(
        prompt=prompt,
        negative_prompt=negative_prompt,
        control_image=control_image_large,
        image=upscaled_latents,
        guidance_scale=float(guidance_scale),
        generator=generator,
        num_inference_steps=20,
        strength=upscaler_strength,
        control_guidance_start=float(control_guidance_start),
        control_guidance_end=float(control_guidance_end),
        controlnet_conditioning_scale=float(controlnet_conditioning_scale)
    )
    end_time = time.time()
    end_time_struct = time.localtime(end_time)
    end_time_formatted = time.strftime("%H:%M:%S", end_time_struct)
    print(f"Inference ended at {end_time_formatted}, taking {end_time-start_time}s")

    # Save image + metadata
    # Keeping the metadata should make later analysis easier.
    user_history.save_image(
        label=prompt,
        image=out_image["images"][0],
        profile=profile,
        metadata={
            "prompt": prompt,
            "negative_prompt": negative_prompt,
            "guidance_scale": guidance_scale,
            "controlnet_conditioning_scale": controlnet_conditioning_scale,
            "control_guidance_start": control_guidance_start,
            "control_guidance_end": control_guidance_end,
            "upscaler_strength": upscaler_strength,
            "seed": seed,
            "sampler": sampler,
        },
    )

    return out_image["images"][0], gr.update(visible=True), gr.update(visible=True), my_seed

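# Example of calling inference() directly (hypothetical file name and prompt; in the Space
# it is normally triggered through the Gradio event wiring below):
#   protected, _, _, seed_used = inference(Image.open("input.png"), "a medieval village", "low quality", seed=42)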
with gr.Blocks() as app:
    gr.Markdown(
        '''
        <div style="text-align: center;">
            <h1>Destroy Deepfake, Protect Image</h1>
            <p style="font-size:16px;">Generate your image with a protective shield. Try it now!</p>
            <p>When you upload an image, a protective filter is applied and the modified image is returned. Even if malicious users try to use the protected photo for deepfake synthesis, the protective filter will ensure that the results are distorted.</p>
            <p>If you have any questions, please contact us at <a href="mailto:[email protected]">[email protected]</a>.</p>
            <p>Please send your feedback to <a href="https://(add the feedback Google Form link here)">this form</a>; it will greatly help us improve our service. Given a prompt and your pattern, we use a QR-code-conditioned ControlNet to create a stunning illusion! Credit to <a href="https://twitter.com/MrUgleh">MrUgleh</a> for discovering the workflow :)</p>
        </div>
        '''
    )

    # Used when saving the input/output images.
    # state_img_input = gr.State()
    # state_img_output = gr.State()

    with gr.Row():
        with gr.Column():
            control_image = gr.Image(label="Input your image", type="pil", elem_id="control_image")
            controlnet_conditioning_scale = gr.Slider(minimum=0.0, maximum=5.0, step=0.01, value=0.8, label="protecting strength", elem_id="illusion_strength", info="ControlNet conditioning scale")
            # gr.Examples(examples=["checkers.png", "checkers_mid.jpg", "pattern.png", "ultra_checkers.png", "spiral.jpeg", "funky.jpeg"], inputs=control_image)
            prompt = gr.Textbox(label="Prompt", elem_id="prompt", info="Type what you want to generate", placeholder="Medieval village scene with busy streets and castle in the distance")
            negative_prompt = gr.Textbox(label="Negative Prompt", info="Type what you don't want to see", value="low quality", elem_id="negative_prompt")
            with gr.Accordion(label="Advanced Options", open=False):
                guidance_scale = gr.Slider(minimum=0.0, maximum=50.0, step=0.25, value=7.5, label="Guidance Scale")
                sampler = gr.Dropdown(choices=list(SAMPLER_MAP.keys()), value="Euler")
                control_start = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=0, label="Start of ControlNet")
                control_end = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=1, label="End of ControlNet")
                strength = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=1, label="Strength of the upscaler")
                seed = gr.Slider(minimum=-1, maximum=9999999999, step=1, value=-1, label="Seed", info="-1 means random seed")
                used_seed = gr.Number(label="Last seed used", interactive=False)
            run_btn = gr.Button("Run")
        with gr.Column():
            result_image = gr.Image(label="Illusion Diffusion Output", interactive=False, elem_id="output")
            with gr.Group(elem_id="share-btn-container", visible=False) as share_group:
                community_icon = gr.HTML(community_icon_html)
                loading_icon = gr.HTML(loading_icon_html)
                share_button = gr.Button("Share to community", elem_id="share-btn")

    prompt.submit(
        check_inputs,
        inputs=[prompt, control_image],
        queue=False
    ).success(
        inference,
        inputs=[control_image, prompt, negative_prompt, guidance_scale, controlnet_conditioning_scale, control_start, control_end, strength, seed, sampler],
        outputs=[result_image, result_image, share_group, used_seed])

    run_btn.click(
        check_inputs,
        inputs=[prompt, control_image],
        queue=False
    ).success(
        inference,
        inputs=[control_image, prompt, negative_prompt, guidance_scale, controlnet_conditioning_scale, control_start, control_end, strength, seed, sampler],
        outputs=[result_image, result_image, share_group, used_seed])

    share_button.click(None, [], [], js=share_js)

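# Wiring note: on both triggers (pressing Enter in the prompt box and clicking Run),
# check_inputs validates first and inference only runs on success. result_image is listed
# twice in the outputs because inference returns both the image and a visibility update
# for it, and the final output writes the seed that was actually used into "Last seed used".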
with gr.Blocks(css=css) as app_with_history:
    with gr.Tab("Demo"):
        app.render()
    with gr.Tab("Past generations"):
        user_history.render()

app_with_history.queue(max_size=20, api_open=False)

if __name__ == "__main__":
    app_with_history.launch(max_threads=400)