# NOTE: removed non-code extraction artifacts (file-size line and git-blame
# hash/line-number dump) that are not valid Python.
import numpy as np
import torch
import torch.nn.functional as F
from torchvision.transforms.functional import normalize
from huggingface_hub import hf_hub_download
import gradio as gr
from briarmbg import BriaRMBG
from PIL import Image
# Model initialization and weight loading.
net = BriaRMBG()
# Fetch the pretrained checkpoint from the Hugging Face Hub (cached locally).
model_path = hf_hub_download("briaai/RMBG-1.4", 'model.pth')
if torch.cuda.is_available():
    net.load_state_dict(torch.load(model_path))
    net = net.cuda()
else:
    # No GPU available: remap the checkpoint tensors onto the CPU.
    net.load_state_dict(torch.load(model_path, map_location="cpu"))
# Inference only: switch off dropout / batch-norm training behavior.
net.eval()
def resize_image(image, model_input_size=(1024, 1024)):
    """Convert *image* to RGB and resize it to the network's input size.

    Args:
        image: Source PIL image (any mode).
        model_input_size: ``(width, height)`` expected by the model;
            defaults to 1024x1024 as required by RMBG-1.4.

    Returns:
        A new RGB PIL image of ``model_input_size``.
    """
    image = image.convert('RGB')
    # Use the Image.Resampling namespace (as merge_images already does)
    # instead of the deprecated top-level Image.BILINEAR alias.
    image = image.resize(model_input_size, Image.Resampling.BILINEAR)
    return image
def process(image, background_image=None):
    """Remove the background from *image*; optionally composite onto a backdrop.

    Args:
        image: Input image as a numpy array (H, W, C) — Gradio ``type="numpy"``.
        background_image: Optional PIL image. When given, the cutout is scaled,
            centered and pasted onto it via ``merge_images``.

    Returns:
        An RGBA PIL image: the foreground over a transparent background, or the
        merged composite when *background_image* is provided.
    """
    # Prepare the input: keep the full-resolution original for compositing,
    # feed a resized, normalized copy to the network.
    orig_image = Image.fromarray(image).convert("RGBA")
    w, h = orig_image.size
    im_np = np.array(resize_image(orig_image))
    im_tensor = torch.tensor(im_np, dtype=torch.float32).permute(2, 0, 1).unsqueeze(0) / 255.0
    im_tensor = normalize(im_tensor, [0.5, 0.5, 0.5], [1.0, 1.0, 1.0])
    if torch.cuda.is_available():
        im_tensor = im_tensor.cuda()

    # Inference
    with torch.no_grad():
        result = net(im_tensor)

    # Post-processing: upsample the predicted matte back to the original
    # resolution, then map it to a 0-255 alpha mask.
    result = torch.squeeze(
        F.interpolate(result[0][0], size=(h, w), mode='bilinear', align_corners=False), 0
    )
    result = torch.sigmoid(result)
    mask = (result * 255).byte().cpu().numpy()
    # Collapse any leftover singleton dimensions so Image.fromarray
    # receives a plain 2-D array.
    if mask.ndim > 2:
        mask = mask.squeeze()
    mask = mask.astype(np.uint8)
    mask_image = Image.fromarray(mask, 'L')  # 'L' mode = 8-bit grayscale

    # Use the mask as the alpha channel of the original image.
    final_image = Image.new("RGBA", orig_image.size)
    final_image.paste(orig_image, mask=mask_image)

    # Optional background compositing.
    if background_image is not None:
        final_image = merge_images(background_image, final_image)
    return final_image
def merge_images(background_image, foreground_image):
    """Paste a background-removed image onto a backdrop image.

    The foreground is shrunk to 30% of the backdrop's width (aspect ratio
    preserved), centered on the backdrop, and pasted using its own alpha
    channel as the transparency mask.
    """
    backdrop = background_image.convert("RGBA")
    cutout = foreground_image.convert("RGBA")

    # Scale the cutout to 30% of the backdrop width, keeping its aspect ratio.
    scale_factor = 0.3
    target_w = int(backdrop.width * scale_factor)
    target_h = int(cutout.height * target_w / cutout.width)
    scaled = cutout.resize((target_w, target_h), Image.Resampling.LANCZOS)

    # Center the scaled cutout; passing it as the third argument makes its
    # alpha channel act as the paste mask.
    offset = ((backdrop.width - target_w) // 2, (backdrop.height - target_h) // 2)
    backdrop.paste(scaled, offset, scaled)
    return backdrop
# Gradio UI metadata and interface wiring.
title = "Background Removal"
description = "This is a demo for BRIA RMBG 1.4 using the BRIA RMBG-1.4 image matting model as backbone."
demo = gr.Interface(
    fn=process,
    inputs=[
        gr.Image(type="numpy", label="Image to remove background"),
        # 'optional=True' may not be needed depending on the Gradio version.
        gr.Image(type="pil", label="Optional: Background Image")
    ],
    outputs="image",
    title=title,
    description=description
)

if __name__ == "__main__":
    demo.launch()