Spaces:

ECCV2022
/

Screen_Image_Demoireing

Running

App Files Files Community

Andyx committed on Jul 27, 2022

Commit

b1c6042

0 Parent(s):

0

Browse files

Files changed (12) hide show

.gitattributes +3 -0
001.jpg +3 -0
002.jpg +3 -0
003.jpg +3 -0
004.jpg +3 -0
005.jpg +3 -0
README.md +12 -0
app.py +115 -0
mix.pth +3 -0
model/nets.py +259 -0
requirements.txt +6 -0
uhdm_checkpoint.pth +3 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,3 @@

+*.pth filter=lfs diff=lfs merge=lfs -text
+*.jpg filter=lfs diff=lfs merge=lfs -text
+.jpg filter=lfs diff=lfs merge=lfs -text

001.jpg ADDED Viewed

Git LFS Details

SHA256: a57fa193ce0c4e532f9ce55169eee2f83475b0422485744fa82a3ae3abfcc3b6
Pointer size: 132 Bytes
Size of remote file: 5.07 MB

002.jpg ADDED Viewed

Git LFS Details

SHA256: b9181c80dd860b54fbc8da4dee1565aeffb5c55b24fd2d5a819edf13ba4a2993
Pointer size: 132 Bytes
Size of remote file: 4.8 MB

003.jpg ADDED Viewed

Git LFS Details

SHA256: 03d8605cf8d695d775a1c4fe172e6313447cf74a34fa9272f168df13ffb04d09
Pointer size: 132 Bytes
Size of remote file: 4.84 MB

004.jpg ADDED Viewed

Git LFS Details

SHA256: 9ac79dfac7ab723dd3f07589aa7ae7e680ee22c6a37800bd79cce6cd82940c35
Pointer size: 129 Bytes
Size of remote file: 8.12 kB

005.jpg ADDED Viewed

Git LFS Details

SHA256: 3213c47088e5d0e78a23a1e51abc9d3ce202b16524705d2a7a54cf91a6979819
Pointer size: 129 Bytes
Size of remote file: 7.75 kB

README.md ADDED Viewed

	@@ -0,0 +1,12 @@

+---
+title: Screen Image Demoireing
+emoji: ⚡
+colorFrom: purple
+colorTo: purple
+sdk: gradio
+sdk_version: 3.1.1
+app_file: app.py
+pinned: false
+---
+Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

app.py ADDED Viewed

	@@ -0,0 +1,115 @@

+import gradio as gr
+from model.nets import my_model
+import torch
+import cv2
+import torch.utils.data as data
+import torchvision.transforms as transforms
+import PIL
+from PIL import Image
+from PIL import ImageFile
+import math
+import os
+import torch.nn.functional as F
+os.environ["CUDA_VISIBLE_DEVICES"] = "1"
+device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+model1 = my_model(en_feature_num=48,
+                     en_inter_num=32,
+                     de_feature_num=64,
+                     de_inter_num=32,
+                     sam_number=1,
+                     ).to(device)
+load_path1 = "./mix.pth"
+model_state_dict1 = torch.load(load_path1, map_location=device)
+model1.load_state_dict(model_state_dict1)
+model2 = my_model(en_feature_num=48,
+                     en_inter_num=32,
+                     de_feature_num=64,
+                     de_inter_num=32,
+                     sam_number=1,
+                     ).to(device)
+load_path2 = "./uhdm_checkpoint.pth"
+model_state_dict2 = torch.load(load_path2, map_location=device)
+model2.load_state_dict(model_state_dict2)
+def default_toTensor(img):
+    t_list = [transforms.ToTensor()]
+    composed_transform = transforms.Compose(t_list)
+    return composed_transform(img)
+def predict1(img):
+    in_img = transforms.ToTensor()(img).to(device).unsqueeze(0)
+    b, c, h, w = in_img.size()
+    # pad image such that the resolution is a multiple of 32
+    w_pad = (math.ceil(w / 32) * 32 - w) // 2
+    h_pad = (math.ceil(h / 32) * 32 - h) // 2
+    in_img = img_pad(in_img, w_r=w_pad, h_r=h_pad)
+    with torch.no_grad():
+        out_1, out_2, out_3 = model1(in_img)
+        if h_pad != 0:
+            out_1 = out_1[:, :, h_pad:-h_pad, :]
+        if w_pad != 0:
+            out_1 = out_1[:, :, :, w_pad:-w_pad]
+    out_1 = out_1.squeeze(0)
+    out_1 = PIL.Image.fromarray(torch.clamp(out_1 * 255, min=0, max=255
+    ).byte().permute(1, 2, 0).cpu().numpy())
+    return out_1
+def predict2(img):
+    in_img = transforms.ToTensor()(img).to(device).unsqueeze(0)
+    b, c, h, w = in_img.size()
+    # pad image such that the resolution is a multiple of 32
+    w_pad = (math.ceil(w / 32) * 32 - w) // 2
+    h_pad = (math.ceil(h / 32) * 32 - h) // 2
+    in_img = img_pad(in_img, w_r=w_pad, h_r=h_pad)
+    with torch.no_grad():
+        out_1, out_2, out_3 = model2(in_img)
+        if h_pad != 0:
+            out_1 = out_1[:, :, h_pad:-h_pad, :]
+        if w_pad != 0:
+            out_1 = out_1[:, :, :, w_pad:-w_pad]
+    out_1 = out_1.squeeze(0)
+    out_1 = PIL.Image.fromarray(torch.clamp(out_1 * 255, min=0, max=255
+    ).byte().permute(1, 2, 0).cpu().numpy())
+    return out_1
+def img_pad(x, h_r=0, w_r=0):
+    '''
+    Here the padding values are determined by the average r,g,b values across the training set
+    in FHDMi dataset. For the evaluation on the UHDM, you can also try the commented lines where
+    the mean values are calculated from UHDM training set, yielding similar performance.
+    '''
+    x1 = F.pad(x[:, 0:1, ...], (w_r, w_r, h_r, h_r), value=0.3827)
+    x2 = F.pad(x[:, 1:2, ...], (w_r, w_r, h_r, h_r), value=0.4141)
+    x3 = F.pad(x[:, 2:3, ...], (w_r, w_r, h_r, h_r), value=0.3912)
+    y = torch.cat([x1, x2, x3], dim=1)
+    return y
+img1 = Image.open('./imgs/001.jpg').convert('RGB')
+img2 = Image.open('./imgs/002.jpg').convert('RGB')
+img3 = Image.open('./imgs/003.jpg').convert('RGB')
+img4 = Image.open('./imgs/004.jpg').convert('RGB')
+img5 = Image.open('./imgs/005.jpg').convert('RGB')
+iface1 = gr.Interface(fn=predict1,
+             inputs=gr.inputs.Image(type="pil"),
+             outputs=gr.inputs.Image(type="pil"))
+iface2 = gr.Interface(fn=predict2,
+             inputs=gr.inputs.Image(type="pil"),
+             outputs=gr.inputs.Image(type="pil"))
+iface_all = gr.mix.Parallel(
+    iface1, iface2,
+    examples=[img1, img2, img3, img4, img5]
+)
+iface_all.launch()

mix.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bdcdd33f11e1d5eb836671f15991ecb42134bd5ba98c1e4de3b8e2f4138fdb2b
+size 23895301

model/nets.py ADDED Viewed

	@@ -0,0 +1,259 @@

+"""
+Implementation of ESDNet for image demoireing
+"""
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import torchvision
+from torch.nn.parameter import Parameter
+class my_model(nn.Module):
+    def __init__(self,
+                 en_feature_num,
+                 en_inter_num,
+                 de_feature_num,
+                 de_inter_num,
+                 sam_number=1,
+                 ):
+        super(my_model, self).__init__()
+        self.encoder = Encoder(feature_num=en_feature_num, inter_num=en_inter_num, sam_number=sam_number)
+        self.decoder = Decoder(en_num=en_feature_num, feature_num=de_feature_num, inter_num=de_inter_num,
+                               sam_number=sam_number)
+    def forward(self, x):
+        y_1, y_2, y_3 = self.encoder(x)
+        out_1, out_2, out_3 = self.decoder(y_1, y_2, y_3)
+        return out_1, out_2, out_3
+    def _initialize_weights(self):
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d):
+                m.weight.data.normal_(0.0, 0.02)
+                if m.bias is not None:
+                    m.bias.data.normal_(0.0, 0.02)
+            if isinstance(m, nn.ConvTranspose2d):
+                m.weight.data.normal_(0.0, 0.02)
+class Decoder(nn.Module):
+    def __init__(self, en_num, feature_num, inter_num, sam_number):
+        super(Decoder, self).__init__()
+        self.preconv_3 = conv_relu(4 * en_num, feature_num, 3, padding=1)
+        self.decoder_3 = Decoder_Level(feature_num, inter_num, sam_number)
+        self.preconv_2 = conv_relu(2 * en_num + feature_num, feature_num, 3, padding=1)
+        self.decoder_2 = Decoder_Level(feature_num, inter_num, sam_number)
+        self.preconv_1 = conv_relu(en_num + feature_num, feature_num, 3, padding=1)
+        self.decoder_1 = Decoder_Level(feature_num, inter_num, sam_number)
+    def forward(self, y_1, y_2, y_3):
+        x_3 = y_3
+        x_3 = self.preconv_3(x_3)
+        out_3, feat_3 = self.decoder_3(x_3)
+        x_2 = torch.cat([y_2, feat_3], dim=1)
+        x_2 = self.preconv_2(x_2)
+        out_2, feat_2 = self.decoder_2(x_2)
+        x_1 = torch.cat([y_1, feat_2], dim=1)
+        x_1 = self.preconv_1(x_1)
+        out_1 = self.decoder_1(x_1, feat=False)
+        return out_1, out_2, out_3
+class Encoder(nn.Module):
+    def __init__(self, feature_num, inter_num, sam_number):
+        super(Encoder, self).__init__()
+        self.conv_first = nn.Sequential(
+            nn.Conv2d(12, feature_num, kernel_size=5, stride=1, padding=2, bias=True),
+            nn.ReLU(inplace=True)
+        )
+        self.encoder_1 = Encoder_Level(feature_num, inter_num, level=1, sam_number=sam_number)
+        self.encoder_2 = Encoder_Level(2 * feature_num, inter_num, level=2, sam_number=sam_number)
+        self.encoder_3 = Encoder_Level(4 * feature_num, inter_num, level=3, sam_number=sam_number)
+    def forward(self, x):
+        x = F.pixel_unshuffle(x, 2)
+        x = self.conv_first(x)
+        out_feature_1, down_feature_1 = self.encoder_1(x)
+        out_feature_2, down_feature_2 = self.encoder_2(down_feature_1)
+        out_feature_3 = self.encoder_3(down_feature_2)
+        return out_feature_1, out_feature_2, out_feature_3
+class Encoder_Level(nn.Module):
+    def __init__(self, feature_num, inter_num, level, sam_number):
+        super(Encoder_Level, self).__init__()
+        self.rdb = RDB(in_channel=feature_num, d_list=(1, 2, 1), inter_num=inter_num)
+        self.sam_blocks = nn.ModuleList()
+        for _ in range(sam_number):
+            sam_block = SAM(in_channel=feature_num, d_list=(1, 2, 3, 2, 1), inter_num=inter_num)
+            self.sam_blocks.append(sam_block)
+        if level < 3:
+            self.down = nn.Sequential(
+                nn.Conv2d(feature_num, 2 * feature_num, kernel_size=3, stride=2, padding=1, bias=True),
+                nn.ReLU(inplace=True)
+            )
+        self.level = level
+    def forward(self, x):
+        out_feature = self.rdb(x)
+        for sam_block in self.sam_blocks:
+            out_feature = sam_block(out_feature)
+        if self.level < 3:
+            down_feature = self.down(out_feature)
+            return out_feature, down_feature
+        return out_feature
+class Decoder_Level(nn.Module):
+    def __init__(self, feature_num, inter_num, sam_number):
+        super(Decoder_Level, self).__init__()
+        self.rdb = RDB(feature_num, (1, 2, 1), inter_num)
+        self.sam_blocks = nn.ModuleList()
+        for _ in range(sam_number):
+            sam_block = SAM(in_channel=feature_num, d_list=(1, 2, 3, 2, 1), inter_num=inter_num)
+            self.sam_blocks.append(sam_block)
+        self.conv = conv(in_channel=feature_num, out_channel=12, kernel_size=3, padding=1)
+    def forward(self, x, feat=True):
+        x = self.rdb(x)
+        for sam_block in self.sam_blocks:
+            x = sam_block(x)
+        out = self.conv(x)
+        out = F.pixel_shuffle(out, 2)
+        if feat:
+            feature = F.interpolate(x, scale_factor=2, mode='bilinear')
+            return out, feature
+        else:
+            return out
+class DB(nn.Module):
+    def __init__(self, in_channel, d_list, inter_num):
+        super(DB, self).__init__()
+        self.d_list = d_list
+        self.conv_layers = nn.ModuleList()
+        c = in_channel
+        for i in range(len(d_list)):
+            dense_conv = conv_relu(in_channel=c, out_channel=inter_num, kernel_size=3, dilation_rate=d_list[i],
+                                   padding=d_list[i])
+            self.conv_layers.append(dense_conv)
+            c = c + inter_num
+        self.conv_post = conv(in_channel=c, out_channel=in_channel, kernel_size=1)
+    def forward(self, x):
+        t = x
+        for conv_layer in self.conv_layers:
+            _t = conv_layer(t)
+            t = torch.cat([_t, t], dim=1)
+        t = self.conv_post(t)
+        return t
+class SAM(nn.Module):
+    def __init__(self, in_channel, d_list, inter_num):
+        super(SAM, self).__init__()
+        self.basic_block = DB(in_channel=in_channel, d_list=d_list, inter_num=inter_num)
+        self.basic_block_2 = DB(in_channel=in_channel, d_list=d_list, inter_num=inter_num)
+        self.basic_block_4 = DB(in_channel=in_channel, d_list=d_list, inter_num=inter_num)
+        self.fusion = CSAF(3 * in_channel)
+    def forward(self, x):
+        x_0 = x
+        x_2 = F.interpolate(x, scale_factor=0.5, mode='bilinear')
+        x_4 = F.interpolate(x, scale_factor=0.25, mode='bilinear')
+        y_0 = self.basic_block(x_0)
+        y_2 = self.basic_block_2(x_2)
+        y_4 = self.basic_block_4(x_4)
+        y_2 = F.interpolate(y_2, scale_factor=2, mode='bilinear')
+        y_4 = F.interpolate(y_4, scale_factor=4, mode='bilinear')
+        y = self.fusion(y_0, y_2, y_4)
+        y = x + y
+        return y
+class CSAF(nn.Module):
+    def __init__(self, in_chnls, ratio=4):
+        super(CSAF, self).__init__()
+        self.squeeze = nn.AdaptiveAvgPool2d((1, 1))
+        self.compress1 = nn.Conv2d(in_chnls, in_chnls // ratio, 1, 1, 0)
+        self.compress2 = nn.Conv2d(in_chnls // ratio, in_chnls // ratio, 1, 1, 0)
+        self.excitation = nn.Conv2d(in_chnls // ratio, in_chnls, 1, 1, 0)
+    def forward(self, x0, x2, x4):
+        out0 = self.squeeze(x0)
+        out2 = self.squeeze(x2)
+        out4 = self.squeeze(x4)
+        out = torch.cat([out0, out2, out4], dim=1)
+        out = self.compress1(out)
+        out = F.relu(out)
+        out = self.compress2(out)
+        out = F.relu(out)
+        out = self.excitation(out)
+        out = F.sigmoid(out)
+        w0, w2, w4 = torch.chunk(out, 3, dim=1)
+        x = x0 * w0 + x2 * w2 + x4 * w4
+        return x
+class RDB(nn.Module):
+    def __init__(self, in_channel, d_list, inter_num):
+        super(RDB, self).__init__()
+        self.d_list = d_list
+        self.conv_layers = nn.ModuleList()
+        c = in_channel
+        for i in range(len(d_list)):
+            dense_conv = conv_relu(in_channel=c, out_channel=inter_num, kernel_size=3, dilation_rate=d_list[i],
+                                   padding=d_list[i])
+            self.conv_layers.append(dense_conv)
+            c = c + inter_num
+        self.conv_post = conv(in_channel=c, out_channel=in_channel, kernel_size=1)
+    def forward(self, x):
+        t = x
+        for conv_layer in self.conv_layers:
+            _t = conv_layer(t)
+            t = torch.cat([_t, t], dim=1)
+        t = self.conv_post(t)
+        return t + x
+class conv(nn.Module):
+    def __init__(self, in_channel, out_channel, kernel_size, dilation_rate=1, padding=0, stride=1):
+        super(conv, self).__init__()
+        self.conv = nn.Conv2d(in_channels=in_channel, out_channels=out_channel, kernel_size=kernel_size, stride=stride,
+                              padding=padding, bias=True, dilation=dilation_rate)
+    def forward(self, x_input):
+        out = self.conv(x_input)
+        return out
+class conv_relu(nn.Module):
+    def __init__(self, in_channel, out_channel, kernel_size, dilation_rate=1, padding=0, stride=1):
+        super(conv_relu, self).__init__()
+        self.conv = nn.Sequential(
+            nn.Conv2d(in_channels=in_channel, out_channels=out_channel, kernel_size=kernel_size, stride=stride,
+                      padding=padding, bias=True, dilation=dilation_rate),
+            nn.ReLU(inplace=True)
+        )
+    def forward(self, x_input):
+        out = self.conv(x_input)
+        return out

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+# NOTE(review): gradio is not listed here; README.md declares `sdk: gradio`, so presumably the Space runtime installs it — confirm.
+numpy==1.21.5
+torch>=1.9.0
+opencv-python==4.5.5.64
+scikit-image==0.19.2
+# NOTE(review): 0.1.8 looks like a typo for a 0.10.x release (the torchvision line that pairs with torch 1.9) — confirm before relying on this pin.
+torchvision==0.1.8

uhdm_checkpoint.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:254235cd25f90a3f1785885385dc6cb3f2178e053291ab53d1943bd7c2f7de65
+size 23895301