Spaces:

innovatorved
/

ImageColorizationUsingGAN

Runtime error

App Files Files Community

Ved Gupta committed on Apr 16, 2023

Commit

1c7b15f

1 Parent(s): 77b60c4

initially repo created

Browse files

Files changed (12) hide show

.gitignore +1 -0
Pipfile.lock +20 -0
image-colorization-using-gan-main.ipynb +0 -0
main.py +8 -7
model/Discriminator.py +28 -13
model/Generator.py +35 -18
model/__init__.py +26 -18
model/loss.py +43 -0
model/weights.py +14 -14
requirements.txt +100 -0
utility/__init__.py +1 -1
utility/helper.py +71 -37

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ model/ImageColorizationModel.pth

Pipfile.lock ADDED Viewed

	@@ -0,0 +1,20 @@

+{
+    "_meta": {
+        "hash": {
+            "sha256": "fedbd2ab7afd84cf16f128af0619749267b62277b4cb6989ef16d4bef6e4eef2"
+        },
+        "pipfile-spec": 6,
+        "requires": {
+            "python_version": "3.10"
+        },
+        "sources": [
+            {
+                "name": "pypi",
+                "url": "https://pypi.org/simple",
+                "verify_ssl": true
+            }
+        ]
+    },
+    "default": {},
+    "develop": {}
+}

image-colorization-using-gan-main.ipynb CHANGED Viewed

The diff for this file is too large to render. See raw diff

main.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import warnings
 warnings.filterwarnings("ignore")
 import os
@@ -28,15 +29,18 @@ model_path = "model/ImageColorizationModel.pth"
 model = None
-if not os.path.exists(model_path) :
     print("Model not find")
     download_from_drive()
     print("Model Downloaded")
 else:
-    model = load_model(model_class=MainModel , file_path=model_path)
     print("Model Loaded")
 def predict_and_return_image(image):
     data = create_lab_tensors(image)
     model.net_G.eval()
     with torch.no_grad():
@@ -48,8 +52,7 @@ def predict_and_return_image(image):
     return fake_imgs[0]
 title = "Black&White to Color image"
 description = "Transforming Black & White Image in to colored image. Upload a black and white image to see it colorized by our deep learning model."
@@ -59,7 +62,5 @@ gr.Interface(
     title=title,
     description=description,
     inputs=[gr.Image(label="Gray Scale Image")],
-    outputs=[
-        gr.Image(label="Predicted Colored Image")
-    ],
 ).launch(share=True, debug=True)

 import warnings
 warnings.filterwarnings("ignore")
 import os
 model = None
+if not os.path.exists(model_path):
     print("Model not find")
     download_from_drive()
     print("Model Downloaded")
 else:
+    model = load_model_with_cpu(model_class=MainModel, file_path=model_path)
     print("Model Loaded")
 def predict_and_return_image(image):
+    if image is None:
+        return None
     data = create_lab_tensors(image)
     model.net_G.eval()
     with torch.no_grad():
     return fake_imgs[0]
+import gradio as gr
 title = "Black&White to Color image"
 description = "Transforming Black & White Image in to colored image. Upload a black and white image to see it colorized by our deep learning model."
     title=title,
     description=description,
     inputs=[gr.Image(label="Gray Scale Image")],
+    outputs=[gr.Image(label="Predicted Colored Image")],
 ).launch(share=True, debug=True)

model/Discriminator.py CHANGED Viewed

@@ -16,22 +16,37 @@ from torch.utils.data import Dataset, DataLoader
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 class PatchDiscriminator(nn.Module):
     def __init__(self, input_c, num_filters=64, n_down=3):
         super().__init__()
         model = [self.get_layers(input_c, num_filters, norm=False)]
-        model += [self.get_layers(num_filters * 2 ** i, num_filters * 2 ** (i + 1), s=1 if i == (n_down-1) else 2)
-                          for i in range(n_down)] # the 'if' statement is taking care of not using
-                                                  # stride of 2 for the last block in this loop
-        model += [self.get_layers(num_filters * 2 ** n_down, 1, s=1, norm=False, act=False)] # Make sure to not use normalization or
-                                                                                             # activation for the last layer of the model
-        self.model = nn.Sequential(*model)
-    def get_layers(self, ni, nf, k=4, s=2, p=1, norm=True, act=True): # when needing to make some repeatitive blocks of layers,
-        layers = [nn.Conv2d(ni, nf, k, s, p, bias=not norm)]          # it's always helpful to make a separate method for that purpose
-        if norm: layers += [nn.BatchNorm2d(nf)]
-        if act: layers += [nn.LeakyReLU(0.2, True)]
         return nn.Sequential(*layers)
     def forward(self, x):
-        return self.model(x)

 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 class PatchDiscriminator(nn.Module):
     """Fully convolutional discriminator ending in a single-channel feature map.

     The network is a sequence of ``Conv2d -> [BatchNorm2d] -> [LeakyReLU(0.2)]``
     blocks: one un-normalised input block, ``n_down`` blocks that each double
     the channel count, and a final one-channel projection that has neither
     normalisation nor activation.

     Args:
         input_c: Number of channels of the input tensor.
         num_filters: Output channels of the first block.
         n_down: Number of channel-doubling blocks that follow the first block.
     """

     def __init__(self, input_c, num_filters=64, n_down=3):
         super().__init__()
         blocks = [self.get_layers(input_c, num_filters, norm=False)]
         for i in range(n_down):
             # Every doubling block uses stride 2 except the last one in this
             # loop, which keeps stride 1.
             stride = 1 if i == (n_down - 1) else 2
             blocks.append(
                 self.get_layers(
                     num_filters * 2**i,
                     num_filters * 2 ** (i + 1),
                     s=stride,
                 )
             )
         # The output block must not apply normalisation or an activation.
         blocks.append(
             self.get_layers(num_filters * 2**n_down, 1, s=1, norm=False, act=False)
         )
         self.model = nn.Sequential(*blocks)

     def get_layers(self, ni, nf, k=4, s=2, p=1, norm=True, act=True):
         """Build one repeated block: Conv2d, optional BatchNorm2d, optional LeakyReLU.

         Args:
             ni: Input channels of the convolution.
             nf: Output channels of the convolution.
             k: Kernel size.
             s: Stride.
             p: Padding.
             norm: Append ``BatchNorm2d(nf)``; the convolution then has no bias.
             act: Append an in-place ``LeakyReLU(0.2)``.

         Returns:
             An ``nn.Sequential`` holding the layers in the order listed above.
         """
         block = [nn.Conv2d(ni, nf, k, s, p, bias=not norm)]
         if norm:
             block.append(nn.BatchNorm2d(nf))
         if act:
             block.append(nn.LeakyReLU(0.2, True))
         return nn.Sequential(*block)

     def forward(self, x):
         """Run ``x`` through the stacked blocks and return the resulting map."""
         return self.model(x)

model/Generator.py CHANGED Viewed

@@ -16,40 +16,53 @@ from torch.utils.data import Dataset, DataLoader
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 class UnetBlock(nn.Module):
-    def __init__(self, nf, ni, submodule=None, input_c=None, dropout=False,
-                 innermost=False, outermost=False):
         super().__init__()
         self.outermost = outermost
-        if input_c is None: input_c = nf
-        downconv = nn.Conv2d(input_c, ni, kernel_size=4,
-                             stride=2, padding=1, bias=False)
         downrelu = nn.LeakyReLU(0.2, True)
         downnorm = nn.BatchNorm2d(ni)
         uprelu = nn.ReLU(True)
         upnorm = nn.BatchNorm2d(nf)
         if outermost:
-            upconv = nn.ConvTranspose2d(ni * 2, nf, kernel_size=4,
-                                        stride=2, padding=1)
             down = [downconv]
             up = [uprelu, upconv, nn.Tanh()]
             model = down + [submodule] + up
         elif innermost:
-            upconv = nn.ConvTranspose2d(ni, nf, kernel_size=4,
-                                        stride=2, padding=1, bias=False)
             down = [downrelu, downconv]
             up = [uprelu, upconv, upnorm]
             model = down + up
         else:
-            upconv = nn.ConvTranspose2d(ni * 2, nf, kernel_size=4,
-                                        stride=2, padding=1, bias=False)
             down = [downrelu, downconv, downnorm]
             up = [uprelu, upconv, upnorm]
-            if dropout: up += [nn.Dropout(0.5)]
             model = down + [submodule] + up
         self.model = nn.Sequential(*model)
     def forward(self, x):
         if self.outermost:
             return self.model(x)
@@ -62,12 +75,16 @@ class Unet(nn.Module):
         super().__init__()
         unet_block = UnetBlock(num_filters * 8, num_filters * 8, innermost=True)
         for _ in range(n_down - 5):
-            unet_block = UnetBlock(num_filters * 8, num_filters * 8, submodule=unet_block, dropout=True)
         out_filters = num_filters * 8
         for _ in range(3):
             unet_block = UnetBlock(out_filters // 2, out_filters, submodule=unet_block)
             out_filters //= 2
-        self.model = UnetBlock(output_c, out_filters, input_c=input_c, submodule=unet_block, outermost=True)
     def forward(self, x):
-        return self.model(x)

 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 class UnetBlock(nn.Module):
+    def __init__(
+        self,
+        nf,
+        ni,
+        submodule=None,
+        input_c=None,
+        dropout=False,
+        innermost=False,
+        outermost=False,
+    ):
         super().__init__()
         self.outermost = outermost
+        if input_c is None:
+            input_c = nf
+        downconv = nn.Conv2d(
+            input_c, ni, kernel_size=4, stride=2, padding=1, bias=False
+        )
         downrelu = nn.LeakyReLU(0.2, True)
         downnorm = nn.BatchNorm2d(ni)
         uprelu = nn.ReLU(True)
         upnorm = nn.BatchNorm2d(nf)
         if outermost:
+            upconv = nn.ConvTranspose2d(ni * 2, nf, kernel_size=4, stride=2, padding=1)
             down = [downconv]
             up = [uprelu, upconv, nn.Tanh()]
             model = down + [submodule] + up
         elif innermost:
+            upconv = nn.ConvTranspose2d(
+                ni, nf, kernel_size=4, stride=2, padding=1, bias=False
+            )
             down = [downrelu, downconv]
             up = [uprelu, upconv, upnorm]
             model = down + up
         else:
+            upconv = nn.ConvTranspose2d(
+                ni * 2, nf, kernel_size=4, stride=2, padding=1, bias=False
+            )
             down = [downrelu, downconv, downnorm]
             up = [uprelu, upconv, upnorm]
+            if dropout:
+                up += [nn.Dropout(0.5)]
             model = down + [submodule] + up
         self.model = nn.Sequential(*model)
     def forward(self, x):
         if self.outermost:
             return self.model(x)
         super().__init__()
         unet_block = UnetBlock(num_filters * 8, num_filters * 8, innermost=True)
         for _ in range(n_down - 5):
+            unet_block = UnetBlock(
+                num_filters * 8, num_filters * 8, submodule=unet_block, dropout=True
+            )
         out_filters = num_filters * 8
         for _ in range(3):
             unet_block = UnetBlock(out_filters // 2, out_filters, submodule=unet_block)
             out_filters //= 2
+        self.model = UnetBlock(
+            output_c, out_filters, input_c=input_c, submodule=unet_block, outermost=True
+        )
     def forward(self, x):
+        return self.model(x)

model/__init__.py CHANGED Viewed

@@ -14,46 +14,54 @@ from torchvision import transforms
 from torchvision.utils import make_grid
 from torch.utils.data import Dataset, DataLoader
-from .Generator import UnetBlock , Unet
 from .Discriminator import PatchDiscriminator
 from .weights import init_weights
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 def init_model(model, device):
     model = model.to(device)
     model = init_weights(model)
     return model
 class MainModel(nn.Module):
-    def __init__(self, net_G=None, lr_G=2e-4, lr_D=2e-4,
-                 beta1=0.5, beta2=0.999, lambda_L1=100.):
         super().__init__()
         self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         self.lambda_L1 = lambda_L1
         if net_G is None:
-            self.net_G = init_model(Unet(input_c=1, output_c=2, n_down=8, num_filters=64), self.device)
         else:
             self.net_G = net_G.to(self.device)
-        self.net_D = init_model(PatchDiscriminator(input_c=3, n_down=3, num_filters=64), self.device)
-        self.GANcriterion = GANLoss(gan_mode='vanilla').to(self.device)
         self.L1criterion = nn.L1Loss()
         self.opt_G = optim.Adam(self.net_G.parameters(), lr=lr_G, betas=(beta1, beta2))
         self.opt_D = optim.Adam(self.net_D.parameters(), lr=lr_D, betas=(beta1, beta2))
     def set_requires_grad(self, model, requires_grad=True):
         for p in model.parameters():
             p.requires_grad = requires_grad
     def setup_input(self, data):
-        self.L = data['L'].to(self.device)
-        self.ab = data['ab'].to(self.device)
     def forward(self):
         self.fake_color = self.net_G(self.L)
     def backward_D(self):
         fake_image = torch.cat([self.L, self.fake_color], dim=1)
         fake_preds = self.net_D(fake_image.detach())
@@ -63,7 +71,7 @@ class MainModel(nn.Module):
         self.loss_D_real = self.GANcriterion(real_preds, True)
         self.loss_D = (self.loss_D_fake + self.loss_D_real) * 0.5
         self.loss_D.backward()
     def backward_G(self):
         fake_image = torch.cat([self.L, self.fake_color], dim=1)
         fake_preds = self.net_D(fake_image)
@@ -71,7 +79,7 @@ class MainModel(nn.Module):
         self.loss_G_L1 = self.L1criterion(self.fake_color, self.ab) * self.lambda_L1
         self.loss_G = self.loss_G_GAN + self.loss_G_L1
         self.loss_G.backward()
     def optimize(self):
         self.forward()
         self.net_D.train()
@@ -79,9 +87,9 @@ class MainModel(nn.Module):
         self.opt_D.zero_grad()
         self.backward_D()
         self.opt_D.step()
         self.net_G.train()
         self.set_requires_grad(self.net_D, False)
         self.opt_G.zero_grad()
         self.backward_G()
-        self.opt_G.step()

 from torchvision.utils import make_grid
 from torch.utils.data import Dataset, DataLoader
+from .Generator import UnetBlock, Unet
 from .Discriminator import PatchDiscriminator
 from .weights import init_weights
+from .loss import GANLoss
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 def init_model(model, device):
     model = model.to(device)
     model = init_weights(model)
     return model
 class MainModel(nn.Module):
+    def __init__(
+        self, net_G=None, lr_G=2e-4, lr_D=2e-4, beta1=0.5, beta2=0.999, lambda_L1=100.0
+    ):
         super().__init__()
         self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         self.lambda_L1 = lambda_L1
         if net_G is None:
+            self.net_G = init_model(
+                Unet(input_c=1, output_c=2, n_down=8, num_filters=64), self.device
+            )
         else:
             self.net_G = net_G.to(self.device)
+        self.net_D = init_model(
+            PatchDiscriminator(input_c=3, n_down=3, num_filters=64), self.device
+        )
+        self.GANcriterion = GANLoss(gan_mode="vanilla").to(self.device)
         self.L1criterion = nn.L1Loss()
         self.opt_G = optim.Adam(self.net_G.parameters(), lr=lr_G, betas=(beta1, beta2))
         self.opt_D = optim.Adam(self.net_D.parameters(), lr=lr_D, betas=(beta1, beta2))
     def set_requires_grad(self, model, requires_grad=True):
         for p in model.parameters():
             p.requires_grad = requires_grad
     def setup_input(self, data):
+        self.L = data["L"].to(self.device)
+        self.ab = data["ab"].to(self.device)
     def forward(self):
         self.fake_color = self.net_G(self.L)
     def backward_D(self):
         fake_image = torch.cat([self.L, self.fake_color], dim=1)
         fake_preds = self.net_D(fake_image.detach())
         self.loss_D_real = self.GANcriterion(real_preds, True)
         self.loss_D = (self.loss_D_fake + self.loss_D_real) * 0.5
         self.loss_D.backward()
     def backward_G(self):
         fake_image = torch.cat([self.L, self.fake_color], dim=1)
         fake_preds = self.net_D(fake_image)
         self.loss_G_L1 = self.L1criterion(self.fake_color, self.ab) * self.lambda_L1
         self.loss_G = self.loss_G_GAN + self.loss_G_L1
         self.loss_G.backward()
     def optimize(self):
         self.forward()
         self.net_D.train()
         self.opt_D.zero_grad()
         self.backward_D()
         self.opt_D.step()
         self.net_G.train()
         self.set_requires_grad(self.net_D, False)
         self.opt_G.zero_grad()
         self.backward_G()
+        self.opt_G.step()

model/loss.py ADDED Viewed

	@@ -0,0 +1,43 @@

+import warnings
+warnings.filterwarnings("ignore")
+import os
+import sys
+import glob
+import time
+import numpy as np
+from PIL import Image
+from pathlib import Path
+from tqdm.notebook import tqdm
+import matplotlib.pyplot as plt
+from skimage.color import rgb2lab, lab2rgb
+import torch
+from torch import nn, optim
+from torchvision import transforms
+from torchvision.utils import make_grid
+from torch.utils.data import Dataset, DataLoader
class GANLoss(nn.Module):
    """Adversarial loss that builds its own "real" / "fake" target tensors.

    The target value is stored as a registered buffer so it follows the module
    when it is moved with ``.to(device)``.

    Args:
        gan_mode: ``"vanilla"`` selects ``nn.BCEWithLogitsLoss``; ``"lsgan"``
            selects ``nn.MSELoss``.
        real_label: Target value used when the predictions should be judged real.
        fake_label: Target value used when the predictions should be judged fake.

    Raises:
        ValueError: If ``gan_mode`` is not one of the supported modes.
    """

    def __init__(self, gan_mode="vanilla", real_label=1.0, fake_label=0.0):
        super().__init__()
        self.register_buffer("real_label", torch.tensor(real_label))
        self.register_buffer("fake_label", torch.tensor(fake_label))
        if gan_mode == "vanilla":
            self.loss = nn.BCEWithLogitsLoss()
        elif gan_mode == "lsgan":
            self.loss = nn.MSELoss()
        else:
            # Fail at construction instead of leaving ``self.loss`` undefined
            # and crashing with AttributeError on the first call.
            raise ValueError(
                f"Unsupported gan_mode {gan_mode!r}; expected 'vanilla' or 'lsgan'"
            )

    def get_labels(self, preds, target_is_real):
        """Return the real or fake label broadcast to the shape of ``preds``."""
        labels = self.real_label if target_is_real else self.fake_label
        return labels.expand_as(preds)

    def forward(self, preds, target_is_real):
        """Compute the loss of ``preds`` against an all-real or all-fake target.

        Implemented as ``forward`` (not ``__call__``) so that calling the module
        still goes through ``nn.Module.__call__`` and its hook machinery.
        """
        labels = self.get_labels(preds, target_is_real)
        return self.loss(preds, labels)

model/weights.py CHANGED Viewed

@@ -16,24 +16,24 @@ from torch.utils.data import Dataset, DataLoader
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-def init_weights(net, init='norm', gain=0.02):
     def init_func(m):
         classname = m.__class__.__name__
-        if hasattr(m, 'weight') and 'Conv' in classname:
-            if init == 'norm':
                 nn.init.normal_(m.weight.data, mean=0.0, std=gain)
-            elif init == 'xavier':
                 nn.init.xavier_normal_(m.weight.data, gain=gain)
-            elif init == 'kaiming':
-                nn.init.kaiming_normal_(m.weight.data, a=0, mode='fan_in')
-            if hasattr(m, 'bias') and m.bias is not None:
                 nn.init.constant_(m.bias.data, 0.0)
-        elif 'BatchNorm2d' in classname:
-            nn.init.normal_(m.weight.data, 1., gain)
-            nn.init.constant_(m.bias.data, 0.)
     net.apply(init_func)
     print(f"model initialized with {init} initialization")
-    return net

 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
def init_weights(net, init="norm", gain=0.02):
    """Re-initialise the convolution and BatchNorm2d parameters of ``net`` in place.

    Modules whose class name contains ``"Conv"`` get their weight drawn according
    to ``init`` and their bias (when present) set to zero. ``BatchNorm2d``
    modules get weight ~ N(1, gain) and bias 0 when they have affine parameters.

    Args:
        net: Module whose sub-modules are visited with ``net.apply``.
        init: ``"norm"`` (normal, std=``gain``), ``"xavier"`` (Xavier normal with
            ``gain``) or ``"kaiming"`` (Kaiming normal, ``fan_in``).
        gain: Standard deviation / gain used by the chosen scheme.

    Returns:
        The same ``net`` object, after initialisation.

    Raises:
        ValueError: If ``init`` is not one of the supported schemes. Previously
            an unknown value silently skipped the convolution weights while
            still reporting success.
    """
    if init not in ("norm", "xavier", "kaiming"):
        raise ValueError(
            f"Unsupported init {init!r}; expected 'norm', 'xavier' or 'kaiming'"
        )

    def init_func(m):
        classname = m.__class__.__name__
        if "Conv" in classname and getattr(m, "weight", None) is not None:
            if init == "norm":
                nn.init.normal_(m.weight.data, mean=0.0, std=gain)
            elif init == "xavier":
                nn.init.xavier_normal_(m.weight.data, gain=gain)
            else:  # "kaiming" (validated above)
                nn.init.kaiming_normal_(m.weight.data, a=0, mode="fan_in")
            if getattr(m, "bias", None) is not None:
                nn.init.constant_(m.bias.data, 0.0)
        elif "BatchNorm2d" in classname:
            # With affine=False both parameters are None; there is nothing to set.
            if m.weight is not None:
                nn.init.normal_(m.weight.data, 1.0, gain)
            if m.bias is not None:
                nn.init.constant_(m.bias.data, 0.0)

    net.apply(init_func)
    print(f"model initialized with {init} initialization")
    return net

requirements.txt ADDED Viewed

	@@ -0,0 +1,100 @@

+aiofiles==23.1.0
+aiohttp==3.8.4
+aiosignal==1.3.1
+altair==4.2.2
+anyio==3.6.2
+async-timeout==4.0.2
+attrs==23.1.0
+beautifulsoup4==4.12.2
+black==23.3.0
+certifi==2022.12.7
+charset-normalizer==3.1.0
+click==8.1.3
+cmake==3.26.3
+contourpy==1.0.7
+cycler==0.11.0
+entrypoints==0.4
+fastapi==0.95.1
+ffmpy==0.3.0
+filelock==3.11.0
+fonttools==4.39.3
+frozenlist==1.3.3
+fsspec==2023.4.0
+gdown==4.7.1
+gradio==3.27.0
+gradio_client==0.1.3
+h11==0.14.0
+httpcore==0.17.0
+httpx==0.24.0
+huggingface-hub==0.13.4
+idna==3.4
+imageio==2.27.0
+Jinja2==3.1.2
+joblib==1.2.0
+jsonschema==4.17.3
+kiwisolver==1.4.4
+lazy_loader==0.2
+linkify-it-py==2.0.0
+lit==16.0.1
+markdown-it-py==2.2.0
+MarkupSafe==2.1.2
+matplotlib==3.7.1
+mdit-py-plugins==0.3.3
+mdurl==0.1.2
+mpmath==1.3.0
+multidict==6.0.4
+mypy-extensions==1.0.0
+networkx==3.1
+numpy==1.24.2
+nvidia-cublas-cu11==11.10.3.66
+nvidia-cuda-cupti-cu11==11.7.101
+nvidia-cuda-nvrtc-cu11==11.7.99
+nvidia-cuda-runtime-cu11==11.7.99
+nvidia-cudnn-cu11==8.5.0.96
+nvidia-cufft-cu11==10.9.0.58
+nvidia-curand-cu11==10.2.10.91
+nvidia-cusolver-cu11==11.4.0.1
+nvidia-cusparse-cu11==11.7.4.91
+nvidia-nccl-cu11==2.14.3
+nvidia-nvtx-cu11==11.7.91
+orjson==3.8.10
+packaging==23.1
+pandas==2.0.0
+pathspec==0.11.1
+Pillow==9.5.0
+platformdirs==3.2.0
+pydantic==1.10.7
+pydub==0.25.1
+pyparsing==3.0.9
+pyrsistent==0.19.3
+PySocks==1.7.1
+python-dateutil==2.8.2
+python-multipart==0.0.6
+pytz==2023.3
+PyWavelets==1.4.1
+PyYAML==6.0
+requests==2.28.2
+scikit-image==0.20.0
+scikit-learn==1.2.2
+scipy==1.10.1
+semantic-version==2.10.0
+six==1.16.0
+sniffio==1.3.0
+soupsieve==2.4
+starlette==0.26.1
+sympy==1.11.1
+threadpoolctl==3.1.0
+tifffile==2023.4.12
+tomli==2.0.1
+toolz==0.12.0
+torch==2.0.0
+torchvision==0.15.1
+tqdm==4.65.0
+triton==2.0.0
+typing_extensions==4.5.0
+tzdata==2023.3
+uc-micro-py==1.0.1
+urllib3==1.26.15
+uvicorn==0.21.1
+websockets==11.0.1
+yarl==1.8.2

utility/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- from .helper import *


1	+ from .helper import *

utility/helper.py CHANGED Viewed

@@ -19,6 +19,9 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 import requests
 import gdown
 def download_from_drive():
     url = "https://drive.google.com/uc?id=1EhuMET76c02VFyRW8Pie7BwNCDHmQiad"
     try:
@@ -33,15 +36,16 @@ def download_from_drive():
 class AverageMeter:
     def __init__(self):
         self.reset()
     def reset(self):
-        self.count, self.avg, self.sum = [0.] * 3
     def update(self, val, count=1):
         self.count += count
         self.sum += count * val
         self.avg = self.sum / self.count
 def create_loss_meters():
     loss_D_fake = AverageMeter()
     loss_D_real = AverageMeter()
@@ -49,33 +53,38 @@ def create_loss_meters():
     loss_G_GAN = AverageMeter()
     loss_G_L1 = AverageMeter()
     loss_G = AverageMeter()
-    return {'loss_D_fake': loss_D_fake,
-            'loss_D_real': loss_D_real,
-            'loss_D': loss_D,
-            'loss_G_GAN': loss_G_GAN,
-            'loss_G_L1': loss_G_L1,
-            'loss_G': loss_G}
 def update_losses(model, loss_meter_dict, count):
     for loss_name, loss_meter in loss_meter_dict.items():
         loss = getattr(model, loss_name)
         loss_meter.update(loss.item(), count=count)
 def lab_to_rgb(L, ab):
     """
     Takes a batch of images
     """
-    L = (L + 1.) * 50.
-    ab = ab * 110.
     Lab = torch.cat([L, ab], dim=1).permute(0, 2, 3, 1).cpu().numpy()
     rgb_imgs = []
     for img in Lab:
         img_rgb = lab2rgb(img)
         rgb_imgs.append(img_rgb)
     return np.stack(rgb_imgs, axis=0)
 def visualize(model, data, save=True):
     model.net_G.eval()
     with torch.no_grad():
@@ -90,7 +99,7 @@ def visualize(model, data, save=True):
     fig = plt.figure(figsize=(15, 8))
     for i in range(5):
         ax = plt.subplot(3, 5, i + 1)
-        ax.imshow(L[i][0].cpu(), cmap='gray')
         ax.axis("off")
         ax = plt.subplot(3, 5, i + 1 + 5)
         ax.imshow(fake_imgs[i])
@@ -101,11 +110,13 @@ def visualize(model, data, save=True):
     plt.show()
     if save:
         fig.savefig(f"colorization_{time.time()}.png")
 def log_results(loss_meter_dict):
     for loss_name, loss_meter in loss_meter_dict.items():
         print(f"{loss_name}: {loss_meter.avg:.5f}")
 def create_lab_tensors(image):
     """
     This function receives an image path or a direct image input and creates a dictionary of L and ab tensors.
@@ -116,22 +127,28 @@ def create_lab_tensors(image):
     """
     if isinstance(image, str):
         # Open the image and convert it to RGB format
-        img = Image.open(image).convert('RGB')
     else:
-        img = image.convert('RGB')
-    custom_transforms = transforms.Compose([
-                transforms.Resize((SIZE, SIZE),  Image.BICUBIC),
-                transforms.RandomHorizontalFlip(), # A little data augmentation!
-            ])
     img = custom_transforms(img)
     img = np.array(img)
-    img_lab = rgb2lab(img).astype("float32") # Converting RGB to L*a*b
     img_lab = transforms.ToTensor()(img_lab)
-    L = img_lab[[0], ...] / 50. - 1. # Between -1 and 1
-    L = L.unsqueeze(0)
-    ab = img_lab[[1, 2], ...] / 110. # Between -1 and 1
-    return {'L': L, 'ab': ab}
 def predict_and_visualize_single_image(model, data, save=True):
@@ -143,18 +160,19 @@ def predict_and_visualize_single_image(model, data, save=True):
     L = model.L
     fake_imgs = lab_to_rgb(L, fake_color)
     fig, axs = plt.subplots(1, 2, figsize=(8, 4))
-    axs[0].imshow(L[0][0].cpu(), cmap='gray')
     axs[0].set_title("Grey Image")
-    axs[0].axis('off')
     axs[1].imshow(fake_imgs[0])
     axs[1].set_title("Colored Image")
-    axs[1].axis('off')
     plt.show()
     if save:
         fig.savefig(f"colorization_{time.time()}.png")
-def predict_color(model , image , save=False):
     """
     This function receives an image path or a direct image input and creates a dictionary of L and ab tensors.
     Args:
@@ -165,14 +183,30 @@ def predict_color(model , image , save=False):
     predict_and_visualize_single_image(model, data, save)
-def load_model(model_class, file_path):
     """
     Load PyTorch model from file.
     Args:
         model_class (torch.nn.Module): PyTorch model class to load.
         file_path (str): File path to load the model from.
     Returns:
         model (torch.nn.Module): Loaded PyTorch model.
     """

 import requests
 import gdown
+SIZE = 256
 def download_from_drive():
     url = "https://drive.google.com/uc?id=1EhuMET76c02VFyRW8Pie7BwNCDHmQiad"
     try:
 class AverageMeter:
     """Running weighted mean: tracks ``count``, ``sum`` and their ratio ``avg``."""

     def __init__(self):
         self.reset()

     def reset(self):
         """Set ``count``, ``avg`` and ``sum`` back to ``0.0``."""
         self.count = 0.0
         self.avg = 0.0
         self.sum = 0.0

     def update(self, val, count=1):
         """Add ``val`` with weight ``count`` and refresh the running average."""
         weighted = count * val
         self.count += count
         self.sum += weighted
         self.avg = self.sum / self.count
 def create_loss_meters():
     loss_D_fake = AverageMeter()
     loss_D_real = AverageMeter()
     loss_G_GAN = AverageMeter()
     loss_G_L1 = AverageMeter()
     loss_G = AverageMeter()
+    return {
+        "loss_D_fake": loss_D_fake,
+        "loss_D_real": loss_D_real,
+        "loss_D": loss_D,
+        "loss_G_GAN": loss_G_GAN,
+        "loss_G_L1": loss_G_L1,
+        "loss_G": loss_G,
+    }
 def update_losses(model, loss_meter_dict, count):
     """Feed each meter the current value of the same-named attribute on ``model``.

     Args:
         model: Object exposing one attribute per key of ``loss_meter_dict``;
             each attribute must provide ``.item()``.
         loss_meter_dict: Mapping of attribute name to a meter with ``update``.
         count: Weight passed to every ``update`` call.
     """
     for name in loss_meter_dict:
         current = getattr(model, name)
         loss_meter_dict[name].update(current.item(), count=count)
 def lab_to_rgb(L, ab):
     """Convert a batch of normalised L and ab tensors into RGB arrays.

     ``L`` is rescaled with ``(L + 1) * 50`` and ``ab`` with ``ab * 110`` before
     the two are joined on dim 1, moved to channel-last layout and converted
     image by image with ``lab2rgb``.

     Args:
         L: 4-D tensor with the lightness channel on dim 1.
         ab: 4-D tensor with the two colour channels on dim 1.

     Returns:
         A NumPy array stacking the per-image RGB results along axis 0.
     """
     lightness = (L + 1.0) * 50.0
     chroma = ab * 110.0
     lab_batch = torch.cat([lightness, chroma], dim=1)
     lab_batch = lab_batch.permute(0, 2, 3, 1).cpu().numpy()
     return np.stack([lab2rgb(lab_img) for lab_img in lab_batch], axis=0)
 def visualize(model, data, save=True):
     model.net_G.eval()
     with torch.no_grad():
     fig = plt.figure(figsize=(15, 8))
     for i in range(5):
         ax = plt.subplot(3, 5, i + 1)
+        ax.imshow(L[i][0].cpu(), cmap="gray")
         ax.axis("off")
         ax = plt.subplot(3, 5, i + 1 + 5)
         ax.imshow(fake_imgs[i])
     plt.show()
     if save:
         fig.savefig(f"colorization_{time.time()}.png")
 def log_results(loss_meter_dict):
     """Print one ``name: average`` line (five decimals) per meter in the mapping."""
     for name in loss_meter_dict:
         average = loss_meter_dict[name].avg
         print(f"{name}: {average:.5f}")
 def create_lab_tensors(image):
     """Turn one image into the normalised L / ab tensors used by the model.

     Args:
         image: A file path (``str``), a NumPy array (converted with
             ``Image.fromarray``), or an object that already offers
             ``.convert("RGB")`` such as a PIL image.

     Returns:
         dict with two float32 tensors:
             ``"L"``  - lightness scaled by ``/ 50 - 1``, with a leading batch
             dimension added (``1 x 1 x SIZE x SIZE``).
             ``"ab"`` - colour channels scaled by ``/ 110``
             (``2 x SIZE x SIZE``; no batch dimension is added here).
     """
     if isinstance(image, str):
         # Close the file handle as soon as the pixel data has been converted.
         with Image.open(image) as opened:
             img = opened.convert("RGB")
     else:
         if isinstance(image, np.ndarray):
             img = Image.fromarray(image)
         else:
             img = image
         img = img.convert("RGB")
     # Only resize. The previous RandomHorizontalFlip was a training-time
     # augmentation; here it mirrored the caller's image at random, so the
     # same input could come back flipped.
     resize = transforms.Resize((SIZE, SIZE), Image.BICUBIC)
     img = np.array(resize(img))
     img_lab = rgb2lab(img).astype("float32")  # RGB -> L*a*b
     img_lab = transforms.ToTensor()(img_lab)
     L = img_lab[[0], ...] / 50.0 - 1.0  # Between -1 and 1
     L = L.unsqueeze(0)
     ab = img_lab[[1, 2], ...] / 110.0  # Between -1 and 1
     return {"L": L, "ab": ab}
 def predict_and_visualize_single_image(model, data, save=True):
     L = model.L
     fake_imgs = lab_to_rgb(L, fake_color)
     fig, axs = plt.subplots(1, 2, figsize=(8, 4))
+    axs[0].imshow(L[0][0].cpu(), cmap="gray")
     axs[0].set_title("Grey Image")
+    axs[0].axis("off")
     axs[1].imshow(fake_imgs[0])
     axs[1].set_title("Colored Image")
+    axs[1].axis("off")
     plt.show()
     if save:
         fig.savefig(f"colorization_{time.time()}.png")
+def predict_color(model, image, save=False):
     """
     This function receives an image path or a direct image input and creates a dictionary of L and ab tensors.
     Args:
     predict_and_visualize_single_image(model, data, save)
def load_model_with_cpu(model_class, file_path):
    """Instantiate ``model_class`` and fill it from a state dict mapped to the CPU.

    Args:
        model_class: Zero-argument callable returning a ``torch.nn.Module``.
        file_path (str): Location of the saved state dict.

    Returns:
        The newly created model with the stored parameters loaded.
    """
    cpu = torch.device("cpu")
    model = model_class()
    # NOTE(review): torch.load unpickles the file; only use checkpoints from a
    # trusted source.
    state_dict = torch.load(file_path, map_location=cpu)
    model.load_state_dict(state_dict)
    return model
+def load_model_with_gpu(model_class, file_path):
+    """
+    Load PyTorch model from file.
+    Args:
+        model_class (torch.nn.Module): PyTorch model class to load.
+        file_path (str): File path to load the model from.
     Returns:
         model (torch.nn.Module): Loaded PyTorch model.
     """