test3

Running on Zero

App Files Files Community

mikitona commited on Nov 11, 2024

Commit

595ed80

verified ·

1 Parent(s): 1230d92

Update SUPIR/util.py

Browse files

Files changed (1) hide show

SUPIR/util.py +224 -179

SUPIR/util.py CHANGED Viewed

@@ -1,179 +1,224 @@
-import os
-import torch
-import numpy as np
-import cv2
-from PIL import Image
-from torch.nn.functional import interpolate
-from omegaconf import OmegaConf
-from sgm.util import instantiate_from_config
-def get_state_dict(d):
-    return d.get('state_dict', d)
-def load_state_dict(ckpt_path, location='cpu'):
-    _, extension = os.path.splitext(ckpt_path)
-    if extension.lower() == ".safetensors":
-        import safetensors.torch
-        state_dict = safetensors.torch.load_file(ckpt_path, device=location)
-    else:
-        state_dict = get_state_dict(torch.load(ckpt_path, map_location=torch.device(location)))
-    state_dict = get_state_dict(state_dict)
-    print(f'Loaded state_dict from [{ckpt_path}]')
-    return state_dict
-def create_model(config_path):
-    config = OmegaConf.load(config_path)
-    model = instantiate_from_config(config.model).cpu()
-    print(f'Loaded model config from [{config_path}]')
-    return model
-def create_SUPIR_model(config_path, SUPIR_sign=None, load_default_setting=False):
-    config = OmegaConf.load(config_path)
-    model = instantiate_from_config(config.model).cpu()
-    print(f'Loaded model config from [{config_path}]')
-    if config.SDXL_CKPT is not None:
-        model.load_state_dict(load_state_dict(config.SDXL_CKPT), strict=False)
-    if config.SUPIR_CKPT is not None:
-        model.load_state_dict(load_state_dict(config.SUPIR_CKPT), strict=False)
-    if SUPIR_sign is not None:
-        assert SUPIR_sign in ['F', 'Q']
-        if SUPIR_sign == 'F':
-            model.load_state_dict(load_state_dict(config.SUPIR_CKPT_F), strict=False)
-        elif SUPIR_sign == 'Q':
-            model.load_state_dict(load_state_dict(config.SUPIR_CKPT_Q), strict=False)
-    if load_default_setting:
-        default_setting = config.default_setting
-        return model, default_setting
-    return model
-def load_QF_ckpt(config_path):
-    config = OmegaConf.load(config_path)
-    ckpt_F = torch.load(config.SUPIR_CKPT_F, map_location='cpu')
-    ckpt_Q = torch.load(config.SUPIR_CKPT_Q, map_location='cpu')
-    return ckpt_Q, ckpt_F
-def PIL2Tensor(img, upsacle=1, min_size=1024, fix_resize=None):
-    '''
-    PIL.Image -> Tensor[C, H, W], RGB, [-1, 1]
-    '''
-    # size
-    w, h = img.size
-    w *= upsacle
-    h *= upsacle
-    w0, h0 = round(w), round(h)
-    if min(w, h) < min_size:
-        _upsacle = min_size / min(w, h)
-        w *= _upsacle
-        h *= _upsacle
-    if fix_resize is not None:
-        _upsacle = fix_resize / min(w, h)
-        w *= _upsacle
-        h *= _upsacle
-        w0, h0 = round(w), round(h)
-    w = int(np.round(w / 64.0)) * 64
-    h = int(np.round(h / 64.0)) * 64
-    x = img.resize((w, h), Image.BICUBIC)
-    x = np.array(x).round().clip(0, 255).astype(np.uint8)
-    x = x / 255 * 2 - 1
-    x = torch.tensor(x, dtype=torch.float32).permute(2, 0, 1)
-    return x, h0, w0
-def Tensor2PIL(x, h0, w0):
-    '''
-    Tensor[C, H, W], RGB, [-1, 1] -> PIL.Image
-    '''
-    x = x.unsqueeze(0)
-    x = interpolate(x, size=(h0, w0), mode='bicubic')
-    x = (x.squeeze(0).permute(1, 2, 0) * 127.5 + 127.5).cpu().numpy().clip(0, 255).astype(np.uint8)
-    return Image.fromarray(x)
-def HWC3(x):
-    assert x.dtype == np.uint8
-    if x.ndim == 2:
-        x = x[:, :, None]
-    assert x.ndim == 3
-    H, W, C = x.shape
-    assert C == 1 or C == 3 or C == 4
-    if C == 3:
-        return x
-    if C == 1:
-        return np.concatenate([x, x, x], axis=2)
-    if C == 4:
-        color = x[:, :, 0:3].astype(np.float32)
-        alpha = x[:, :, 3:4].astype(np.float32) / 255.0
-        y = color * alpha + 255.0 * (1.0 - alpha)
-        y = y.clip(0, 255).astype(np.uint8)
-        return y
-def upscale_image(input_image, upscale, min_size=None, unit_resolution=64):
-    H, W, C = input_image.shape
-    H = float(H)
-    W = float(W)
-    H *= upscale
-    W *= upscale
-    if min_size is not None:
-        if min(H, W) < min_size:
-            _upsacle = min_size / min(W, H)
-            W *= _upsacle
-            H *= _upsacle
-    H = int(np.round(H / unit_resolution)) * unit_resolution
-    W = int(np.round(W / unit_resolution)) * unit_resolution
-    img = cv2.resize(input_image, (W, H), interpolation=cv2.INTER_LANCZOS4 if upscale > 1 else cv2.INTER_AREA)
-    img = img.round().clip(0, 255).astype(np.uint8)
-    return img
-def fix_resize(input_image, size=512, unit_resolution=64):
-    H, W, C = input_image.shape
-    H = float(H)
-    W = float(W)
-    upscale = size / min(H, W)
-    H *= upscale
-    W *= upscale
-    H = int(np.round(H / unit_resolution)) * unit_resolution
-    W = int(np.round(W / unit_resolution)) * unit_resolution
-    img = cv2.resize(input_image, (W, H), interpolation=cv2.INTER_LANCZOS4 if upscale > 1 else cv2.INTER_AREA)
-    img = img.round().clip(0, 255).astype(np.uint8)
-    return img
-def Numpy2Tensor(img):
-    '''
-    np.array[H, w, C] [0, 255] -> Tensor[C, H, W], RGB, [-1, 1]
-    '''
-    # size
-    img = np.array(img) / 255 * 2 - 1
-    img = torch.tensor(img, dtype=torch.float32).permute(2, 0, 1)
-    return img
-def Tensor2Numpy(x, h0=None, w0=None):
-    '''
-    Tensor[C, H, W], RGB, [-1, 1] -> PIL.Image
-    '''
-    if h0 is not None and w0 is not None:
-        x = x.unsqueeze(0)
-        x = interpolate(x, size=(h0, w0), mode='bicubic')
-        x = x.squeeze(0)
-    x = (x.permute(1, 2, 0) * 127.5 + 127.5).cpu().numpy().clip(0, 255).astype(np.uint8)
-    return x
-def convert_dtype(dtype_str):
-    if dtype_str == 'fp32':
-        return torch.float32
-    elif dtype_str == 'fp16':
-        return torch.float16
-    elif dtype_str == 'bf16':
-        return torch.bfloat16
-    else:
-        raise NotImplementedError

+import os
+import torch
+import numpy as np
+import cv2
+from PIL import Image
+from torch.nn.functional import interpolate
+from omegaconf import OmegaConf
+from sgm.util import instantiate_from_config
+from huggingface_hub import hf_hub_download
+def get_state_dict(d):
+    return d.get('state_dict', d)
+def load_state_dict(ckpt_path, location='cpu'):
+    _, extension = os.path.splitext(ckpt_path)
+    # Hugging Faceのリポジトリからロードするかチェック
+    if '/' in ckpt_path:  # リポジトリ形式のパスと判断
+        parts = ckpt_path.split('/')
+        if len(parts) == 3:
+            repo_id = f"{parts[0]}/{parts[1]}"
+            filename = parts[2]
+            # ダウンロードの前にログを出力
+            print(f"Attempting to download from Hugging Face Hub with repo_id: {repo_id} and filename: {filename}")
+            ckpt_path = hf_hub_download(repo_id=repo_id, filename=filename)
+            # ダウンロード後に実際のファイルパスを確認するためのログを出力
+            print(f"Downloaded file path for {filename}: {ckpt_path}")
+        else:
+            raise ValueError("Invalid format for Hugging Face path. Expected format 'username/repo/filename'.")
+    # safetensors形式でのロード
+    if extension.lower() == ".safetensors":
+        import safetensors.torch
+        state_dict = safetensors.torch.load_file(ckpt_path, device=location)
+    else:
+        state_dict = get_state_dict(torch.load(ckpt_path, map_location=torch.device(location)))
+    print(f'Loaded state_dict from [{ckpt_path}]')
+    return state_dict
+def create_model(config_path):
+    config = OmegaConf.load(config_path)
+    model = instantiate_from_config(config.model).cpu()
+    print(f'Loaded model config from [{config_path}]')
+    return model
+def create_SUPIR_model(config_path, SUPIR_sign=None, load_default_setting=False):
+    config = OmegaConf.load(config_path)
+    model = instantiate_from_config(config.model).cpu()
+    print(f'Loaded model config from [{config_path}]')
+    if config.SDXL_CKPT is not None:
+        model.load_state_dict(load_state_dict(config.SDXL_CKPT), strict=False)
+    if config.SUPIR_CKPT is not None:
+        model.load_state_dict(load_state_dict(config.SUPIR_CKPT), strict=False)
+    if SUPIR_sign is not None:
+        assert SUPIR_sign in ['F', 'Q']
+        if SUPIR_sign == 'F':
+            model.load_state_dict(load_state_dict(config.SUPIR_CKPT_F), strict=False)
+        elif SUPIR_sign == 'Q':
+            model.load_state_dict(load_state_dict(config.SUPIR_CKPT_Q), strict=False)
+    if load_default_setting:
+        default_setting = config.default_setting
+        return model, default_setting
+    return model
+def load_QF_ckpt(config_path):
+    config = OmegaConf.load(config_path)
+    # SUPIR_CKPT_F のダウンロード
+    if '/' in config.SUPIR_CKPT_F:
+        parts = config.SUPIR_CKPT_F.split('/')
+        if len(parts) == 3:
+            repo_id = f"{parts[0]}/{parts[1]}"
+            filename = parts[2]
+            print(f"Attempting to download SUPIR_CKPT_F from repo_id: {repo_id} and filename: {filename}")
+            ckpt_F_path = hf_hub_download(repo_id=repo_id, filename=filename)
+            print(f"Downloaded SUPIR_CKPT_F to: {ckpt_F_path}")
+        else:
+            raise ValueError("Invalid format for SUPIR_CKPT_F. Expected format 'username/repo/filename'.")
+    else:
+        ckpt_F_path = config.SUPIR_CKPT_F  # ローカルパスの場合
+    # SUPIR_CKPT_Q のダウンロード
+    if '/' in config.SUPIR_CKPT_Q:
+        parts = config.SUPIR_CKPT_Q.split('/')
+        if len(parts) == 3:
+            repo_id = f"{parts[0]}/{parts[1]}"
+            filename = parts[2]
+            print(f"Attempting to download SUPIR_CKPT_Q from repo_id: {repo_id} and filename: {filename}")
+            ckpt_Q_path = hf_hub_download(repo_id=repo_id, filename=filename)
+            print(f"Downloaded SUPIR_CKPT_Q to: {ckpt_Q_path}")
+        else:
+            raise ValueError("Invalid format for SUPIR_CKPT_Q. Expected format 'username/repo/filename'.")
+    else:
+        ckpt_Q_path = config.SUPIR_CKPT_Q  # ローカルパスの場合
+    # ダウンロードしたパスからロード
+    ckpt_F = torch.load(ckpt_F_path, map_location='cpu')
+    ckpt_Q = torch.load(ckpt_Q_path, map_location='cpu')
+    return ckpt_Q, ckpt_F
+def PIL2Tensor(img, upsacle=1, min_size=1024, fix_resize=None):
+    '''
+    PIL.Image -> Tensor[C, H, W], RGB, [-1, 1]
+    '''
+    # size
+    w, h = img.size
+    w *= upsacle
+    h *= upsacle
+    w0, h0 = round(w), round(h)
+    if min(w, h) < min_size:
+        _upsacle = min_size / min(w, h)
+        w *= _upsacle
+        h *= _upsacle
+    if fix_resize is not None:
+        _upsacle = fix_resize / min(w, h)
+        w *= _upsacle
+        h *= _upsacle
+        w0, h0 = round(w), round(h)
+    w = int(np.round(w / 64.0)) * 64
+    h = int(np.round(h / 64.0)) * 64
+    x = img.resize((w, h), Image.BICUBIC)
+    x = np.array(x).round().clip(0, 255).astype(np.uint8)
+    x = x / 255 * 2 - 1
+    x = torch.tensor(x, dtype=torch.float32).permute(2, 0, 1)
+    return x, h0, w0
+def Tensor2PIL(x, h0, w0):
+    '''
+    Tensor[C, H, W], RGB, [-1, 1] -> PIL.Image
+    '''
+    x = x.unsqueeze(0)
+    x = interpolate(x, size=(h0, w0), mode='bicubic')
+    x = (x.squeeze(0).permute(1, 2, 0) * 127.5 + 127.5).cpu().numpy().clip(0, 255).astype(np.uint8)
+    return Image.fromarray(x)
+def HWC3(x):
+    assert x.dtype == np.uint8
+    if x.ndim == 2:
+        x = x[:, :, None]
+    assert x.ndim == 3
+    H, W, C = x.shape
+    assert C == 1 or C == 3 or C == 4
+    if C == 3:
+        return x
+    if C == 1:
+        return np.concatenate([x, x, x], axis=2)
+    if C == 4:
+        color = x[:, :, 0:3].astype(np.float32)
+        alpha = x[:, :, 3:4].astype(np.float32) / 255.0
+        y = color * alpha + 255.0 * (1.0 - alpha)
+        y = y.clip(0, 255).astype(np.uint8)
+        return y
+def upscale_image(input_image, upscale, min_size=None, unit_resolution=64):
+    H, W, C = input_image.shape
+    H = float(H)
+    W = float(W)
+    H *= upscale
+    W *= upscale
+    if min_size is not None:
+        if min(H, W) < min_size:
+            _upsacle = min_size / min(W, H)
+            W *= _upsacle
+            H *= _upsacle
+    H = int(np.round(H / unit_resolution)) * unit_resolution
+    W = int(np.round(W / unit_resolution)) * unit_resolution
+    img = cv2.resize(input_image, (W, H), interpolation=cv2.INTER_LANCZOS4 if upscale > 1 else cv2.INTER_AREA)
+    img = img.round().clip(0, 255).astype(np.uint8)
+    return img
+def fix_resize(input_image, size=512, unit_resolution=64):
+    H, W, C = input_image.shape
+    H = float(H)
+    W = float(W)
+    upscale = size / min(H, W)
+    H *= upscale
+    W *= upscale
+    H = int(np.round(H / unit_resolution)) * unit_resolution
+    W = int(np.round(W / unit_resolution)) * unit_resolution
+    img = cv2.resize(input_image, (W, H), interpolation=cv2.INTER_LANCZOS4 if upscale > 1 else cv2.INTER_AREA)
+    img = img.round().clip(0, 255).astype(np.uint8)
+    return img
+def Numpy2Tensor(img):
+    '''
+    np.array[H, w, C] [0, 255] -> Tensor[C, H, W], RGB, [-1, 1]
+    '''
+    # size
+    img = np.array(img) / 255 * 2 - 1
+    img = torch.tensor(img, dtype=torch.float32).permute(2, 0, 1)
+    return img
+def Tensor2Numpy(x, h0=None, w0=None):
+    '''
+    Tensor[C, H, W], RGB, [-1, 1] -> PIL.Image
+    '''
+    if h0 is not None and w0 is not None:
+        x = x.unsqueeze(0)
+        x = interpolate(x, size=(h0, w0), mode='bicubic')
+        x = x.squeeze(0)
+    x = (x.permute(1, 2, 0) * 127.5 + 127.5).cpu().numpy().clip(0, 255).astype(np.uint8)
+    return x
+def convert_dtype(dtype_str):
+    if dtype_str == 'fp32':
+        return torch.float32
+    elif dtype_str == 'fp16':
+        return torch.float16
+    elif dtype_str == 'bf16':
+        return torch.bfloat16
+    else:
+        raise NotImplementedError