Spaces:

byrkbrk
/

Synthesize-super-resolution-images

Sleeping

App Files Files Community

byrkbrk committed on Aug 14, 2024

Commit

1a548a3

verified ·

1 Parent(s): 3c006e8

Upload 9 files

Browse files

Files changed (9) hide show

app.py +26 -0
low-res-images/building.png +0 -0
low-res-images/penguin.png +0 -0
low-res-images/plant.png +0 -0
low-res-images/vietnam_park.jpg +0 -0
model/eval_seemore_t_x4.yaml +12 -0
model/seemore.py +417 -0
requirements.txt +9 -0
synthesizer.py +100 -0

app.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import os
+import gradio as gr
+from synthesizer import SRSynthesizer
+from gradio_imageslider import ImageSlider
+if __name__ == "__main__":
+    sr_synthesizer = SRSynthesizer(create_dirs=False)
+    gr_interface = gr.Interface(
+        fn=lambda image: sr_synthesizer.synthesize(image,
+                                                   show=False,
+                                                   save=False,
+                                                   return_input=True),
+        inputs=[gr.Image(type="pil", label="Input")],
+        outputs=ImageSlider(type="pil", label="Output", show_download_button=True),
+        title="Super Resolution Image Synthesizer",
+        examples=[
+            [os.path.join(os.path.dirname(__file__), "low-res-images", "building.png")],
+            [os.path.join(os.path.dirname(__file__), "low-res-images", "plant.png")],
+            [os.path.join(os.path.dirname(__file__), "low-res-images", "penguin.png")],
+            [os.path.join(os.path.dirname(__file__), "low-res-images", "vietnam_park.jpg")],
+        ],
+        description="Synthesize (4x-upscaled) super-resolved images"
+    )
+    gr_interface.launch()

low-res-images/building.png ADDED Viewed

low-res-images/penguin.png ADDED Viewed

low-res-images/plant.png ADDED Viewed

low-res-images/vietnam_park.jpg ADDED Viewed

model/eval_seemore_t_x4.yaml ADDED Viewed

	@@ -0,0 +1,12 @@

+# Modified from https://huggingface.co/spaces/eduardzamfir/SeeMoreDetails/blob/main/configs/eval_seemore_t_x4.yml
+# Every key below is passed as a keyword argument to the SeemoRe constructor
+# (model/seemore.py) by SRSynthesizer.instantiate_model (synthesizer.py).
+# Upscaling factor handed to nn.PixelShuffle.
+scale: 4
+# Number of input channels; the output uses the same count.
+in_chans: 3
+# Number of experts built inside every MoE block.
+num_experts: 3
+# Factor the mean-centred input is multiplied by (the output is divided by it).
+img_range: 1.0
+# Number of ResGroup blocks in the model body.
+num_layers: 6
+# Channel width of the feature maps.
+embedding_dim: 36
+# When true, channels are shuffled (groups=2) before the MoE block splits them.
+use_shuffle: True
+# Expert width rule; "exp" gives expert i a low dimension of 2**(i+1).
+lr_space: exp
+# Number of experts selected by the router per input.
+topk: 1
+# How many times the stride-4 aggregation conv is applied in MoEBlock.calibrate.
+recursive: 2
+# Kernel size of the striped convolution in the global (SME) block.
+global_kernel_size: 11

model/seemore.py ADDED Viewed

	@@ -0,0 +1,417 @@

+# Adapted from https://github.com/eduardzamfir/seemoredetails/blob/main/basicsr/archs/seemore_arch.py
+from typing import Tuple, List
+from torch import Tensor
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from einops.layers.torch import Rearrange
+######################
+# Meta Architecture
+######################
+class SeemoRe(nn.Module):
+    def __init__(self,
+                 scale: int = 4,
+                 in_chans: int = 3,
+                 num_experts: int = 6,
+                 num_layers: int = 6,
+                 embedding_dim: int = 64,
+                 img_range: float = 1.0,
+                 use_shuffle: bool = False,
+                 global_kernel_size: int = 11,
+                 recursive: int = 2,
+                 lr_space: int = 1,
+                 topk: int = 2,):
+        super().__init__()
+        self.scale = scale
+        self.num_in_channels = in_chans
+        self.num_out_channels = in_chans
+        self.img_range = img_range
+        rgb_mean = (0.4488, 0.4371, 0.4040)
+        self.mean = torch.Tensor(rgb_mean).view(1, 3, 1, 1)
+        # -- SHALLOW FEATURES --
+        self.conv_1 = nn.Conv2d(self.num_in_channels, embedding_dim, kernel_size=3, padding=1)
+        # -- DEEP FEATURES --
+        self.body = nn.ModuleList(
+            [ResGroup(in_ch=embedding_dim,
+                       num_experts=num_experts,
+                       use_shuffle=use_shuffle,
+                       topk=topk,
+                       lr_space=lr_space,
+                       recursive=recursive,
+                       global_kernel_size=global_kernel_size) for i in range(num_layers)]
+        )
+        # -- UPSCALE --
+        self.norm = LayerNorm(embedding_dim, data_format='channels_first')
+        self.conv_2 = nn.Conv2d(embedding_dim, embedding_dim, kernel_size=3, padding=1)
+        self.upsampler = nn.Sequential(
+            nn.Conv2d(embedding_dim, (scale**2) * self.num_out_channels, kernel_size=3, padding=1),
+            nn.PixelShuffle(scale)
+        )
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        self.mean = self.mean.type_as(x)
+        x = (x - self.mean) * self.img_range
+        # -- SHALLOW FEATURES --
+        x = self.conv_1(x)
+        res = x
+        # -- DEEP FEATURES --
+        for idx, layer in enumerate(self.body):
+            x = layer(x)
+        x = self.norm(x)
+        # -- HR IMAGE RECONSTRUCTION --
+        x = self.conv_2(x) + res
+        x = self.upsampler(x)
+        x = x / self.img_range + self.mean
+        return x
+#############################
+# Components
+#############################
+class ResGroup(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 num_experts: int,
+                 global_kernel_size: int = 11,
+                 lr_space: int = 1,
+                 topk: int = 2,
+                 recursive: int = 2,
+                 use_shuffle: bool = False):
+        super().__init__()
+        self.local_block = RME(in_ch=in_ch,
+                               num_experts=num_experts,
+                               use_shuffle=use_shuffle,
+                               lr_space=lr_space,
+                               topk=topk,
+                               recursive=recursive)
+        self.global_block = SME(in_ch=in_ch,
+                                kernel_size=global_kernel_size)
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        x = self.local_block(x)
+        x = self.global_block(x)
+        return x
+#############################
+# Global Block
+#############################
+class SME(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 kernel_size: int = 11):
+        super().__init__()
+        self.norm_1 = LayerNorm(in_ch, data_format='channels_first')
+        self.block = StripedConvFormer(in_ch=in_ch, kernel_size=kernel_size)
+        self.norm_2 = LayerNorm(in_ch, data_format='channels_first')
+        self.ffn = GatedFFN(in_ch, mlp_ratio=2, kernel_size=3, act_layer=nn.GELU())
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        x = self.block(self.norm_1(x)) + x
+        x = self.ffn(self.norm_2(x)) + x
+        return x
+class StripedConvFormer(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 kernel_size: int):
+        super().__init__()
+        self.in_ch = in_ch
+        self.kernel_size = kernel_size
+        self.padding = kernel_size // 2
+        self.proj = nn.Conv2d(in_ch, in_ch, kernel_size=1, padding=0)
+        self.to_qv = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch * 2, kernel_size=1, padding=0),
+            nn.GELU(),
+        )
+        self.attn = StripedConv2d(in_ch, kernel_size=kernel_size, depthwise=True)
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        q, v = self.to_qv(x).chunk(2, dim=1)
+        q = self.attn(q)
+        x = self.proj(q * v)
+        return x
+#############################
+# Local Blocks
+#############################
+class RME(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 num_experts: int,
+                 topk: int,
+                 lr_space: int = 1,
+                 recursive: int = 2,
+                 use_shuffle: bool = False,):
+        super().__init__()
+        self.norm_1 = LayerNorm(in_ch, data_format='channels_first')
+        self.block = MoEBlock(in_ch=in_ch, num_experts=num_experts, topk=topk, use_shuffle=use_shuffle, recursive=recursive, lr_space=lr_space,)
+        self.norm_2 = LayerNorm(in_ch, data_format='channels_first')
+        self.ffn = GatedFFN(in_ch, mlp_ratio=2, kernel_size=3, act_layer=nn.GELU())
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        x = self.block(self.norm_1(x)) + x
+        x = self.ffn(self.norm_2(x)) + x
+        return x
+#################
+# MoE Layer
+#################
+class MoEBlock(nn.Module):
+    """Mixture-of-experts block working on two halves of an expanded feature map.
+
+    ``conv_1`` doubles the channel count; ``forward`` splits the result into a
+    feature half ``x`` and a calibration half ``k`` and hands both to the
+    ``MoELayer``.
+
+    Args:
+        in_ch: Channel width of the input and output.
+        num_experts: Number of ``Expert`` modules to build.
+        topk: Number of experts the ``MoELayer`` combines per input.
+        use_shuffle: Shuffle channels (groups=2) after ``conv_1``.
+        lr_space: Rule giving expert ``i`` its low dimension:
+            ``"linear"`` -> ``i + 2``, ``"exp"`` -> ``2 ** (i + 1)``,
+            ``"double"`` -> ``2 * i + 2``.
+        recursive: Number of times ``agg_conv`` is applied in ``calibrate``.
+
+    Raises:
+        NotImplementedError: If ``lr_space`` is not one of the three rules.
+    """
+    def __init__(self,
+                 in_ch: int,
+                 num_experts: int,
+                 topk: int,
+                 use_shuffle: bool = False,
+                 lr_space: str = "linear",
+                 recursive: int = 2):
+        super().__init__()
+        self.use_shuffle = use_shuffle
+        self.recursive = recursive
+        # Expands to 2 * in_ch channels; forward() splits them into x and k.
+        self.conv_1 = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch, kernel_size=3, padding=1),
+            nn.GELU(),
+            nn.Conv2d(in_ch, 2*in_ch, kernel_size=1, padding=0)
+        )
+        # Depthwise 4x4 conv with stride 4 and no padding: each application
+        # shrinks both spatial dimensions by a factor of four.
+        self.agg_conv = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch, kernel_size=4, stride=4, groups=in_ch),
+            nn.GELU())
+        # Depthwise 3x3 followed by pointwise 1x1, applied at the reduced size.
+        self.conv = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch, kernel_size=3, stride=1, padding=1, groups=in_ch),
+            nn.Conv2d(in_ch, in_ch, kernel_size=1, padding=0)
+        )
+        self.conv_2 = nn.Sequential(
+            StripedConv2d(in_ch, kernel_size=3, depthwise=True),
+            nn.GELU())
+        # Map the expert index to that expert's low dimension.
+        if lr_space == "linear":
+            grow_func = lambda i: i+2
+        elif lr_space == "exp":
+            grow_func = lambda i: 2**(i+1)
+        elif lr_space == "double":
+            grow_func = lambda i: 2*i+2
+        else:
+            raise NotImplementedError(f"lr_space {lr_space} not implemented")
+        self.moe_layer = MoELayer(
+            experts=[Expert(in_ch=in_ch, low_dim=grow_func(i)) for i in range(num_experts)], # add here multiple of 2 as low_dim
+            gate=Router(in_ch=in_ch, num_experts=num_experts),
+            num_expert=topk,
+        )
+        self.proj = nn.Conv2d(in_ch, in_ch, kernel_size=1, padding=0)
+    def calibrate(self, x: torch.Tensor) -> torch.Tensor:
+        """Add a downsampled-and-restored copy of ``x`` back onto ``x``.
+
+        ``x`` is reduced by ``recursive`` applications of ``agg_conv``, passed
+        through ``conv``, bilinearly resized to the original height and width,
+        and summed with the untouched input.
+        """
+        # NOTE(review): agg_conv has no padding, so this presumably needs at
+        # least 4**recursive pixels per side - confirm against callers.
+        b, c, h, w = x.shape
+        res = x
+        for _ in range(self.recursive):
+            x = self.agg_conv(x)
+        x = self.conv(x)
+        x = F.interpolate(x, size=(h, w), mode="bilinear", align_corners=False)
+        return res + x
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Return the projected mixture-of-experts output for ``x``."""
+        x = self.conv_1(x)
+        if self.use_shuffle:
+            x = channel_shuffle(x, groups=2)
+        # First half is the feature branch, second half the calibration branch.
+        x, k = torch.chunk(x, chunks=2, dim=1)
+        x = self.conv_2(x)
+        k = self.calibrate(k)
+        x = self.moe_layer(x, k)
+        x = self.proj(x)
+        return x
+class MoELayer(nn.Module):
+    def __init__(self, experts: List[nn.Module], gate: nn.Module, num_expert: int = 1):
+        super().__init__()
+        assert len(experts) > 0
+        self.experts = nn.ModuleList(experts)
+        self.gate = gate
+        self.num_expert = num_expert
+    def forward(self, inputs: torch.Tensor, k: torch.Tensor):
+        out = self.gate(inputs)
+        weights = F.softmax(out, dim=1, dtype=torch.float).to(inputs.dtype)
+        topk_weights, topk_experts = torch.topk(weights, self.num_expert)
+        out = inputs.clone()
+        if self.training:
+            exp_weights = torch.zeros_like(weights)
+            exp_weights.scatter_(1, topk_experts, weights.gather(1, topk_experts))
+            for i, expert in enumerate(self.experts):
+                out += expert(inputs, k) * exp_weights[:, i:i+1, None, None]
+        else:
+            selected_experts = [self.experts[i] for i in topk_experts.squeeze(dim=0)]
+            for i, expert in enumerate(selected_experts):
+                out += expert(inputs, k) * topk_weights[:, i:i+1, None, None]
+        return out
+class Expert(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 low_dim: int,):
+        super().__init__()
+        self.conv_1 = nn.Conv2d(in_ch, low_dim, kernel_size=1, padding=0)
+        self.conv_2 = nn.Conv2d(in_ch, low_dim, kernel_size=1, padding=0)
+        self.conv_3 = nn.Conv2d(low_dim, in_ch, kernel_size=1, padding=0)
+    def forward(self, x: torch.Tensor, k: torch.Tensor) -> torch.Tensor:
+        x = self.conv_1(x)
+        x = self.conv_2(k) * x # here no more sigmoid
+        x = self.conv_3(x)
+        return x
+class Router(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 num_experts: int):
+        super().__init__()
+        self.body = nn.Sequential(
+            nn.AdaptiveAvgPool2d(1),
+            Rearrange('b c 1 1 -> b c'),
+            nn.Linear(in_ch, num_experts, bias=False),
+        )
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        return self.body(x)
+#################
+# Utilities
+#################
+class StripedConv2d(nn.Module):
+    def __init__(self,
+                 in_ch: int,
+                 kernel_size: int,
+                 depthwise: bool = False):
+        super().__init__()
+        self.in_ch = in_ch
+        self.kernel_size = kernel_size
+        self.padding = kernel_size // 2
+        self.conv = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch, kernel_size=(1, self.kernel_size), padding=(0, self.padding), groups=in_ch if depthwise else 1),
+            nn.Conv2d(in_ch, in_ch, kernel_size=(self.kernel_size, 1), padding=(self.padding, 0), groups=in_ch if depthwise else 1),
+        )
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        return self.conv(x)
+def channel_shuffle(x, groups=2):
+    bat_size, channels, w, h = x.shape
+    group_c = channels // groups
+    x = x.view(bat_size, groups, group_c, w, h)
+    x = torch.transpose(x, 1, 2).contiguous()
+    x = x.view(bat_size, -1, w, h)
+    return x
+class GatedFFN(nn.Module):
+    def __init__(self,
+                 in_ch,
+                 mlp_ratio,
+                 kernel_size,
+                 act_layer,):
+        super().__init__()
+        mlp_ch = in_ch * mlp_ratio
+        self.fn_1 = nn.Sequential(
+            nn.Conv2d(in_ch, mlp_ch, kernel_size=1, padding=0),
+            act_layer,
+        )
+        self.fn_2 = nn.Sequential(
+            nn.Conv2d(in_ch, in_ch, kernel_size=1, padding=0),
+            act_layer,
+        )
+        self.gate = nn.Conv2d(mlp_ch // 2, mlp_ch // 2,
+                              kernel_size=kernel_size, padding=kernel_size // 2, groups=mlp_ch // 2)
+    def feat_decompose(self, x):
+        s = x - self.gate(x)
+        x = x + self.sigma * s
+        return x
+    def forward(self, x: torch.Tensor):
+        x = self.fn_1(x)
+        x, gate = torch.chunk(x, 2, dim=1)
+        gate = self.gate(gate)
+        x = x * gate
+        x = self.fn_2(x)
+        return x
+class LayerNorm(nn.Module):
+    r""" LayerNorm that supports two data formats: channels_last (default) or channels_first.
+    The ordering of the dimensions in the inputs. channels_last corresponds to inputs with
+    shape (batch_size, height, width, channels) while channels_first corresponds to inputs
+    with shape (batch_size, channels, height, width).
+    """
+    def __init__(self, normalized_shape, eps=1e-6, data_format="channels_last"):
+        super().__init__()
+        self.weight = nn.Parameter(torch.ones(normalized_shape))
+        self.bias = nn.Parameter(torch.zeros(normalized_shape))
+        self.eps = eps
+        self.data_format = data_format
+        if self.data_format not in ["channels_last", "channels_first"]:
+            raise NotImplementedError
+        self.normalized_shape = (normalized_shape, )
+    def forward(self, x):
+        if self.data_format == "channels_last":
+            return F.layer_norm(x, self.normalized_shape, self.weight, self.bias, self.eps)
+        elif self.data_format == "channels_first":
+            u = x.mean(1, keepdim=True)
+            s = (x - u).pow(2).mean(1, keepdim=True)
+            x = (x - u) / torch.sqrt(s + self.eps)
+            x = self.weight[:, None, None] * x + self.bias[:, None, None]
+            return x

requirements.txt ADDED Viewed

	@@ -0,0 +1,9 @@

+torch
+numpy
+torchvision
+einops
+gradio
+huggingface-hub
+pillow
+PyYAML
+gradio_imageslider

synthesizer.py ADDED Viewed

	@@ -0,0 +1,100 @@

+import os
+import yaml
+import torch
+from torchvision import transforms
+from PIL import Image
+from model.seemore import SeemoRe
+from huggingface_hub import hf_hub_download
+class SRSynthesizer(object):
+    repo_id = "eduardzamfir/SeemoRe-T"
+    checkpoint_name = "SeemoRe_T_X4.pth"
+    model_config_name = "eval_seemore_t_x4.yaml"
+    def __init__(self,
+                 device: str = None,
+                 create_dirs: bool = True):
+        self.module_dir = os.path.dirname(__file__)
+        self.device = self.initialize_device(device)
+        self.download_model_checkpoint(self.__class__.repo_id,
+                                       self.__class__.checkpoint_name)
+        self.model = self.instantiate_model(self.__class__.checkpoint_name,
+                                            self.__class__.model_config_name,
+                                            self.device)
+        if create_dirs: self.create_dirs(self.module_dir)
+    @torch.inference_mode()
+    def synthesize(self, image, show=True, save=True, return_input=False):
+        """Returns synthesized image for given image"""
+        if isinstance(image, str):
+            synthesized_image_name = image
+            image = self.read_image(self.module_dir, "low-res-images", image)
+        else:
+            synthesized_image_name = "synthesized_image.png"
+        synthesized_image = self.model(transforms.ToTensor()(image).to(self.device))
+        synthesized_image = transforms.Compose([lambda x: torch.clamp(x, 0, 1),
+                                                transforms.ToPILImage()])(synthesized_image.squeeze().cpu())
+        if show:
+            image.show()
+            synthesized_image.show()
+        if save:
+            synthesized_image.save(os.path.join(self.module_dir,
+                                                "synthesized-images",
+                                                synthesized_image_name))
+        if return_input:
+            return image, synthesized_image
+        return synthesized_image
+    def instantiate_model(self, checkpoint_name, model_config_name, device):
+        """Returns instantiated model for given arguments"""
+        model = SeemoRe(**self.read_model_config_file(model_config_name)).to(device)
+        model.load_state_dict(self.load_checkpoint(checkpoint_name, device))
+        return model
+    def read_model_config_file(self, config_name):
+        """Returns read yaml file for given config name"""
+        root = self.module_dir
+        base_folder = "model"
+        with open(os.path.join(root, base_folder, config_name), "r") as file:
+            return yaml.safe_load(file)
+    def load_checkpoint(self, checkpoint_name, device):
+        """Loads the checkpoint from memory for given checkpoint name"""
+        root = self.module_dir
+        base_folder = "model"
+        checkpoint = torch.load(os.path.join(root, base_folder, checkpoint_name),
+                                weights_only=True,
+                                map_location=device)
+        return checkpoint["params"]
+    def download_model_checkpoint(self, repo_id, checkpoint_name, location=None):
+        """Downloads the model checkpoint from huggingface to given location"""
+        if location is None:
+            location = os.path.join(self.module_dir, "model")
+        hf_hub_download(repo_id=repo_id,
+                        filename=checkpoint_name,
+                        local_dir=location)
+    def initialize_device(self, device: str):
+        """Returns device based on GPU availability"""
+        if device is None:
+            if torch.cuda.is_available():
+                device = "cuda"
+            elif torch.backends.mps.is_available():
+                device = "mps"
+            else:
+                device = "cpu"
+        return torch.device(device)
+    def read_image(self, root, base_folder, image_name):
+        """Returns opened image file for given image name"""
+        return Image.open(os.path.join(root, base_folder, image_name))
+    def create_dirs(self, root: str) -> None:
+        """Creates required directories during inference under root"""
+        dir_names = ["low-res-images", "synthesized-images"]
+        for dir_name in dir_names:
+            os.makedirs(os.path.join(root, dir_name), exist_ok=True)