snehilchatterjee committed
Commit 8a1af8c · verified · 1 Parent(s): c6ea043

Upload 10 files

app.py ADDED
@@ -0,0 +1,401 @@
import warnings

import cv2
import numpy as np
import torch
import torchvision
import gradio as gr
from PIL import Image
from torch import nn
from torchvision import transforms
from torchvision.models import mobilenet_v3_small

device = "cuda" if torch.cuda.is_available() else "cpu"
warnings.filterwarnings("ignore")


def flip_text(x):
    return x[::-1]


def method2_prep(image):
    """Center-crop to 1920x1080, run Canny edge detection, and resize for the classifier."""
    # Named `preprocess` to avoid shadowing the `transforms` module imported above.
    preprocess = torchvision.transforms.Compose([
        torchvision.transforms.Resize((256, 256)),
        torchvision.transforms.CenterCrop((224, 224))
    ])
    t_lower = 50   # lower Canny hysteresis threshold
    t_upper = 150  # upper Canny hysteresis threshold

    height, width = image.shape[:2]

    # Center-crop a 1920x1080 window; clamp the offsets so smaller inputs
    # do not produce negative slice indices.
    x = max(0, (width - 1920) // 2)
    y = max(0, (height - 1080) // 2)
    image = image[y:y + 1080, x:x + 1920]

    # Stack the single-channel edge map into three channels for MobileNet.
    img = torch.from_numpy(cv2.Canny(image, t_lower, t_upper)[np.newaxis, ...])
    img = torch.vstack((img, img, img))

    return preprocess(img.type(torch.float32))


def model2_inf(x):
    """Classify the input as pixelated or not; if pixelated, also super-resolve it."""
    print("Method 2")

    image = method2_prep(x).unsqueeze(dim=0)

    # MobileNetV3-Small backbone with a binary classification head.
    model = mobilenet_v3_small(weights='DEFAULT')
    model.classifier[3] = nn.Linear(in_features=1024, out_features=2, bias=True)

    # map_location lets the checkpoint load on CPU-only machines as well.
    model.load_state_dict(torch.load('./weights/method2(0.960).pt', map_location=device))
    model.eval()  # Set the model to evaluation mode

    with torch.inference_mode():
        model = model.to(device)
        image = image.to(device)
        output = torch.softmax(model(image), dim=1).detach().cpu()
        prediction = torch.argmax(output, dim=1).item()

    del model
    if device == "cuda":
        torch.cuda.empty_cache()

    if prediction == 0:
        return "The image is not pixelated", None
    return "The image is pixelated", translate_image(Image.fromarray(x), False, 'TinySRGAN', 'False')


class _conv(nn.Conv2d):
    def __init__(self, in_channels, out_channels, kernel_size, stride, padding, bias):
        super(_conv, self).__init__(in_channels=in_channels, out_channels=out_channels,
                                    kernel_size=kernel_size, stride=stride,
                                    padding=padding, bias=bias)

        # Initialize weights from N(0, 0.02) and biases to zero.
        self.weight.data = torch.normal(torch.zeros((out_channels, in_channels, kernel_size, kernel_size)), 0.02)
        if bias:
            self.bias.data = torch.zeros((out_channels))

        for p in self.parameters():
            p.requires_grad = True


class conv(nn.Module):
    def __init__(self, in_channel, out_channel, kernel_size, BN=False, act=None, stride=1, bias=True):
        super(conv, self).__init__()
        m = [_conv(in_channels=in_channel, out_channels=out_channel,
                   kernel_size=kernel_size, stride=stride,
                   padding=kernel_size // 2, bias=bias)]

        if BN:
            m.append(nn.BatchNorm2d(num_features=out_channel))

        if act is not None:
            m.append(act)

        self.body = nn.Sequential(*m)

    def forward(self, x):
        return self.body(x)


class ResBlock(nn.Module):
    def __init__(self, channels, kernel_size, act=nn.ReLU(inplace=True), bias=True):
        super(ResBlock, self).__init__()
        m = [
            conv(channels, channels, kernel_size, BN=True, act=act),
            conv(channels, channels, kernel_size, BN=True, act=None),
        ]
        self.body = nn.Sequential(*m)

    def forward(self, x):
        res = self.body(x)
        res += x
        return res


class BasicBlock(nn.Module):
    def __init__(self, in_channels, out_channels, kernel_size, num_res_block, act=nn.ReLU(inplace=True)):
        super(BasicBlock, self).__init__()
        self.conv = conv(in_channels, out_channels, kernel_size, BN=False, act=act)

        m = [ResBlock(out_channels, kernel_size, act) for _ in range(num_res_block)]
        m.append(conv(out_channels, out_channels, kernel_size, BN=True, act=None))
        self.body = nn.Sequential(*m)

    def forward(self, x):
        res = self.conv(x)
        out = self.body(res)
        out += res
        return out


class Upsampler(nn.Module):
    def __init__(self, channel, kernel_size, scale, act=nn.ReLU(inplace=True)):
        super(Upsampler, self).__init__()
        m = [
            conv(channel, channel * scale * scale, kernel_size),
            nn.PixelShuffle(scale),  # rearrange channels into a `scale`-times larger spatial grid
        ]
        if act is not None:
            m.append(act)
        self.body = nn.Sequential(*m)

    def forward(self, x):
        return self.body(x)


class discrim_block(nn.Module):
    def __init__(self, in_feats, out_feats, kernel_size, act=nn.LeakyReLU(inplace=True)):
        super(discrim_block, self).__init__()
        m = [
            conv(in_feats, out_feats, kernel_size, BN=True, act=act),
            conv(out_feats, out_feats, kernel_size, BN=True, act=act, stride=2),
        ]
        self.body = nn.Sequential(*m)

    def forward(self, x):
        return self.body(x)


class TinySRGAN(nn.Module):
    """Compact SRGAN-style 4x super-resolution generator."""

    def __init__(self, img_feat=3, n_feats=32, kernel_size=3, num_block=6, act=nn.PReLU(), scale=4):
        super(TinySRGAN, self).__init__()

        self.conv01 = conv(in_channel=img_feat, out_channel=n_feats, kernel_size=9, BN=False, act=act)

        resblocks = [ResBlock(channels=n_feats, kernel_size=3, act=act) for _ in range(num_block)]
        self.body = nn.Sequential(*resblocks)

        self.conv02 = conv(in_channel=n_feats, out_channel=n_feats, kernel_size=3, BN=True, act=None)

        # 4x upscaling is done as two 2x PixelShuffle stages.
        if scale == 4:
            upsample_blocks = [Upsampler(channel=n_feats, kernel_size=3, scale=2, act=act) for _ in range(2)]
        else:
            upsample_blocks = [Upsampler(channel=n_feats, kernel_size=3, scale=scale, act=act)]

        self.tail = nn.Sequential(*upsample_blocks)

        self.last_conv = conv(in_channel=n_feats, out_channel=img_feat, kernel_size=3, BN=False, act=nn.Tanh())

    def forward(self, x):
        x = self.conv01(x)
        _skip_connection = x

        x = self.body(x)
        x = self.conv02(x)
        feat = x + _skip_connection

        x = self.tail(feat)
        x = self.last_conv(x)

        return x, feat


def build_generator():

    class ResidualBlock(nn.Module):
        """MobileNetV2-style inverted residual block: 1x1 expand, 3x3 depthwise, 1x1 project."""
        def __init__(self, in_channels, out_channels, expansion=6, stride=1, alpha=1.0):
            super(ResidualBlock, self).__init__()
            self.expansion = expansion
            self.stride = stride
            self.in_channels = in_channels
            self.out_channels = int(out_channels * alpha)
            self.pointwise_conv_filters = self._make_divisible(self.out_channels, 8)
            self.conv1 = nn.Conv2d(in_channels, in_channels * expansion, kernel_size=1, stride=1, padding=0, bias=True)
            self.bn1 = nn.BatchNorm2d(in_channels * expansion)
            self.conv2 = nn.Conv2d(in_channels * expansion, in_channels * expansion, kernel_size=3, stride=stride, padding=1, groups=in_channels * expansion, bias=True)
            self.bn2 = nn.BatchNorm2d(in_channels * expansion)
            self.conv3 = nn.Conv2d(in_channels * expansion, self.pointwise_conv_filters, kernel_size=1, stride=1, padding=0, bias=True)
            self.bn3 = nn.BatchNorm2d(self.pointwise_conv_filters)
            self.relu = nn.ReLU(inplace=True)
            self.skip_add = (stride == 1 and in_channels == self.pointwise_conv_filters)

        def forward(self, x):
            identity = x

            out = self.conv1(x)
            out = self.bn1(out)
            out = self.relu(out)

            out = self.conv2(out)
            out = self.bn2(out)
            out = self.relu(out)

            out = self.conv3(out)
            out = self.bn3(out)

            if self.skip_add:
                out = out + identity

            return out

        @staticmethod
        def _make_divisible(v, divisor, min_value=None):
            # Round v to the nearest multiple of divisor, never dropping below 90% of v.
            if min_value is None:
                min_value = divisor
            new_v = max(min_value, int(v + divisor / 2) // divisor * divisor)
            if new_v < 0.9 * v:
                new_v += divisor
            return new_v

    class Generator(nn.Module):
        def __init__(self, in_channels, num_residual_blocks, gf):
            super(Generator, self).__init__()
            self.num_residual_blocks = num_residual_blocks
            self.gf = gf

            self.conv1 = nn.Conv2d(in_channels, gf, kernel_size=3, stride=1, padding=1)
            self.bn1 = nn.BatchNorm2d(gf)
            self.prelu1 = nn.PReLU()

            self.residual_blocks = self.make_layer(ResidualBlock, gf, num_residual_blocks)

            self.conv2 = nn.Conv2d(gf, gf, kernel_size=3, stride=1, padding=1)
            self.bn2 = nn.BatchNorm2d(gf)

            # Two 2x bilinear upsampling stages give a 4x output.
            self.upsample1 = nn.Sequential(
                nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True),
                nn.Conv2d(gf, gf, kernel_size=3, stride=1, padding=1),
                nn.PReLU()
            )

            self.upsample2 = nn.Sequential(
                nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True),
                nn.Conv2d(gf, gf, kernel_size=3, stride=1, padding=1),
                nn.PReLU()
            )

            self.conv3 = nn.Conv2d(gf, 3, kernel_size=3, stride=1, padding=1)
            self.tanh = nn.Tanh()

        def make_layer(self, block, out_channels, blocks):
            layers = []
            for _ in range(blocks):
                layers.append(block(out_channels, out_channels))
            return nn.Sequential(*layers)

        def forward(self, x):
            out1 = self.prelu1(self.bn1(self.conv1(x)))
            out = self.residual_blocks(out1)
            out = self.bn2(self.conv2(out))
            out = out + out1
            out = self.upsample1(out)
            out = self.upsample2(out)
            out = self.tanh(self.conv3(out))
            return out

    return Generator(3, 6, 32)


def numpify(imgs):
    """Convert a batch of CHW tensors to a stacked HWC NumPy array."""
    all_images = []
    for img in imgs:
        # Move to CPU and convert explicitly so np.stack receives plain arrays.
        img = img.permute(1, 2, 0).cpu().numpy()
        all_images.append(img)
    return np.stack(all_images, axis=0)


transform = transforms.Compose([
    transforms.ToTensor()
])


# Function to translate (super-resolve) the image
def translate_image(image, sharpen, model_name, save):
    print('Translating!')

    # Resize the input to a fixed 480px width, preserving aspect ratio.
    desired_width = 480
    original_width, original_height = image.size
    desired_height = int((original_height / original_width) * desired_width)
    resized_image = image.resize((desired_width, desired_height))

    if model_name == 'MobileSR':
        model = build_generator().to(device)
        # map_location lets the checkpoint load on CPU-only machines as well.
        model.load_state_dict(torch.load('./weights/mobile_sr.pt', map_location=device))
        model.eval()

        low_res = transform(resized_image).unsqueeze(dim=0).to(device)
        with torch.no_grad():
            sr = model(low_res)

        fake_imgs = numpify(sr)
        # Generator output is in [-1, 1]; map back to [0, 255].
        sr_img = Image.fromarray((((fake_imgs[0] + 1) / 2) * 255).astype(np.uint8))

    elif model_name == 'MiniSRGAN':
        # NOTE: MiniSRGAN is not defined in this file; this branch assumes it
        # is imported or defined elsewhere.
        model = MiniSRGAN().to(device)
        model.load_state_dict(torch.load('./weights/miniSRGAN.pt', map_location=device))
        model.eval()

        inputs = np.array(resized_image)
        inputs = (inputs / 127.5) - 1.0  # scale to [-1, 1]
        inputs = torch.tensor(inputs.transpose(2, 0, 1).astype(np.float32)).to(device)

        with torch.no_grad():
            output, _ = model(torch.unsqueeze(inputs, dim=0))
        output = output[0].cpu().numpy()
        output = np.clip(output, -1.0, 1.0)
        output = (output + 1.0) / 2.0
        output = output.transpose(1, 2, 0)
        sr_img = Image.fromarray((output * 255.0).astype(np.uint8))

    elif model_name == 'TinySRGAN':
        model = TinySRGAN().to(device)
        model.load_state_dict(torch.load('./weights/tinySRGAN.pt', map_location=device))
        model.eval()

        inputs = np.array(resized_image)
        inputs = (inputs / 127.5) - 1.0  # scale to [-1, 1]
        inputs = torch.tensor(inputs.transpose(2, 0, 1).astype(np.float32)).to(device)

        with torch.no_grad():
            output, _ = model(torch.unsqueeze(inputs, dim=0))
        output = output[0].cpu().numpy()
        output = (output + 1.0) / 2.0
        output = output.transpose(1, 2, 0)
        sr_img = Image.fromarray((output * 255.0).astype(np.uint8))

    if sharpen:
        # Apply a standard 3x3 sharpening kernel via OpenCV.
        sr_img_cv = cv2.cvtColor(np.array(sr_img), cv2.COLOR_RGB2BGR)
        kernel = np.array([[0, -1, 0], [-1, 5, -1], [0, -1, 0]])
        sharpened_sr_img_cv = cv2.filter2D(sr_img_cv, -1, kernel)
        sharpened_sr_img = Image.fromarray(cv2.cvtColor(sharpened_sr_img_cv, cv2.COLOR_BGR2RGB))

        if save == "True":  # `save` is passed as a string flag
            sharpened_sr_img.save('super_resolved_image.png')
        return sharpened_sr_img
    else:
        if save == "True":
            sr_img.save('super_resolved_image.png')
        return sr_img


# Gradio interface
interface = gr.Interface(
    fn=model2_inf,
    inputs=gr.Image(type="numpy"),
    outputs=[gr.Textbox(label="Result"), gr.Image(label="Processed Image")],
    title="Pixelation Detection App",
    description="Upload an image to check if it is pixelated. If the image is pixelated, the processed image will be displayed.",
    allow_flagging='never'
)

# Launch the Gradio app
interface.launch()
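
For reference, a minimal sketch of driving the super-resolution path directly, without the Gradio UI. It assumes the definitions in app.py above are in scope (for example, pasted in place of the launch() call), and 'sample.png' is a hypothetical input file:

# Hypothetical standalone usage of translate_image (not part of app.py).
from PIL import Image

img = Image.open('sample.png').convert('RGB')  # hypothetical input image
sr = translate_image(img, sharpen=False, model_name='TinySRGAN', save='True')
print(sr.size)  # the 480px-wide resized input, upscaled 4x to 1920px wide

Note that `save` is compared against the string "True", so the flag must be passed as a string ('True'/'False'), matching the call in model2_inf.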
requirements.txt ADDED
@@ -0,0 +1,12 @@
gradio==4.32.2
torch==2.1.0
torchvision==0.16.0
pillow==10.0.1
numpy==1.26.0
opencv-python==4.9.0.80
scikit-learn==1.3.2
matplotlib==3.8.2
tqdm==4.66.1
timm==0.9.12
super_image==0.1.7
weights/SRGAN.pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:13f8c4779fb4e0d9b6e56e460fe6df81870ac388e6db20926b2aa9f2fd49bb61
size 6209971
weights/fsrcnn_x4.pth ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c15150d6787d487f38a68e66be5ec8a964182403af494e6a935fa03eeb56a630
size 54998
weights/method1(0.668).pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8df654bb1bb5c4dad3a6aa3251236cf2cf86957b62e3363c66b8e3438a41e70d
size 6214802
weights/method2(0.960).pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:af08d7011d16d43cdf5bacf03dcd12723f26464013571e597a6160dff2081c65
size 6214802
weights/miniSRGAN.pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:36c68e89673cb8858629133f0aa95f21926382cb82d69f19f8b840866226031e
size 3827430
weights/miniSRResNET.pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a00e5ef9b5b029293e1804d358e1697ef81e0a70bb4c52a96274a1498fe8c2a9
size 3828022
weights/mobile_sr.pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:63ccbec678b30e8d1c25523413928dd2d1d9229519ceae107ae9fc80571d89ba
size 556457
weights/tinySRGAN.pt ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8e873fd2427142c84278466802fc250607713c51c2671f289b48a82d1979b59f
size 855730
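
The weight files above are committed as Git LFS pointers (spec version, sha256 oid, byte size) rather than the binaries themselves. A small sketch for sanity-checking a resolved download against its pointer, using the tinySRGAN.pt values shown above:

import hashlib
import os

# Verify a Git-LFS-resolved file against its pointer metadata.
path = 'weights/tinySRGAN.pt'
expected_oid = '8e873fd2427142c84278466802fc250607713c51c2671f289b48a82d1979b59f'
expected_size = 855730

assert os.path.getsize(path) == expected_size, "size mismatch: is this still an LFS pointer?"
with open(path, 'rb') as f:
    digest = hashlib.sha256(f.read()).hexdigest()
assert digest == expected_oid, "sha256 mismatch"
print("weights/tinySRGAN.pt matches its LFS pointer")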