WSSS_ResNet50 / app.py
kittendev's picture
Update app.py
8274714 verified
raw
history blame
5.94 kB
# Copyright (C) 2020 * Ltd. All rights reserved.
# author : Sanghyeon Jo <[email protected]>
import gradio as gr
import os
import sys
import copy
import shutil
import random
import argparse
import numpy as np
import imageio
import torch
import torch.nn as nn
import torch.nn.functional as F
from torchvision import transforms
from torch.utils.tensorboard import SummaryWriter
from torch.utils.data import DataLoader
from core.puzzle_utils import *
from core.networks import *
from core.datasets import *
from tools.general.io_utils import *
from tools.general.time_utils import *
from tools.general.json_utils import *
from tools.ai.log_utils import *
from tools.ai.demo_utils import *
from tools.ai.optim_utils import *
from tools.ai.torch_utils import *
from tools.ai.evaluate_utils import *
from tools.ai.augment_utils import *
from tools.ai.randaugment import *
parser = argparse.ArgumentParser()
###############################################################################
# Dataset
###############################################################################
parser.add_argument('--seed', default=2606, type=int)
parser.add_argument('--num_workers', default=4, type=int)
parser.add_argument('--data_dir', default='../VOCtrainval_11-May-2012/', type=str)
###############################################################################
# Network
###############################################################################
parser.add_argument('--architecture', default='DeepLabv3+', type=str)
parser.add_argument('--backbone', default='resnet50', type=str)
parser.add_argument('--mode', default='fix', type=str)
parser.add_argument('--use_gn', default=True, type=str2bool)
###############################################################################
# Inference parameters
###############################################################################
parser.add_argument('--tag', default='', type=str)
parser.add_argument('--domain', default='val', type=str)
parser.add_argument('--scales', default='0.5,1.0,1.5,2.0', type=str)
parser.add_argument('--iteration', default=10, type=int)
if __name__ == '__main__':
###################################################################################
# Arguments
###################################################################################
args = parser.parse_args()
model_dir = create_directory('./experiments/models/')
model_path = model_dir + f'DeepLabv3+@ResNet-50@[email protected]'
if 'train' in args.domain:
args.tag += '@train'
else:
args.tag += '@' + args.domain
args.tag += '@scale=%s' % args.scales
args.tag += '@iteration=%d' % args.iteration
set_seed(args.seed)
log_func = lambda string='': print(string)
###################################################################################
# Transform, Dataset, DataLoader
###################################################################################
imagenet_mean = [0.485, 0.456, 0.406]
imagenet_std = [0.229, 0.224, 0.225]
normalize_fn = Normalize(imagenet_mean, imagenet_std)
# for mIoU
meta_dic = read_json('./data/VOC_2012.json')
###################################################################################
# Network
###################################################################################
if args.architecture == 'DeepLabv3+':
model = DeepLabv3_Plus(args.backbone, num_classes=meta_dic['classes'] + 1, mode=args.mode,
use_group_norm=args.use_gn)
elif args.architecture == 'Seg_Model':
model = Seg_Model(args.backbone, num_classes=meta_dic['classes'] + 1)
elif args.architecture == 'CSeg_Model':
model = CSeg_Model(args.backbone, num_classes=meta_dic['classes'] + 1)
model = model.cuda()
model.eval()
log_func('[i] Architecture is {}'.format(args.architecture))
log_func('[i] Total Params: %.2fM' % (calculate_parameters(model)))
log_func()
load_model(model, model_path, parallel=False)
#################################################################################################
# Evaluation
#################################################################################################
eval_timer = Timer()
scales = [float(scale) for scale in args.scales.split(',')]
model.eval()
eval_timer.tik()
def inference(images, image_size):
images = images.cuda()
logits = model(images)
logits = resize_for_tensors(logits, image_size)
logits = logits[0] + logits[1].flip(-1)
logits = get_numpy_from_tensor(logits).transpose((1, 2, 0))
return logits
def predict_image(ori_image):
with torch.no_grad():
ori_w, ori_h = ori_image.size
cams_list = []
for scale in scales:
image = copy.deepcopy(ori_image)
image = image.resize((round(ori_w * scale), round(ori_h * scale)), resample=PIL.Image.BICUBIC)
image = normalize_fn(image)
image = image.transpose((2, 0, 1))
image = torch.from_numpy(image)
flipped_image = image.flip(-1)
images = torch.stack([image, flipped_image])
cams = inference(images, (ori_h, ori_w))
cams_list.append(cams)
preds = np.sum(cams_list, axis=0)
preds = F.softmax(torch.from_numpy(preds), dim=-1).numpy()
if args.iteration > 0:
preds = crf_inference(np.asarray(ori_image), preds.transpose((2, 0, 1)), t=args.iteration)
pred_mask = np.argmax(preds, axis=0)
else:
pred_mask = np.argmax(preds, axis=-1)
return pred_mask.astype(np.uint8)
demo = gr.Interface(
fn=predict_image,
inputs="image",
outputs="image"
)